zhiyang1 committed on Jul 27

Commit

29975e8

verified ·

1 Parent(s): f3e1f63

Upload folder using huggingface_hub

Browse files

Files changed (26) hide show

checkpoint-38000/config.json +79 -0
checkpoint-38000/generation_config.json +6 -0
checkpoint-38000/model-00001-of-00002.safetensors +3 -0
checkpoint-38000/model-00002-of-00002.safetensors +3 -0
checkpoint-38000/model.safetensors.index.json +0 -0
checkpoint-38000/optimizer.pt +3 -0
checkpoint-38000/rng_state_0.pth +3 -0
checkpoint-38000/rng_state_1.pth +3 -0
checkpoint-38000/rng_state_2.pth +3 -0
checkpoint-38000/rng_state_3.pth +3 -0
checkpoint-38000/scheduler.pt +3 -0
checkpoint-38000/trainer_state.json +0 -0
checkpoint-38000/training_args.bin +3 -0
checkpoint-40000/config.json +79 -0
checkpoint-40000/generation_config.json +6 -0
checkpoint-40000/model-00001-of-00002.safetensors +3 -0
checkpoint-40000/model-00002-of-00002.safetensors +3 -0
checkpoint-40000/model.safetensors.index.json +0 -0
checkpoint-40000/optimizer.pt +3 -0
checkpoint-40000/rng_state_0.pth +3 -0
checkpoint-40000/rng_state_1.pth +3 -0
checkpoint-40000/rng_state_2.pth +3 -0
checkpoint-40000/rng_state_3.pth +3 -0
checkpoint-40000/scheduler.pt +3 -0
checkpoint-40000/trainer_state.json +0 -0
checkpoint-40000/training_args.bin +3 -0

checkpoint-38000/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "ar_steps": 1,
+  "architectures": [
+    "DiffVLMDiffusion"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "condition_layer": -1,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "image_token_id": 151655,
+  "img_cross_attention_dim": 2048,
+  "img_diffuser_depth": 1,
+  "img_ffn_dim_multiplier": null,
+  "img_hidden_size": 1536,
+  "img_multiple_of": 256,
+  "img_norm_eps": 1e-05,
+  "img_num_attention_heads": 12,
+  "img_num_kv_heads": 12,
+  "img_qk_norm": true,
+  "in_channels": 32,
+  "initializer_range": 0.02,
+  "inject_img_diffuser": false,
+  "input_size": 32,
+  "intermediate_size": 8960,
+  "layer_group_size": 7,
+  "layerwise_start_idx": 0,
+  "lora_alpha": 16,
+  "lora_bias": "none",
+  "lora_dropout": 0.05,
+  "lora_enable": false,
+  "lora_r": 64,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2_vl",
+  "non_linearity": 1,
+  "norm_elementwise_affine": true,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "patch_size": 1,
+  "repa_coeff": 0.5,
+  "repa_layers": null,
+  "repa_shared": false,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": {
+    "mrope_section": [
+      16,
+      24,
+      24
+    ],
+    "rope_type": "default",
+    "type": "default"
+  },
+  "rope_theta": 1000000.0,
+  "sample_size": 128,
+  "sampling_steps": 28,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "use_repa": false,
+  "use_residual_attn": true,
+  "use_sliding_window": false,
+  "vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
+  "video_token_id": 151656,
+  "vision_config": {
+    "hidden_size": 1536,
+    "in_chans": 3,
+    "model_type": "qwen2_vl",
+    "spatial_patch_size": 14
+  },
+  "vision_end_token_id": 151653,
+  "vision_start_token_id": 151652,
+  "vision_token_id": 151654,
+  "vocab_size": 151936
+}

checkpoint-38000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "transformers_version": "4.47.0"
+}

checkpoint-38000/model-00001-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:dbb81d846ac864dd378b8a6a64144c123e160fa935577480bc902aaeaee7aec0
+size 4974360904

checkpoint-38000/model-00002-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b9ca2dd3d9cda303fefebf06e45bebeee72618f41f33439439ef7f5b20047a15
+size 3234250886

checkpoint-38000/model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-38000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d08c8ab7b0ae86164a5af3aada9fd41157543c8e8eafcd33018ab53889830957
+size 7455061885

checkpoint-38000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:60f0d6503f62ccdf31b06090d38b410356f491999e30ebaa4d50263817fd6248
+size 15024

checkpoint-38000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:cd7e64b2fa64eefe739fc7ed7b50901fda06959dd050983e1363bf61a7e95420
+size 15024

checkpoint-38000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:60c721a8d8da920188a14c9372c04d9ba9bf036bba96d9e53e721d11436e0d40
+size 15024

checkpoint-38000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a2254c4824f10888c17c54bd15efb33e13b814b26c4e2b743789e0a86cb0359
+size 15024

checkpoint-38000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f7b987c90811de117ba5bf2f292e72dca849fcd63c0aaf7fff0a35abb1ab8e4c
+size 1064

checkpoint-38000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-38000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66b2766db25b9b8bf494151fa7b3f46947dd1e41dc8576a87992122e6043123d
+size 6008

checkpoint-40000/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "ar_steps": 1,
+  "architectures": [
+    "DiffVLMDiffusion"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "condition_layer": -1,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "image_token_id": 151655,
+  "img_cross_attention_dim": 2048,
+  "img_diffuser_depth": 1,
+  "img_ffn_dim_multiplier": null,
+  "img_hidden_size": 1536,
+  "img_multiple_of": 256,
+  "img_norm_eps": 1e-05,
+  "img_num_attention_heads": 12,
+  "img_num_kv_heads": 12,
+  "img_qk_norm": true,
+  "in_channels": 32,
+  "initializer_range": 0.02,
+  "inject_img_diffuser": false,
+  "input_size": 32,
+  "intermediate_size": 8960,
+  "layer_group_size": 7,
+  "layerwise_start_idx": 0,
+  "lora_alpha": 16,
+  "lora_bias": "none",
+  "lora_dropout": 0.05,
+  "lora_enable": false,
+  "lora_r": 64,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2_vl",
+  "non_linearity": 1,
+  "norm_elementwise_affine": true,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "patch_size": 1,
+  "repa_coeff": 0.5,
+  "repa_layers": null,
+  "repa_shared": false,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": {
+    "mrope_section": [
+      16,
+      24,
+      24
+    ],
+    "rope_type": "default",
+    "type": "default"
+  },
+  "rope_theta": 1000000.0,
+  "sample_size": 128,
+  "sampling_steps": 28,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "use_repa": false,
+  "use_residual_attn": true,
+  "use_sliding_window": false,
+  "vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
+  "video_token_id": 151656,
+  "vision_config": {
+    "hidden_size": 1536,
+    "in_chans": 3,
+    "model_type": "qwen2_vl",
+    "spatial_patch_size": 14
+  },
+  "vision_end_token_id": 151653,
+  "vision_start_token_id": 151652,
+  "vision_token_id": 151654,
+  "vocab_size": 151936
+}

checkpoint-40000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "transformers_version": "4.47.0"
+}

checkpoint-40000/model-00001-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:13b49549995af6d9c8279764d2578fb056f2231e52ba1582f61cfb0767f354c2
+size 4974360904

checkpoint-40000/model-00002-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0168f758953f199e38ce7ecaa66beddc6661b6cc4ae1ed507d21750e7d24d620
+size 3234250886

checkpoint-40000/model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-40000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1cbac46f291c06cfbc64d703fea049a90d3875a9f74a805f05b31a33c4fba48f
+size 7455061885

checkpoint-40000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a56383f4f2e8b022d47f7e0995963d51bc093a55e5158368fb7ac4fb6dec31a7
+size 15024

checkpoint-40000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9594ccddf4177429832197c78503d5a7ddb51fc8e50268d01392824d46790cc9
+size 15024

checkpoint-40000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35ce058f34975a7c9afea28e4aa5020607e1b81b2133db54f141dcf10759b71b
+size 15024

checkpoint-40000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0ae282094e5af5fc3326b545c4ddd1f0b9c7842212200f65028ac05ca82948a0
+size 15024

checkpoint-40000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:825e1818d8a0f8348d506acdab26ab27594e76e01808880216f9807387891534
+size 1064

checkpoint-40000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-40000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:66b2766db25b9b8bf494151fa7b3f46947dd1e41dc8576a87992122e6043123d
+size 6008