Upload folder using huggingface_hub
Browse files- .gitattributes +2 -0
- checkpoint-132000/config.json +79 -0
- checkpoint-132000/generation_config.json +6 -0
- checkpoint-132000/model.safetensors +3 -0
- checkpoint-132000/optimizer.pt +3 -0
- checkpoint-132000/rng_state_0.pth +3 -0
- checkpoint-132000/rng_state_1.pth +3 -0
- checkpoint-132000/rng_state_10.pth +3 -0
- checkpoint-132000/rng_state_11.pth +3 -0
- checkpoint-132000/rng_state_12.pth +3 -0
- checkpoint-132000/rng_state_13.pth +3 -0
- checkpoint-132000/rng_state_14.pth +3 -0
- checkpoint-132000/rng_state_15.pth +3 -0
- checkpoint-132000/rng_state_2.pth +3 -0
- checkpoint-132000/rng_state_3.pth +3 -0
- checkpoint-132000/rng_state_4.pth +3 -0
- checkpoint-132000/rng_state_5.pth +3 -0
- checkpoint-132000/rng_state_6.pth +3 -0
- checkpoint-132000/rng_state_7.pth +3 -0
- checkpoint-132000/rng_state_8.pth +3 -0
- checkpoint-132000/rng_state_9.pth +3 -0
- checkpoint-132000/scheduler.pt +3 -0
- checkpoint-132000/trainer_state.json +3 -0
- checkpoint-132000/training_args.bin +3 -0
- checkpoint-133000/config.json +79 -0
- checkpoint-133000/generation_config.json +6 -0
- checkpoint-133000/model.safetensors +3 -0
- checkpoint-133000/optimizer.pt +3 -0
- checkpoint-133000/rng_state_0.pth +3 -0
- checkpoint-133000/rng_state_1.pth +3 -0
- checkpoint-133000/rng_state_10.pth +3 -0
- checkpoint-133000/rng_state_11.pth +3 -0
- checkpoint-133000/rng_state_12.pth +3 -0
- checkpoint-133000/rng_state_13.pth +3 -0
- checkpoint-133000/rng_state_14.pth +3 -0
- checkpoint-133000/rng_state_15.pth +3 -0
- checkpoint-133000/rng_state_2.pth +3 -0
- checkpoint-133000/rng_state_3.pth +3 -0
- checkpoint-133000/rng_state_4.pth +3 -0
- checkpoint-133000/rng_state_5.pth +3 -0
- checkpoint-133000/rng_state_6.pth +3 -0
- checkpoint-133000/rng_state_7.pth +3 -0
- checkpoint-133000/rng_state_8.pth +3 -0
- checkpoint-133000/rng_state_9.pth +3 -0
- checkpoint-133000/scheduler.pt +3 -0
- checkpoint-133000/trainer_state.json +3 -0
- checkpoint-133000/training_args.bin +3 -0
.gitattributes
CHANGED
@@ -64,3 +64,5 @@ checkpoint-124000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
64 |
checkpoint-125000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
65 |
checkpoint-129000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
66 |
checkpoint-130000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
64 |
checkpoint-125000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
65 |
checkpoint-129000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
66 |
checkpoint-130000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
67 |
+
checkpoint-132000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
68 |
+
checkpoint-133000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
checkpoint-132000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMDiffusion"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 2,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-132000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-132000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:690d9e8af347be05811cc6a159ab5e85536d58d1bd55e8ca18ba491e5049dd13
|
3 |
+
size 4538452374
|
checkpoint-132000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfec93174f72b757896344374091f24b25009a0900f9b44141164b878b22520b
|
3 |
+
size 6630551906
|
checkpoint-132000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e92c0d362214349bf408e8a48dc1b9d5acdad6cbad45568243f3ef39107330a0
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1743f9caf45d88a336760b79a4b76d09f357bb31f69706da6f6b2d0a91b380e
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2dd22ccefeb7715911daf714ec1ff9674c29e6d80bef81e27e7b7112bd8f28ef
|
3 |
+
size 15997
|
checkpoint-132000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e33c4dc8386ef53b55b6f0c38de20a38909a7abcdf032a76fa26be68ae13a6e
|
3 |
+
size 15997
|
checkpoint-132000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fcb0f1bd47772ea7af5a7bb7cf8f5846839a9cde3cac95a354a622532072069
|
3 |
+
size 15997
|
checkpoint-132000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e37f71fca0878962db5f2a95a9c47381eaac675adceaf3e0e046278595f3d53e
|
3 |
+
size 15997
|
checkpoint-132000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3972b0a34e492269c0257e7bb2e5e9b5d115556a26945b357a929ad9b24a1d
|
3 |
+
size 15997
|
checkpoint-132000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18b21aeb2539843e641a0f9a97059c7e54d7735571b65f9f47678013b39651b0
|
3 |
+
size 15997
|
checkpoint-132000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4899839ea856cea8463fad2c42d8eff2953478a14408f1761e9eed1d0d153ef8
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d589d86d265c973d1b51bc6df0a6ffa89d9b70d52e5a1c532162e21694e69354
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:871ce3ce4d84fed13d62a280c2b05bb3c014963485abadf17660b14405e0d38a
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81bafe92cff5ba0bb152462eb7efe0b0a63af13d8ac5636f709d3232f8297527
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f82e22cea08f759e28c0a99a83c24fd4ecfdcbccc8b0c6d19897db953661d3a
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ca7da9dec0bdacff08727e69648e11c32397e165d40208db4b8b167a0ee37c8
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ed7704074532ce0ea861c1b1fbc116be3fb0651826791f5bd94793490cb9aba
|
3 |
+
size 15984
|
checkpoint-132000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:78b9331e3d740b9b5333da0d7b70bb6c38c4c33f104092618026dbe13f1179fd
|
3 |
+
size 15984
|
checkpoint-132000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ffa8bf1429574ee07b3782d9886351a7c39e396e0bbc70f2adcf6a48437f0d3
|
3 |
+
size 1064
|
checkpoint-132000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c719ba9d5e1f1ba88e2bc7597363ecfa7c423579c691b036c836a66ca354c77
|
3 |
+
size 20447258
|
checkpoint-132000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3203b22e20d61aa91f3f02b462125020339348687e668ab4fd5e01e20a7c85cb
|
3 |
+
size 6008
|
checkpoint-133000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMDiffusion"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 2,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-133000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-133000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59d9c7428d083ea72e992d8de429b2a962def6ff88310ec161934e4fe852c056
|
3 |
+
size 4538452374
|
checkpoint-133000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dfce75d92cc5ee3ddc7a6c626c42cda1d44e192873a9a81c0d26c82e0ebd2dbe
|
3 |
+
size 6630551906
|
checkpoint-133000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a6c77ac9a1e217f6f5cbf2c166fb9e142c9db1351a65638e419d7b12136d3d3
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b613feaddb40be695e622ba311cca1fe24c8ecec828f1339c574b8f2f5194506
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dff86b167bf96ef1f142e47956f7c75ce6a97caad3dbfbd01eb4810740b9d3ce
|
3 |
+
size 15997
|
checkpoint-133000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8510a185babb01a2ebf31c7c64561f68ac10482216922a900db9bbdda6362e35
|
3 |
+
size 15997
|
checkpoint-133000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b48225d91169b126d8b69080a6a87c1c8a16c8d79da78918d947d03369a628cd
|
3 |
+
size 15997
|
checkpoint-133000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c821d49f6eada136e366e3340ea2ff6fedd0a4d3afe271e0937dc4d2a3263a59
|
3 |
+
size 15997
|
checkpoint-133000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2edad7934c7e0f1a734f48a6d7426f88356d4052304eebb262ac5e2d586435c
|
3 |
+
size 15997
|
checkpoint-133000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:235df1060c745806de684c3dd37106912059ee0fe13cd41af50d0e635407c6bd
|
3 |
+
size 15997
|
checkpoint-133000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b9835937281921e7924ce254a66f956343f8926193bbf8f942a182c7867f8e3
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb04b4c29b8e4cfaf60a8cae2418e90cc4d07feb054ed2af898af3393a6b907f
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21f28c6bf4121f5c47ef6c4061eb153bb673166122e65a90dc836db592e0c0a4
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c82208c9ccc92d86e1a57cface0d39dbcb5e922a4eb632673818ef93157f7955
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ec3966680147c0cbe11d602ef3b0f62f60c6a57cbe5d5247d7cd7412d5ba5a8
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1c85a18dac593f2c26a47afa4a500e19b69f7443cb4e8541daeb368224f6030a
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ed3839505e0ee87269cbe28c943c5c5e33f8638dda93b008aa4171a56ab14a4c
|
3 |
+
size 15984
|
checkpoint-133000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:503613116baad3c509d3e02eba5a828c1c85aa9f6f953352ba321b2467f242a8
|
3 |
+
size 15984
|
checkpoint-133000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d160eb063d90aeb536da903ba2c387ca3a10d87ce3f6c8ae315e21198d632a
|
3 |
+
size 1064
|
checkpoint-133000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:36b07a72352333241443a13d7d4fa8fa8414635834dde720214596dc67e33a11
|
3 |
+
size 20603014
|
checkpoint-133000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2249053f2df631376158cbe7753f768696a3970d402ba540d194b401cdc7f7fc
|
3 |
+
size 5944
|