Upload folder using huggingface_hub
Browse files- .gitattributes +2 -0
- checkpoint-168000/config.json +79 -0
- checkpoint-168000/generation_config.json +6 -0
- checkpoint-168000/model.safetensors +3 -0
- checkpoint-168000/optimizer.pt +3 -0
- checkpoint-168000/rng_state_0.pth +3 -0
- checkpoint-168000/rng_state_1.pth +3 -0
- checkpoint-168000/rng_state_10.pth +3 -0
- checkpoint-168000/rng_state_11.pth +3 -0
- checkpoint-168000/rng_state_12.pth +3 -0
- checkpoint-168000/rng_state_13.pth +3 -0
- checkpoint-168000/rng_state_14.pth +3 -0
- checkpoint-168000/rng_state_15.pth +3 -0
- checkpoint-168000/rng_state_2.pth +3 -0
- checkpoint-168000/rng_state_3.pth +3 -0
- checkpoint-168000/rng_state_4.pth +3 -0
- checkpoint-168000/rng_state_5.pth +3 -0
- checkpoint-168000/rng_state_6.pth +3 -0
- checkpoint-168000/rng_state_7.pth +3 -0
- checkpoint-168000/rng_state_8.pth +3 -0
- checkpoint-168000/rng_state_9.pth +3 -0
- checkpoint-168000/scheduler.pt +3 -0
- checkpoint-168000/trainer_state.json +3 -0
- checkpoint-168000/training_args.bin +3 -0
- checkpoint-169000/config.json +79 -0
- checkpoint-169000/generation_config.json +6 -0
- checkpoint-169000/model.safetensors +3 -0
- checkpoint-169000/optimizer.pt +3 -0
- checkpoint-169000/rng_state_0.pth +3 -0
- checkpoint-169000/rng_state_1.pth +3 -0
- checkpoint-169000/rng_state_10.pth +3 -0
- checkpoint-169000/rng_state_11.pth +3 -0
- checkpoint-169000/rng_state_12.pth +3 -0
- checkpoint-169000/rng_state_13.pth +3 -0
- checkpoint-169000/rng_state_14.pth +3 -0
- checkpoint-169000/rng_state_15.pth +3 -0
- checkpoint-169000/rng_state_2.pth +3 -0
- checkpoint-169000/rng_state_3.pth +3 -0
- checkpoint-169000/rng_state_4.pth +3 -0
- checkpoint-169000/rng_state_5.pth +3 -0
- checkpoint-169000/rng_state_6.pth +3 -0
- checkpoint-169000/rng_state_7.pth +3 -0
- checkpoint-169000/rng_state_8.pth +3 -0
- checkpoint-169000/rng_state_9.pth +3 -0
- checkpoint-169000/scheduler.pt +3 -0
- checkpoint-169000/trainer_state.json +3 -0
- checkpoint-169000/training_args.bin +3 -0
.gitattributes
CHANGED
@@ -77,3 +77,5 @@ checkpoint-157000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
77 |
checkpoint-159000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
78 |
checkpoint-160000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
79 |
checkpoint-161000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
77 |
checkpoint-159000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
78 |
checkpoint-160000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
79 |
checkpoint-161000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
80 |
+
checkpoint-168000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
81 |
+
checkpoint-169000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
checkpoint-168000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMDiffusion"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 2,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-168000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-168000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:864bc3dfb85898f714496ba232e581624e8df07656d414b34ead803fc28eca58
|
3 |
+
size 4538452374
|
checkpoint-168000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60c32710892400c09b359cc7adebfd421c41834d20660d53aa98b61f6a5a2fa3
|
3 |
+
size 6630551906
|
checkpoint-168000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bd879f0a85629f26275208944052b96fe6dc5701bf37f01e55f484389f0419c
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6436d18d10ace2540296dae77c9f0ea9c37eead19e2b89e31063b363d6597e0e
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8d927271bca68ea59bfcb88c0faa4b7e705b1916e752d8c13b97808f57616637
|
3 |
+
size 15997
|
checkpoint-168000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f70b378554bc2b53b2eb7900390299e3bb2894b5092f96ccf4283afb1bccc07a
|
3 |
+
size 15997
|
checkpoint-168000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65bd414648daf6de10ab62b6a7ea0465cdfd7f28193534c9e3974eefb93cea96
|
3 |
+
size 15997
|
checkpoint-168000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f27d1a8257bfd68118455fa2f8aca374ba6f2581a43f664a9b154edfdc97d3fc
|
3 |
+
size 15997
|
checkpoint-168000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb6f5337c26779e7d106a6bfe58d780ba3872bb14a58b276dfd450ab72726c84
|
3 |
+
size 15997
|
checkpoint-168000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:182d7305349dea99745d45b906fadf27fb4fdedc74eaaee6a94310e4a236dd50
|
3 |
+
size 15997
|
checkpoint-168000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4373cf29eb2dfa4e6a8ef2a7ac4bac7240f5187a1ce8ab2b0f37cd2cacc20ce6
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eaf3ec6c2b600020f6696745f30dcd62fa9cb1a85cd4d75097af6b9e96ff562a
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ffc8dfcee775c49d113b77ba66b0bbd0eaf63c7757127aa0b890bf54d34c504c
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b00338f98aa37f1511360777ca049fd3aa002cd2307752b96e8ac8788fd40a0
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fde5d58b4bb646e820fdf362c13a2fd7bd55b64e6a02aed8a28a0b62bee58aab
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08dd594a62fdf851a551b54324b75342c07a960f2e994d51ea6fe120dc8e47c9
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfc759386a042e79720a9ea48cd0ac075bc7219d07c736d2b05254cee1a3295c
|
3 |
+
size 15984
|
checkpoint-168000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a5342e15f91bb7006ffd0e2d4f34d13712469ef7255ab7708d495bc92c4a5c1
|
3 |
+
size 15984
|
checkpoint-168000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e94f53e58fab073054663909f40de5ec9693ca4521dc5a6fc31f7da4297502f0
|
3 |
+
size 1064
|
checkpoint-168000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cc945d303237ec2617a0090eabc876f1abdf3c253b81b78167650c2226e3839
|
3 |
+
size 26054153
|
checkpoint-168000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8b32699bbc7e6238e84a62335a2010385954210922ec91b8bc8ab0278e89c56
|
3 |
+
size 6008
|
checkpoint-169000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMDiffusion"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 2,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-169000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-169000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:58ad71b119887354dc2e42879c89d9872fb1644ebc1d85a6ccefc4efaa512a0b
|
3 |
+
size 4538452374
|
checkpoint-169000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:feb80de96641267aa92f72ca238d1f963d3251b5f58b162e9514c400fa4d74c2
|
3 |
+
size 6630551906
|
checkpoint-169000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de8adc173498d12e63f1e9a48660383fdb0e76ba284e33d145c2e7afc8136b6e
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:745147b62cf07252d4a506fc3173059a921140f987890d8c6e8deef1db7c2283
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b41a227645651679958ef755d012eda2f8e4bb188ccdec79a5fa5a4701bcab0
|
3 |
+
size 15997
|
checkpoint-169000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1203c477bb8bd0f324e9e1df5732d8c6d061a1a3b17a474b4563bdc705771d70
|
3 |
+
size 15997
|
checkpoint-169000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:51f9ba4cc8b41a9580e6ae2c36f3f6cb7725e78f73ab96a8ab4cd9b44c85f057
|
3 |
+
size 15997
|
checkpoint-169000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbfe3af346238e934ddf2d202b28b98e50072baeb91069510d18b86951cf28d2
|
3 |
+
size 15997
|
checkpoint-169000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d91d1133cd24ba00278a74bc1a5451f70ad648ba4d41f490437c07de83eb8639
|
3 |
+
size 15997
|
checkpoint-169000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3cecacc172343afc6f4e7804eb2f147731c6a4ed3a0a733538d9dd01048333ae
|
3 |
+
size 15997
|
checkpoint-169000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4216844a14102750c7f12d40443c53fea98d664e1cc520852f40e53b8d5f8841
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97386d5d2b1167d43526ffe624dab00a918c5604ac05c38ded295871d3194294
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32298e0ccfaf1fa1ae15bee9131bb6650c825b19bfb8cc0e0960373c81bbd475
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74bf57f11c4e2ab3e13125d1a302c7db3af6e713c50f26afff669f0cd082957f
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:406f4c339362b05a12dc21313ec2481fbcdc2681b4bd653433a55f0fcbdef6cc
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6c8f21eba8b4b1273d03e5c2a51fc4d8924f89bef6294454295d68423035a65
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99ec412f574075bf93c1fddfc340b6d602411642482f5d41a9b08a0ad8ad73b9
|
3 |
+
size 15984
|
checkpoint-169000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9d4d1157b2b5ea1fc44db0690cc34e4d21a53146b67e4d236d4919ea1f8237b
|
3 |
+
size 15984
|
checkpoint-169000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83de56ae994f16992f17aaac3675983d0052ef337b3aec07d00c998a5092c000
|
3 |
+
size 1064
|
checkpoint-169000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:92710de0bb32e768e50bf52d7661c44ea1075290ba02f6a572ac3901f6035b41
|
3 |
+
size 26209596
|
checkpoint-169000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a953b73b9bdf726b40a7c48f803f02dcafb46ce7e5d75ed7831868bf46ad6984
|
3 |
+
size 5944
|