Upload folder using huggingface_hub
Browse files- .gitattributes +2 -0
- checkpoint-119000/config.json +79 -0
- checkpoint-119000/generation_config.json +6 -0
- checkpoint-119000/model.safetensors +3 -0
- checkpoint-119000/optimizer.pt +3 -0
- checkpoint-119000/rng_state_0.pth +3 -0
- checkpoint-119000/rng_state_1.pth +3 -0
- checkpoint-119000/rng_state_10.pth +3 -0
- checkpoint-119000/rng_state_11.pth +3 -0
- checkpoint-119000/rng_state_12.pth +3 -0
- checkpoint-119000/rng_state_13.pth +3 -0
- checkpoint-119000/rng_state_14.pth +3 -0
- checkpoint-119000/rng_state_15.pth +3 -0
- checkpoint-119000/rng_state_2.pth +3 -0
- checkpoint-119000/rng_state_3.pth +3 -0
- checkpoint-119000/rng_state_4.pth +3 -0
- checkpoint-119000/rng_state_5.pth +3 -0
- checkpoint-119000/rng_state_6.pth +3 -0
- checkpoint-119000/rng_state_7.pth +3 -0
- checkpoint-119000/rng_state_8.pth +3 -0
- checkpoint-119000/rng_state_9.pth +3 -0
- checkpoint-119000/scheduler.pt +3 -0
- checkpoint-119000/trainer_state.json +3 -0
- checkpoint-119000/training_args.bin +3 -0
- checkpoint-120000/config.json +79 -0
- checkpoint-120000/generation_config.json +6 -0
- checkpoint-120000/model.safetensors +3 -0
- checkpoint-120000/optimizer.pt +3 -0
- checkpoint-120000/rng_state_0.pth +3 -0
- checkpoint-120000/rng_state_1.pth +3 -0
- checkpoint-120000/rng_state_10.pth +3 -0
- checkpoint-120000/rng_state_11.pth +3 -0
- checkpoint-120000/rng_state_12.pth +3 -0
- checkpoint-120000/rng_state_13.pth +3 -0
- checkpoint-120000/rng_state_14.pth +3 -0
- checkpoint-120000/rng_state_15.pth +3 -0
- checkpoint-120000/rng_state_2.pth +3 -0
- checkpoint-120000/rng_state_3.pth +3 -0
- checkpoint-120000/rng_state_4.pth +3 -0
- checkpoint-120000/rng_state_5.pth +3 -0
- checkpoint-120000/rng_state_6.pth +3 -0
- checkpoint-120000/rng_state_7.pth +3 -0
- checkpoint-120000/rng_state_8.pth +3 -0
- checkpoint-120000/rng_state_9.pth +3 -0
- checkpoint-120000/scheduler.pt +3 -0
- checkpoint-120000/trainer_state.json +3 -0
- checkpoint-120000/training_args.bin +3 -0
.gitattributes
CHANGED
@@ -56,3 +56,5 @@ checkpoint-112000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
56 |
checkpoint-113000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
57 |
checkpoint-114000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
58 |
checkpoint-115000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
56 |
checkpoint-113000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
57 |
checkpoint-114000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
58 |
checkpoint-115000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
59 |
+
checkpoint-119000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
60 |
+
checkpoint-120000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
checkpoint-119000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMDiffusion"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 2,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-119000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-119000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7ab0172d7e8c1d45776f891f46615073cf1b9f60172a1d22fde14e0b870e6b2
|
3 |
+
size 4538452374
|
checkpoint-119000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1843a116394838b7eb05938fb2cf9f43b2bd6fcf84a51346d227e89047448ee1
|
3 |
+
size 6630551906
|
checkpoint-119000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a97e4f2d5365133e19d171b3055869e705a2534f6ffd0c4191ea386d5d55d44b
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:72e4ac2777f19ea5538ecf6863f2ba5b76a345611aa321695ba3e56ceef6e219
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86c2ca4ac7ac39e82f700acce3ee81e084435adb55ea9f3f228236abd766e214
|
3 |
+
size 15997
|
checkpoint-119000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15985eff4926fd8bca2bad09a59817950d7c011437c77bc555862f414ca30296
|
3 |
+
size 15997
|
checkpoint-119000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82bd9c8e550999c5e3616e1f70cb06ec25668020cd075a074d869c1c05396a81
|
3 |
+
size 15997
|
checkpoint-119000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38342150af1579cbc567e1262a5a333ff0e3a037daf2e25e60c9fc8b2eedd0a9
|
3 |
+
size 15997
|
checkpoint-119000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b31cdd30842d5884a3ed1d133fda70e5e96d555f2bce92a8ed02946dba0989d9
|
3 |
+
size 15997
|
checkpoint-119000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:29da03835c56d97eb14761c14256bfdeeb0253ef99bc605bc60f1e7f9b714be0
|
3 |
+
size 15997
|
checkpoint-119000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35005b7cdb6a740dbf6756b00aa1169034ccbcde944a153cd0360b6504883935
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2f9c4269323bc5b667cd2c73a974e6bd168e468d28d7793d5c6839331d2db24
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19735972c1c831322fb9ac87079a8e99d5b8a8c36d75afbb681000fe5ab61345
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2b30c1097b1937bbf8ddc7960daa89b9d3207cff20d73bf1b4c86fde2db77c9f
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:12f08c92147f5d5deb37fa9d15bdab49635d97a8f51b6f1282a72a0cf3495d7e
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec375ed83c6fcf3f15930d64284ad8da5f4c2b6991249faea3bf2eb5aece5801
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:09cca6e38a7c7ab60160d97349c0e357b1e92d65cc98584f35603a39a1b692ea
|
3 |
+
size 15984
|
checkpoint-119000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a945b099d12e971622d8f13dc037db106610f61a26cd25a6cb46b178d379658
|
3 |
+
size 15984
|
checkpoint-119000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:648c1a2362cc979baf9c1786772067fe74dd5893470c67ea8b1956020207a333
|
3 |
+
size 1064
|
checkpoint-119000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26a8050abf7d078b6cd109d52f12e701f36a741ebadcce60e29ef13082fcb0ff
|
3 |
+
size 18423107
|
checkpoint-119000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acaa7c6ae2d4ff896e71743a00e9a9fb5c55da63567f670ba0d14f25ced8ad75
|
3 |
+
size 6008
|
checkpoint-120000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMDiffusion"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 2,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-sana-1.1-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-120000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-120000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e860aa8b77375f7ae357f60207ee24dc5c680be57f0c13edd53540d3dd536ef1
|
3 |
+
size 4538452374
|
checkpoint-120000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:895b89ca1931496023efd06e35bff944064194a9a20f2cd1493a47ccd9542a2e
|
3 |
+
size 6630551906
|
checkpoint-120000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56a227ccbc0834cc7233952054156cedd85a633b691852354c9e0d8ea0d28151
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8de6a095731b261a18847adff24c08067ecab5b8a3c96aec710603f4e32296fa
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65bd70d0ee44aa3e7571221f0a99f15f534ca0c67021289e269d0ad497cf40b7
|
3 |
+
size 15997
|
checkpoint-120000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4654f4886509650d1b4364448c2827094d0993baf284dae67ac9ec822d71b90
|
3 |
+
size 15997
|
checkpoint-120000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4573286c5994c4b4e2611e8cd07dd182b2ceed775e2efa1c715cece8f906a255
|
3 |
+
size 15997
|
checkpoint-120000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ae26a8ed9c886988646eafb527465a684ab2b2e69e8afc2470655a31c96c55c6
|
3 |
+
size 15997
|
checkpoint-120000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab5fc16a80aa3667e69a0f28e775c6e94941259f7b5a688bdc0951cdce3d42c8
|
3 |
+
size 15997
|
checkpoint-120000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:75275d3c48cfb49f258dcb149618fa101a998332a0427c79ca1effc2d577a5e4
|
3 |
+
size 15997
|
checkpoint-120000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ab85a24f532cd4b66783d82cba67127058fdfe26087e1383572d8e3b78c607d9
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6965c72ed4a334bec110873edbc7905a279ea199d0dd05a6a1135bb5aa008c27
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:94a7abd787aef27a8b5cb71d7bef17ce669dd3448bf14601db1156410e72971a
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c7ae40d4eb426ed5e532d9677071758a440323d6cd3327a200231d2d375e7509
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b3a8b05b08f6d6b84c0add90f84b236c1c7a91ea121f9937dca905a3207023d
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e6f9aa1d7e631f4c037b5b1fcdb82563d5fc41afcfbaedbf05cb5cdce4c2c03a
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99c346d66a67186345d15eac7df865ac4e1036de077587b90cff7017c0a95ebd
|
3 |
+
size 15984
|
checkpoint-120000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c272288c6eb17a55a73ffe3f76820e2c84b115b95439b9dece8a39741d2331b
|
3 |
+
size 15984
|
checkpoint-120000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7506e59efcfc89320b42c0af18120fa2b1e15e421c9d1fa6fe7de5b6fc0406ed
|
3 |
+
size 1064
|
checkpoint-120000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b49beed6a460924c26d3549664f3bb1156cd34337a73f00abea835622a6f46b
|
3 |
+
size 18578703
|
checkpoint-120000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acaa7c6ae2d4ff896e71743a00e9a9fb5c55da63567f670ba0d14f25ced8ad75
|
3 |
+
size 6008
|