Upload folder using huggingface_hub
Browse files- .gitattributes +2 -0
- checkpoint-229000/config.json +79 -0
- checkpoint-229000/generation_config.json +6 -0
- checkpoint-229000/model.safetensors +3 -0
- checkpoint-229000/optimizer.pt +3 -0
- checkpoint-229000/rng_state_0.pth +3 -0
- checkpoint-229000/rng_state_1.pth +3 -0
- checkpoint-229000/rng_state_10.pth +3 -0
- checkpoint-229000/rng_state_11.pth +3 -0
- checkpoint-229000/rng_state_12.pth +3 -0
- checkpoint-229000/rng_state_13.pth +3 -0
- checkpoint-229000/rng_state_14.pth +3 -0
- checkpoint-229000/rng_state_15.pth +3 -0
- checkpoint-229000/rng_state_2.pth +3 -0
- checkpoint-229000/rng_state_3.pth +3 -0
- checkpoint-229000/rng_state_4.pth +3 -0
- checkpoint-229000/rng_state_5.pth +3 -0
- checkpoint-229000/rng_state_6.pth +3 -0
- checkpoint-229000/rng_state_7.pth +3 -0
- checkpoint-229000/rng_state_8.pth +3 -0
- checkpoint-229000/rng_state_9.pth +3 -0
- checkpoint-229000/scheduler.pt +3 -0
- checkpoint-229000/trainer_state.json +3 -0
- checkpoint-229000/training_args.bin +3 -0
- checkpoint-230000/config.json +79 -0
- checkpoint-230000/generation_config.json +6 -0
- checkpoint-230000/model.safetensors +3 -0
- checkpoint-230000/optimizer.pt +3 -0
- checkpoint-230000/rng_state_0.pth +3 -0
- checkpoint-230000/rng_state_1.pth +3 -0
- checkpoint-230000/rng_state_10.pth +3 -0
- checkpoint-230000/rng_state_11.pth +3 -0
- checkpoint-230000/rng_state_12.pth +3 -0
- checkpoint-230000/rng_state_13.pth +3 -0
- checkpoint-230000/rng_state_14.pth +3 -0
- checkpoint-230000/rng_state_15.pth +3 -0
- checkpoint-230000/rng_state_2.pth +3 -0
- checkpoint-230000/rng_state_3.pth +3 -0
- checkpoint-230000/rng_state_4.pth +3 -0
- checkpoint-230000/rng_state_5.pth +3 -0
- checkpoint-230000/rng_state_6.pth +3 -0
- checkpoint-230000/rng_state_7.pth +3 -0
- checkpoint-230000/rng_state_8.pth +3 -0
- checkpoint-230000/rng_state_9.pth +3 -0
- checkpoint-230000/scheduler.pt +3 -0
- checkpoint-230000/trainer_state.json +3 -0
- checkpoint-230000/training_args.bin +3 -0
.gitattributes
CHANGED
@@ -88,3 +88,5 @@ checkpoint-213000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
88 |
checkpoint-219000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
89 |
checkpoint-220000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
90 |
checkpoint-221000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
88 |
checkpoint-219000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
89 |
checkpoint-220000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
90 |
checkpoint-221000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
91 |
+
checkpoint-229000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
92 |
+
checkpoint-230000/trainer_state.json filter=lfs diff=lfs merge=lfs -text
|
checkpoint-229000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMBaseline"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 1,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-in-1.0-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-229000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-229000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1e0edc4e0aaa80a2a6957f67ef8a7a042e8e45e82bfc9b5be9c484379bdf74c2
|
3 |
+
size 4410723984
|
checkpoint-229000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6db4c3ec57b8241b556faa1d70033c18b7c5ffb59809488997416aa3668134f5
|
3 |
+
size 6330255386
|
checkpoint-229000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7b6a149d9f23136484bb709e785756315fed701e1190b33b797abc1404d53e20
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c043b6dcf5ae920bfdea10b77c47cd741dbb78f5963193d3ee836e1a2067198
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e173c1d61c024300dc15811830962b1d5e691ad33eee43f5cf0c9420ebf438e6
|
3 |
+
size 15997
|
checkpoint-229000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:208ba7dfbdb03a933e33442a5b721492fd353c884d95bc6ba42fcaf88969c2e7
|
3 |
+
size 15997
|
checkpoint-229000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:493d031cae1656df0c4f9e82504b671afe6fa918d48c699ad0d9b5f28f8c80b1
|
3 |
+
size 15997
|
checkpoint-229000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99d0b57f3385a80d748131dd6eeafbac70b227583ef1f2d4c976a639942ab0cd
|
3 |
+
size 15997
|
checkpoint-229000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3c1340cd785836267ea932c1589d476d7b4d6d51ee2408c7f2571546e8f88d0b
|
3 |
+
size 15997
|
checkpoint-229000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c0ee0e0ebf591a74d277fe91d7379cdd469defa76781ed198af198d3f57d09c
|
3 |
+
size 15997
|
checkpoint-229000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:024e7a7fecc90b8643cf9e16b522376b04b931f2edabb244975e3492ba619592
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cac3eaa172b1b253c256ba9e7320da0a7247252e78aab3a5ae3f5b698df27b15
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dee7e7c8d4e6be4b53fab5cb69a40d02ff08d7fff31d9d4573fe403f5bf39f0
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:829a0ca311e248e6b6e19ecb27afd57d5bcd85ab0871fba5766bc4a2906ca2ba
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6804954b01765604c8ca83653255ffa1fa3455b8c5b685063849fb5eea0937de
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ad726e230d089ede99cb3831b33771b8d4ba37a060ef24c81ca0b0d4f1afdde
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:935bc40744420d2fc26bcfd48a6c51b74206b123252534daf39ce02181e5b9c8
|
3 |
+
size 15984
|
checkpoint-229000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d2f3ef068d75ad7ee9875e897158c3926c4cb426236c9fb76778feae8b606432
|
3 |
+
size 15984
|
checkpoint-229000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:87bf8cb262af0cbc0422fb8a332bba78c06fa2975259c8aa3cc8e60e1efcc802
|
3 |
+
size 1064
|
checkpoint-229000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc4f82bc0ce9f9bf8ce43bfed758cb671d8cacdcd15bd669a8f5e8833f15fcf5
|
3 |
+
size 35021416
|
checkpoint-229000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9c5f41557bf5b78540cd449032c7079998143a6748f2d58d6dfd615966e3e3b
|
3 |
+
size 5944
|
checkpoint-230000/config.json
ADDED
@@ -0,0 +1,79 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"ar_steps": 1,
|
3 |
+
"architectures": [
|
4 |
+
"DiffVLMBaseline"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"condition_layer": -1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 1536,
|
12 |
+
"image_token_id": 151655,
|
13 |
+
"img_cross_attention_dim": 2048,
|
14 |
+
"img_diffuser_depth": 2,
|
15 |
+
"img_ffn_dim_multiplier": null,
|
16 |
+
"img_hidden_size": 1536,
|
17 |
+
"img_multiple_of": 256,
|
18 |
+
"img_norm_eps": 1e-05,
|
19 |
+
"img_num_attention_heads": 12,
|
20 |
+
"img_num_kv_heads": 12,
|
21 |
+
"img_qk_norm": true,
|
22 |
+
"in_channels": 32,
|
23 |
+
"initializer_range": 0.02,
|
24 |
+
"inject_img_diffuser": false,
|
25 |
+
"input_size": 32,
|
26 |
+
"intermediate_size": 8960,
|
27 |
+
"layer_group_size": 7,
|
28 |
+
"layerwise_start_idx": 0,
|
29 |
+
"lora_alpha": 128,
|
30 |
+
"lora_bias": "none",
|
31 |
+
"lora_dropout": 0.05,
|
32 |
+
"lora_enable": false,
|
33 |
+
"lora_r": 64,
|
34 |
+
"max_position_embeddings": 32768,
|
35 |
+
"max_window_layers": 28,
|
36 |
+
"model_type": "qwen2_vl",
|
37 |
+
"non_linearity": 1,
|
38 |
+
"norm_elementwise_affine": true,
|
39 |
+
"num_attention_heads": 12,
|
40 |
+
"num_hidden_layers": 28,
|
41 |
+
"num_key_value_heads": 2,
|
42 |
+
"patch_size": 1,
|
43 |
+
"repa_coeff": 0.1,
|
44 |
+
"repa_layers": "2",
|
45 |
+
"repa_shared": false,
|
46 |
+
"rms_norm_eps": 1e-06,
|
47 |
+
"rope_scaling": {
|
48 |
+
"mrope_section": [
|
49 |
+
16,
|
50 |
+
24,
|
51 |
+
24
|
52 |
+
],
|
53 |
+
"rope_type": "default",
|
54 |
+
"type": "default"
|
55 |
+
},
|
56 |
+
"rope_theta": 1000000.0,
|
57 |
+
"sample_size": 128,
|
58 |
+
"sampling_steps": 28,
|
59 |
+
"sliding_window": null,
|
60 |
+
"tie_word_embeddings": true,
|
61 |
+
"torch_dtype": "bfloat16",
|
62 |
+
"transformers_version": "4.47.0",
|
63 |
+
"use_cache": true,
|
64 |
+
"use_repa": false,
|
65 |
+
"use_residual_attn": false,
|
66 |
+
"use_sliding_window": false,
|
67 |
+
"vae_path": "mit-han-lab/dc-ae-f32c32-in-1.0-diffusers",
|
68 |
+
"video_token_id": 151656,
|
69 |
+
"vision_config": {
|
70 |
+
"hidden_size": 1536,
|
71 |
+
"in_chans": 3,
|
72 |
+
"model_type": "qwen2_vl",
|
73 |
+
"spatial_patch_size": 14
|
74 |
+
},
|
75 |
+
"vision_end_token_id": 151653,
|
76 |
+
"vision_start_token_id": 151652,
|
77 |
+
"vision_token_id": 151654,
|
78 |
+
"vocab_size": 151936
|
79 |
+
}
|
checkpoint-230000/generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 151643,
|
4 |
+
"eos_token_id": 151645,
|
5 |
+
"transformers_version": "4.47.0"
|
6 |
+
}
|
checkpoint-230000/model.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d1bb92fa8e7214efd7884eacdc18552697ce2513f52172aebf5aa65280f7b45c
|
3 |
+
size 4410723984
|
checkpoint-230000/optimizer.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d98e985f417b718e21586a8d5d913ce6f0274b6f323e3fccd051a2e92d56ecbb
|
3 |
+
size 6330255386
|
checkpoint-230000/rng_state_0.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06e5f77c524a46098fccbce27ff8c3544160ae9a96ee97fa6972f9c0e108ba81
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_1.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b537a4f1d032d764c1f98d757b2ce09a2b5e1b2a803d4aec5efa633e16935409
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_10.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9385ab1b4096ea6b5deda06fd1fe399935521dd93e7526eba8f3c6a1971688d
|
3 |
+
size 15997
|
checkpoint-230000/rng_state_11.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc715c6cd58142dd9d71d76baf7a04e65b7cc7fbfd5e1c0eea23653cb5e1f346
|
3 |
+
size 15997
|
checkpoint-230000/rng_state_12.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cc9c953fb875b835db35929746a3320bdee31e624ce8cab5a8425d9d2b9cff8a
|
3 |
+
size 15997
|
checkpoint-230000/rng_state_13.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95f055ff91941a27f98da569147adaa04367336f534a7df36fe11b7050c0e414
|
3 |
+
size 15997
|
checkpoint-230000/rng_state_14.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38bbd16331bb2cebf72af53e0491cad280c9a8a8a5b1150fc275908c1a2a342a
|
3 |
+
size 15997
|
checkpoint-230000/rng_state_15.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e8d3969ebc61591d901adba7a8593b929159755c12bde573c7b6fcda6f541bf8
|
3 |
+
size 15997
|
checkpoint-230000/rng_state_2.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3d3973c1a3917b38d4657d90cf0cf5512f61857fc4c57bf92950f8fd0d7c20a
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_3.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5863cf7588deb93984974b602e0ebbe2b6c173664e74507ce380f486d467d9e6
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_4.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f04e1151e5eec2b6ada90c38f53fb1708c941e313486f67c39db06a0dd5c9182
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_5.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08aeb0fb9528296b0ddf53b068376517ca4b8022a7d1226bad26db6b7118ca17
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_6.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:42556155d07f2ee1c12fa8a73e221a944893d834b94088af048703914cee5915
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_7.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:14cfcfaa413a6215a5173c7b9c2bfe82d5cf006b8b8753c022e2ddb556793288
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_8.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a207e687b67f7dc07e33f02573aade2cdeff25cdeb80aef49e40a13b4dc03b5e
|
3 |
+
size 15984
|
checkpoint-230000/rng_state_9.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:610a5fa6d18438e3b679b412fa581602b976b72d37eb64edf6625fc7a5e96cbd
|
3 |
+
size 15984
|
checkpoint-230000/scheduler.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1316ffc28af177d66590d5f4174f2d06882f1ed25a04a4b1e7438ac664ec7c9e
|
3 |
+
size 1064
|
checkpoint-230000/trainer_state.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b18268704c3f1389de12b04e171c23804fca6347fa66474e1ca051b53e971b51
|
3 |
+
size 35174710
|
checkpoint-230000/training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a9c5f41557bf5b78540cd449032c7079998143a6748f2d58d6dfd615966e3e3b
|
3 |
+
size 5944
|