bilbo991 committed on
Commit
f93a9fc
·
1 Parent(s): 43cfedf

End of training

Browse files
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
all_results.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_loss": 3.327958106994629,
4
+ "eval_runtime": 127.0788,
5
+ "eval_samples_per_second": 78.691,
6
+ "eval_steps_per_second": 2.463,
7
+ "train_loss": 3.383876552723975,
8
+ "train_runtime": 1383.4982,
9
+ "train_samples_per_second": 21.684,
10
+ "train_steps_per_second": 0.679
11
+ }
eval_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "eval_loss": 3.327958106994629,
4
+ "eval_runtime": 127.0788,
5
+ "eval_samples_per_second": 78.691,
6
+ "eval_steps_per_second": 2.463
7
+ }
preprocessor_config.json ADDED
@@ -0,0 +1,28 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "crop_size": {
3
+ "height": 224,
4
+ "width": 224
5
+ },
6
+ "do_center_crop": true,
7
+ "do_convert_rgb": true,
8
+ "do_normalize": true,
9
+ "do_rescale": true,
10
+ "do_resize": true,
11
+ "image_mean": [
12
+ 0.48145466,
13
+ 0.4578275,
14
+ 0.40821073
15
+ ],
16
+ "image_processor_type": "CLIPImageProcessor",
17
+ "image_std": [
18
+ 0.26862954,
19
+ 0.26130258,
20
+ 0.27577711
21
+ ],
22
+ "processor_class": "VisionTextDualEncoderProcessor",
23
+ "resample": 3,
24
+ "rescale_factor": 0.00392156862745098,
25
+ "size": {
26
+ "shortest_edge": 224
27
+ }
28
+ }
runs/Aug10_13-46-15_cvrl-flynn-ws2/events.out.tfevents.1691691156.cvrl-flynn-ws2.4174.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5368561400b6a6eb1e8a4582922586c09b273cba77b95f9eb44a78859e12be9
3
+ size 359
special_tokens_map.json ADDED
@@ -0,0 +1,15 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "cls_token": "<s>",
4
+ "eos_token": "</s>",
5
+ "mask_token": {
6
+ "content": "<mask>",
7
+ "lstrip": true,
8
+ "normalized": false,
9
+ "rstrip": false,
10
+ "single_word": false
11
+ },
12
+ "pad_token": "<pad>",
13
+ "sep_token": "</s>",
14
+ "unk_token": "<unk>"
15
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4c08c80d1df11b82ada2fd707562f86a9ebd5b7de04f51ebd2b49f2cd5906d00
3
+ size 17082925
tokenizer_config.json ADDED
@@ -0,0 +1,20 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token": "<s>",
3
+ "clean_up_tokenization_spaces": true,
4
+ "cls_token": "<s>",
5
+ "eos_token": "</s>",
6
+ "mask_token": {
7
+ "__type": "AddedToken",
8
+ "content": "<mask>",
9
+ "lstrip": true,
10
+ "normalized": true,
11
+ "rstrip": false,
12
+ "single_word": false
13
+ },
14
+ "model_max_length": 512,
15
+ "pad_token": "<pad>",
16
+ "processor_class": "VisionTextDualEncoderProcessor",
17
+ "sep_token": "</s>",
18
+ "tokenizer_class": "XLMRobertaTokenizer",
19
+ "unk_token": "<unk>"
20
+ }
train_results.json ADDED
@@ -0,0 +1,7 @@
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 3.0,
3
+ "train_loss": 3.383876552723975,
4
+ "train_runtime": 1383.4982,
5
+ "train_samples_per_second": 21.684,
6
+ "train_steps_per_second": 0.679
7
+ }
trainer_state.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 3.327958106994629,
3
+ "best_model_checkpoint": "clip-roberta-10k/checkpoint-939",
4
+ "epoch": 3.0,
5
+ "global_step": 939,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 1.0,
12
+ "eval_loss": 3.4277737140655518,
13
+ "eval_runtime": 117.2709,
14
+ "eval_samples_per_second": 85.273,
15
+ "eval_steps_per_second": 2.669,
16
+ "step": 313
17
+ },
18
+ {
19
+ "epoch": 1.6,
20
+ "learning_rate": 2.3375931842385517e-05,
21
+ "loss": 3.4415,
22
+ "step": 500
23
+ },
24
+ {
25
+ "epoch": 2.0,
26
+ "eval_loss": 3.3748862743377686,
27
+ "eval_runtime": 131.3188,
28
+ "eval_samples_per_second": 76.151,
29
+ "eval_steps_per_second": 2.384,
30
+ "step": 626
31
+ },
32
+ {
33
+ "epoch": 3.0,
34
+ "eval_loss": 3.327958106994629,
35
+ "eval_runtime": 131.0009,
36
+ "eval_samples_per_second": 76.335,
37
+ "eval_steps_per_second": 2.389,
38
+ "step": 939
39
+ },
40
+ {
41
+ "epoch": 3.0,
42
+ "step": 939,
43
+ "total_flos": 4005518400000000.0,
44
+ "train_loss": 3.383876552723975,
45
+ "train_runtime": 1383.4982,
46
+ "train_samples_per_second": 21.684,
47
+ "train_steps_per_second": 0.679
48
+ }
49
+ ],
50
+ "max_steps": 939,
51
+ "num_train_epochs": 3,
52
+ "total_flos": 4005518400000000.0,
53
+ "trial_name": null,
54
+ "trial_params": null
55
+ }