A-Mahla HF Staff committed on
Commit
e7129dd
·
verified ·
1 Parent(s): de0b30a

End of training

Browse files
Files changed (4) hide show
  1. README.md +5 -1
  2. all_results.json +5 -0
  3. config.json +1 -1
  4. eval_results.json +4 -4
README.md CHANGED
@@ -1,8 +1,12 @@
1
  ---
 
2
  library_name: transformers
3
  model_name: SmolVLM2-2.2B-Instruct-Agentic-GUI
4
  tags:
5
  - generated_from_trainer
 
 
 
6
  - trl
7
  - sft
8
  licence: license
@@ -10,7 +14,7 @@ licence: license
10
 
11
  # Model Card for SmolVLM2-2.2B-Instruct-Agentic-GUI
12
 
13
- This model is a fine-tuned version of [None](https://huggingface.co/None).
14
  It has been trained using [TRL](https://github.com/huggingface/trl).
15
 
16
  ## Quick start
 
1
  ---
2
+ datasets: smolagents/aguvis-stage-2
3
  library_name: transformers
4
  model_name: SmolVLM2-2.2B-Instruct-Agentic-GUI
5
  tags:
6
  - generated_from_trainer
7
+ - open-r1
8
+ - vision-language
9
+ - vlm
10
  - trl
11
  - sft
12
  licence: license
 
14
 
15
  # Model Card for SmolVLM2-2.2B-Instruct-Agentic-GUI
16
 
17
+ This model is a fine-tuned version of [None](https://huggingface.co/None) on the [smolagents/aguvis-stage-2](https://huggingface.co/datasets/smolagents/aguvis-stage-2) dataset.
18
  It has been trained using [TRL](https://github.com/huggingface/trl).
19
 
20
  ## Quick start
all_results.json CHANGED
@@ -1,4 +1,9 @@
1
  {
 
 
 
 
 
2
  "total_flos": 1.0314062938243072e+16,
3
  "train_loss": 0.7184352108531378,
4
  "train_runtime": 49977.4428,
 
1
  {
2
+ "eval_loss": 0.6482115983963013,
3
+ "eval_runtime": 149.9453,
4
+ "eval_samples": 3639,
5
+ "eval_samples_per_second": 24.269,
6
+ "eval_steps_per_second": 0.76,
7
  "total_flos": 1.0314062938243072e+16,
8
  "train_loss": 0.7184352108531378,
9
  "train_runtime": 49977.4428,
config.json CHANGED
@@ -120,7 +120,7 @@
120
  "tie_word_embeddings": false,
121
  "torch_dtype": "bfloat16",
122
  "transformers_version": "4.54.1",
123
- "use_cache": false,
124
  "use_reentrant_checkpointing": false,
125
  "vision_config": {
126
  "attention_dropout": 0.0,
 
120
  "tie_word_embeddings": false,
121
  "torch_dtype": "bfloat16",
122
  "transformers_version": "4.54.1",
123
+ "use_cache": true,
124
  "use_reentrant_checkpointing": false,
125
  "vision_config": {
126
  "attention_dropout": 0.0,
eval_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "eval_loss": 0.5039201974868774,
3
- "eval_runtime": 159.8129,
4
  "eval_samples": 3639,
5
- "eval_samples_per_second": 22.77,
6
- "eval_steps_per_second": 0.713
7
  }
 
1
  {
2
+ "eval_loss": 0.6482115983963013,
3
+ "eval_runtime": 149.9453,
4
  "eval_samples": 3639,
5
+ "eval_samples_per_second": 24.269,
6
+ "eval_steps_per_second": 0.76
7
  }