End of training

Browse files

Files changed (5) hide show

README.md +2 -1
all_results.json +8 -0
train_results.json +8 -0
trainer_state.json +484 -0
training_loss.png +0 -0

README.md CHANGED Viewed

@@ -4,6 +4,7 @@ license: apache-2.0
 base_model: Qwen/Qwen2.5-32B-Instruct
 tags:
 - llama-factory
 - generated_from_trainer
 model-index:
 - name: gaia_qwen2_32B
@@ -15,7 +16,7 @@ should probably proofread and complete it, then remove this comment. -->
 # gaia_qwen2_32B
-This model is a fine-tuned version of [Qwen/Qwen2.5-32B-Instruct](https://huggingface.co/Qwen/Qwen2.5-32B-Instruct) on the None dataset.
 ## Model description

 base_model: Qwen/Qwen2.5-32B-Instruct
 tags:
 - llama-factory
+- full
 - generated_from_trainer
 model-index:
 - name: gaia_qwen2_32B
 # gaia_qwen2_32B
+This model is a fine-tuned version of [Qwen/Qwen2.5-32B-Instruct](https://huggingface.co/Qwen/Qwen2.5-32B-Instruct) on the claude_gaia_1, the claude_gaia_2 and the claude_gaia_3 datasets.
 ## Model description

all_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 2.8976377952755907,
+    "total_flos": 1.2506626070990029e+17,
+    "train_loss": 0.2051201125695592,
+    "train_runtime": 45189.9744,
+    "train_samples_per_second": 0.05,
+    "train_steps_per_second": 0.001
+}

train_results.json ADDED Viewed

	@@ -0,0 +1,8 @@

+{
+    "epoch": 2.8976377952755907,
+    "total_flos": 1.2506626070990029e+17,
+    "train_loss": 0.2051201125695592,
+    "train_runtime": 45189.9744,
+    "train_samples_per_second": 0.05,
+    "train_steps_per_second": 0.001
+}

trainer_state.json ADDED Viewed

	@@ -0,0 +1,484 @@

+{
+  "best_global_step": null,
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 2.8976377952755907,
+  "eval_steps": 500,
+  "global_step": 63,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.047244094488188976,
+      "grad_norm": 3.6492302417755127,
+      "learning_rate": 1.4285714285714286e-06,
+      "loss": 0.4012,
+      "step": 1
+    },
+    {
+      "epoch": 0.09448818897637795,
+      "grad_norm": 2.7150280475616455,
+      "learning_rate": 2.8571428571428573e-06,
+      "loss": 0.3317,
+      "step": 2
+    },
+    {
+      "epoch": 0.14173228346456693,
+      "grad_norm": 4.509909629821777,
+      "learning_rate": 4.2857142857142855e-06,
+      "loss": 0.4663,
+      "step": 3
+    },
+    {
+      "epoch": 0.1889763779527559,
+      "grad_norm": 3.650169849395752,
+      "learning_rate": 5.7142857142857145e-06,
+      "loss": 0.4662,
+      "step": 4
+    },
+    {
+      "epoch": 0.23622047244094488,
+      "grad_norm": 1.761392593383789,
+      "learning_rate": 7.1428571428571436e-06,
+      "loss": 0.3292,
+      "step": 5
+    },
+    {
+      "epoch": 0.28346456692913385,
+      "grad_norm": 1.1722800731658936,
+      "learning_rate": 8.571428571428571e-06,
+      "loss": 0.2505,
+      "step": 6
+    },
+    {
+      "epoch": 0.33070866141732286,
+      "grad_norm": 1.3030749559402466,
+      "learning_rate": 1e-05,
+      "loss": 0.2786,
+      "step": 7
+    },
+    {
+      "epoch": 0.3779527559055118,
+      "grad_norm": 1.4660409688949585,
+      "learning_rate": 9.992134075089085e-06,
+      "loss": 0.3788,
+      "step": 8
+    },
+    {
+      "epoch": 0.4251968503937008,
+      "grad_norm": 2.589200735092163,
+      "learning_rate": 9.968561049466214e-06,
+      "loss": 0.3087,
+      "step": 9
+    },
+    {
+      "epoch": 0.47244094488188976,
+      "grad_norm": 2.669886827468872,
+      "learning_rate": 9.92935509259118e-06,
+      "loss": 0.3672,
+      "step": 10
+    },
+    {
+      "epoch": 0.5196850393700787,
+      "grad_norm": 1.486991286277771,
+      "learning_rate": 9.874639560909118e-06,
+      "loss": 0.275,
+      "step": 11
+    },
+    {
+      "epoch": 0.5669291338582677,
+      "grad_norm": 1.572901964187622,
+      "learning_rate": 9.804586609725499e-06,
+      "loss": 0.309,
+      "step": 12
+    },
+    {
+      "epoch": 0.6141732283464567,
+      "grad_norm": 1.242970585823059,
+      "learning_rate": 9.719416651541839e-06,
+      "loss": 0.2988,
+      "step": 13
+    },
+    {
+      "epoch": 0.6614173228346457,
+      "grad_norm": 1.272771954536438,
+      "learning_rate": 9.619397662556434e-06,
+      "loss": 0.3199,
+      "step": 14
+    },
+    {
+      "epoch": 0.7086614173228346,
+      "grad_norm": 1.215131163597107,
+      "learning_rate": 9.504844339512096e-06,
+      "loss": 0.2371,
+      "step": 15
+    },
+    {
+      "epoch": 0.7559055118110236,
+      "grad_norm": 1.2442128658294678,
+      "learning_rate": 9.376117109543769e-06,
+      "loss": 0.2661,
+      "step": 16
+    },
+    {
+      "epoch": 0.8031496062992126,
+      "grad_norm": 1.0294448137283325,
+      "learning_rate": 9.233620996141421e-06,
+      "loss": 0.2356,
+      "step": 17
+    },
+    {
+      "epoch": 0.8503937007874016,
+      "grad_norm": 1.2284340858459473,
+      "learning_rate": 9.077804344796302e-06,
+      "loss": 0.2911,
+      "step": 18
+    },
+    {
+      "epoch": 0.8976377952755905,
+      "grad_norm": 0.817711353302002,
+      "learning_rate": 8.90915741234015e-06,
+      "loss": 0.238,
+      "step": 19
+    },
+    {
+      "epoch": 0.9448818897637795,
+      "grad_norm": 1.085610032081604,
+      "learning_rate": 8.728210824415829e-06,
+      "loss": 0.2162,
+      "step": 20
+    },
+    {
+      "epoch": 0.9921259842519685,
+      "grad_norm": 0.7799460887908936,
+      "learning_rate": 8.535533905932739e-06,
+      "loss": 0.2419,
+      "step": 21
+    },
+    {
+      "epoch": 1.0,
+      "grad_norm": 0.7799460887908936,
+      "learning_rate": 8.331732889760021e-06,
+      "loss": 0.271,
+      "step": 22
+    },
+    {
+      "epoch": 1.047244094488189,
+      "grad_norm": 5.261403560638428,
+      "learning_rate": 8.117449009293668e-06,
+      "loss": 0.1911,
+      "step": 23
+    },
+    {
+      "epoch": 1.094488188976378,
+      "grad_norm": 0.7940455675125122,
+      "learning_rate": 7.89335648089903e-06,
+      "loss": 0.2041,
+      "step": 24
+    },
+    {
+      "epoch": 1.141732283464567,
+      "grad_norm": 1.4895520210266113,
+      "learning_rate": 7.660160382576683e-06,
+      "loss": 0.1895,
+      "step": 25
+    },
+    {
+      "epoch": 1.188976377952756,
+      "grad_norm": 0.8921546936035156,
+      "learning_rate": 7.4185944355261996e-06,
+      "loss": 0.1575,
+      "step": 26
+    },
+    {
+      "epoch": 1.236220472440945,
+      "grad_norm": 0.9935773611068726,
+      "learning_rate": 7.169418695587791e-06,
+      "loss": 0.194,
+      "step": 27
+    },
+    {
+      "epoch": 1.2834645669291338,
+      "grad_norm": 0.9794341921806335,
+      "learning_rate": 6.913417161825449e-06,
+      "loss": 0.2202,
+      "step": 28
+    },
+    {
+      "epoch": 1.330708661417323,
+      "grad_norm": 0.8670676946640015,
+      "learning_rate": 6.651395309775837e-06,
+      "loss": 0.1789,
+      "step": 29
+    },
+    {
+      "epoch": 1.3779527559055118,
+      "grad_norm": 1.1269317865371704,
+      "learning_rate": 6.384177557124247e-06,
+      "loss": 0.2017,
+      "step": 30
+    },
+    {
+      "epoch": 1.425196850393701,
+      "grad_norm": 1.1137402057647705,
+      "learning_rate": 6.112604669781572e-06,
+      "loss": 0.1751,
+      "step": 31
+    },
+    {
+      "epoch": 1.4724409448818898,
+      "grad_norm": 0.9292981624603271,
+      "learning_rate": 5.837531116523683e-06,
+      "loss": 0.1893,
+      "step": 32
+    },
+    {
+      "epoch": 1.5196850393700787,
+      "grad_norm": 0.8478426933288574,
+      "learning_rate": 5.559822380516539e-06,
+      "loss": 0.1381,
+      "step": 33
+    },
+    {
+      "epoch": 1.5669291338582676,
+      "grad_norm": 0.759232223033905,
+      "learning_rate": 5.2803522361859596e-06,
+      "loss": 0.1584,
+      "step": 34
+    },
+    {
+      "epoch": 1.6141732283464567,
+      "grad_norm": 1.4674817323684692,
+      "learning_rate": 5e-06,
+      "loss": 0.1839,
+      "step": 35
+    },
+    {
+      "epoch": 1.6614173228346458,
+      "grad_norm": 0.900875985622406,
+      "learning_rate": 4.719647763814041e-06,
+      "loss": 0.1776,
+      "step": 36
+    },
+    {
+      "epoch": 1.7086614173228347,
+      "grad_norm": 0.7754679322242737,
+      "learning_rate": 4.4401776194834615e-06,
+      "loss": 0.1667,
+      "step": 37
+    },
+    {
+      "epoch": 1.7559055118110236,
+      "grad_norm": 0.8453861474990845,
+      "learning_rate": 4.162468883476319e-06,
+      "loss": 0.1421,
+      "step": 38
+    },
+    {
+      "epoch": 1.8031496062992125,
+      "grad_norm": 0.7882893085479736,
+      "learning_rate": 3.887395330218429e-06,
+      "loss": 0.1543,
+      "step": 39
+    },
+    {
+      "epoch": 1.8503937007874016,
+      "grad_norm": 1.541914701461792,
+      "learning_rate": 3.6158224428757538e-06,
+      "loss": 0.1796,
+      "step": 40
+    },
+    {
+      "epoch": 1.8976377952755905,
+      "grad_norm": 0.989794909954071,
+      "learning_rate": 3.3486046902241663e-06,
+      "loss": 0.1771,
+      "step": 41
+    },
+    {
+      "epoch": 1.9448818897637796,
+      "grad_norm": 1.0352776050567627,
+      "learning_rate": 3.0865828381745515e-06,
+      "loss": 0.163,
+      "step": 42
+    },
+    {
+      "epoch": 1.9921259842519685,
+      "grad_norm": 1.0325061082839966,
+      "learning_rate": 2.83058130441221e-06,
+      "loss": 0.1518,
+      "step": 43
+    },
+    {
+      "epoch": 2.0,
+      "grad_norm": 1.0325061082839966,
+      "learning_rate": 2.5814055644738013e-06,
+      "loss": 0.1685,
+      "step": 44
+    },
+    {
+      "epoch": 2.047244094488189,
+      "grad_norm": 2.2215065956115723,
+      "learning_rate": 2.339839617423318e-06,
+      "loss": 0.135,
+      "step": 45
+    },
+    {
+      "epoch": 2.094488188976378,
+      "grad_norm": 0.8818472027778625,
+      "learning_rate": 2.1066435191009717e-06,
+      "loss": 0.1472,
+      "step": 46
+    },
+    {
+      "epoch": 2.141732283464567,
+      "grad_norm": 1.6831822395324707,
+      "learning_rate": 1.8825509907063328e-06,
+      "loss": 0.1161,
+      "step": 47
+    },
+    {
+      "epoch": 2.188976377952756,
+      "grad_norm": 0.5498701930046082,
+      "learning_rate": 1.6682671102399806e-06,
+      "loss": 0.0941,
+      "step": 48
+    },
+    {
+      "epoch": 2.236220472440945,
+      "grad_norm": 0.9785574078559875,
+      "learning_rate": 1.4644660940672628e-06,
+      "loss": 0.1614,
+      "step": 49
+    },
+    {
+      "epoch": 2.283464566929134,
+      "grad_norm": 0.9736632704734802,
+      "learning_rate": 1.2717891755841722e-06,
+      "loss": 0.1533,
+      "step": 50
+    },
+    {
+      "epoch": 2.3307086614173227,
+      "grad_norm": 1.1105008125305176,
+      "learning_rate": 1.0908425876598512e-06,
+      "loss": 0.1051,
+      "step": 51
+    },
+    {
+      "epoch": 2.377952755905512,
+      "grad_norm": 0.4693005383014679,
+      "learning_rate": 9.221956552036992e-07,
+      "loss": 0.0923,
+      "step": 52
+    },
+    {
+      "epoch": 2.425196850393701,
+      "grad_norm": 0.9733160138130188,
+      "learning_rate": 7.663790038585794e-07,
+      "loss": 0.0977,
+      "step": 53
+    },
+    {
+      "epoch": 2.47244094488189,
+      "grad_norm": 0.7047190070152283,
+      "learning_rate": 6.238828904562316e-07,
+      "loss": 0.1154,
+      "step": 54
+    },
+    {
+      "epoch": 2.5196850393700787,
+      "grad_norm": 1.1957942247390747,
+      "learning_rate": 4.951556604879049e-07,
+      "loss": 0.1237,
+      "step": 55
+    },
+    {
+      "epoch": 2.5669291338582676,
+      "grad_norm": 0.6617165207862854,
+      "learning_rate": 3.8060233744356634e-07,
+      "loss": 0.1042,
+      "step": 56
+    },
+    {
+      "epoch": 2.6141732283464565,
+      "grad_norm": 0.8499227166175842,
+      "learning_rate": 2.8058334845816214e-07,
+      "loss": 0.1259,
+      "step": 57
+    },
+    {
+      "epoch": 2.661417322834646,
+      "grad_norm": 0.8625606298446655,
+      "learning_rate": 1.9541339027450256e-07,
+      "loss": 0.1105,
+      "step": 58
+    },
+    {
+      "epoch": 2.7086614173228347,
+      "grad_norm": 0.6735402941703796,
+      "learning_rate": 1.253604390908819e-07,
+      "loss": 0.1063,
+      "step": 59
+    },
+    {
+      "epoch": 2.7559055118110236,
+      "grad_norm": 0.753610372543335,
+      "learning_rate": 7.064490740882057e-08,
+      "loss": 0.1343,
+      "step": 60
+    },
+    {
+      "epoch": 2.8031496062992125,
+      "grad_norm": 0.7327992916107178,
+      "learning_rate": 3.143895053378698e-08,
+      "loss": 0.1197,
+      "step": 61
+    },
+    {
+      "epoch": 2.850393700787402,
+      "grad_norm": 0.829689621925354,
+      "learning_rate": 7.865924910916977e-09,
+      "loss": 0.1359,
+      "step": 62
+    },
+    {
+      "epoch": 2.8976377952755907,
+      "grad_norm": 0.7220540046691895,
+      "learning_rate": 0.0,
+      "loss": 0.1042,
+      "step": 63
+    },
+    {
+      "epoch": 2.8976377952755907,
+      "step": 63,
+      "total_flos": 1.2506626070990029e+17,
+      "train_loss": 0.2051201125695592,
+      "train_runtime": 45189.9744,
+      "train_samples_per_second": 0.05,
+      "train_steps_per_second": 0.001
+    }
+  ],
+  "logging_steps": 1,
+  "max_steps": 63,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 20,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.2506626070990029e+17,
+  "train_batch_size": 1,
+  "trial_name": null,
+  "trial_params": null
+}

training_loss.png ADDED Viewed