BigXYZ committed on
Commit
a7e11b4
·
verified ·
1 Parent(s): f96106d

End of training

Browse files
README.md CHANGED
@@ -1,16 +1,19 @@
1
  ---
 
 
2
  library_name: transformers
3
- model_name: Meta-Llama-3.1-8B-dpo-full
4
  tags:
5
  - generated_from_trainer
 
6
  - trl
7
  - dpo
8
  licence: license
9
  ---
10
 
11
- # Model Card for Meta-Llama-3.1-8B-dpo-full
12
 
13
- This model is a fine-tuned version of [None](https://huggingface.co/None).
14
  It has been trained using [TRL](https://github.com/huggingface/trl).
15
 
16
  ## Quick start
 
1
  ---
2
+ datasets:
3
+ - HuggingFaceH4/ultrafeedback_binarized
4
  library_name: transformers
5
+ model_name: data/Meta-Llama-3.1-8B-sft-full
6
  tags:
7
  - generated_from_trainer
8
+ - alignment-handbook
9
  - trl
10
  - dpo
11
  licence: license
12
  ---
13
 
14
+ # Model Card for data/Meta-Llama-3.1-8B-sft-full
15
 
16
+ This model is a fine-tuned version of [None](https://huggingface.co/None) on the [HuggingFaceH4/ultrafeedback_binarized](https://huggingface.co/datasets/HuggingFaceH4/ultrafeedback_binarized) dataset.
17
  It has been trained using [TRL](https://github.com/huggingface/trl).
18
 
19
  ## Quick start
all_results.json CHANGED
@@ -1,5 +1,18 @@
1
  {
2
  "epoch": 1.0,
 
 
 
 
 
 
 
 
 
 
 
 
 
3
  "total_flos": 0.0,
4
  "train_loss": 1.1715184933969665,
5
  "train_runtime": 4575.3933,
 
1
  {
2
  "epoch": 1.0,
3
+ "eval_logits/chosen": -0.90234375,
4
+ "eval_logits/rejected": -0.84765625,
5
+ "eval_logps/chosen": -370.0,
6
+ "eval_logps/rejected": -440.0,
7
+ "eval_loss": 0.5435234308242798,
8
+ "eval_rewards/accuracies": 0.7734375,
9
+ "eval_rewards/chosen": -0.80859375,
10
+ "eval_rewards/margins": 0.66015625,
11
+ "eval_rewards/rejected": -1.46875,
12
+ "eval_runtime": 44.7378,
13
+ "eval_samples": 2000,
14
+ "eval_samples_per_second": 44.705,
15
+ "eval_steps_per_second": 0.715,
16
  "total_flos": 0.0,
17
  "train_loss": 1.1715184933969665,
18
  "train_runtime": 4575.3933,
config.json CHANGED
@@ -31,6 +31,6 @@
31
  "tie_word_embeddings": false,
32
  "torch_dtype": "bfloat16",
33
  "transformers_version": "4.46.0",
34
- "use_cache": false,
35
  "vocab_size": 128256
36
  }
 
31
  "tie_word_embeddings": false,
32
  "torch_dtype": "bfloat16",
33
  "transformers_version": "4.46.0",
34
+ "use_cache": true,
35
  "vocab_size": 128256
36
  }
eval_results.json ADDED
@@ -0,0 +1,16 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.0,
3
+ "eval_logits/chosen": -0.90234375,
4
+ "eval_logits/rejected": -0.84765625,
5
+ "eval_logps/chosen": -370.0,
6
+ "eval_logps/rejected": -440.0,
7
+ "eval_loss": 0.5435234308242798,
8
+ "eval_rewards/accuracies": 0.7734375,
9
+ "eval_rewards/chosen": -0.80859375,
10
+ "eval_rewards/margins": 0.66015625,
11
+ "eval_rewards/rejected": -1.46875,
12
+ "eval_runtime": 44.7378,
13
+ "eval_samples": 2000,
14
+ "eval_samples_per_second": 44.705,
15
+ "eval_steps_per_second": 0.715
16
+ }
runs/Feb18_05-02-46_h-80-8-a-01/events.out.tfevents.1739860071.h-80-8-a-01.2047664.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:76ed93ab9d2aab5193889e01d402a3edc4ce3fbdc21a10295874a128ea62e841
3
+ size 828