furmaniak committed on
Commit
2e43702
·
verified ·
1 Parent(s): 1df1b46

Trained with Unsloth

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. README.md +1 -0
  2. config.json +43 -0
  3. generation_config.json +14 -0
  4. model-00001-of-00061.safetensors +3 -0
  5. model-00002-of-00061.safetensors +3 -0
  6. model-00003-of-00061.safetensors +3 -0
  7. model-00004-of-00061.safetensors +3 -0
  8. model-00005-of-00061.safetensors +3 -0
  9. model-00006-of-00061.safetensors +3 -0
  10. model-00007-of-00061.safetensors +3 -0
  11. model-00008-of-00061.safetensors +3 -0
  12. model-00009-of-00061.safetensors +3 -0
  13. model-00010-of-00061.safetensors +3 -0
  14. model-00011-of-00061.safetensors +3 -0
  15. model-00012-of-00061.safetensors +3 -0
  16. model-00013-of-00061.safetensors +3 -0
  17. model-00014-of-00061.safetensors +3 -0
  18. model-00015-of-00061.safetensors +3 -0
  19. model-00016-of-00061.safetensors +3 -0
  20. model-00017-of-00061.safetensors +3 -0
  21. model-00018-of-00061.safetensors +3 -0
  22. model-00019-of-00061.safetensors +3 -0
  23. model-00020-of-00061.safetensors +3 -0
  24. model-00021-of-00061.safetensors +3 -0
  25. model-00022-of-00061.safetensors +3 -0
  26. model-00023-of-00061.safetensors +3 -0
  27. model-00024-of-00061.safetensors +3 -0
  28. model-00025-of-00061.safetensors +3 -0
  29. model-00026-of-00061.safetensors +3 -0
  30. model-00027-of-00061.safetensors +3 -0
  31. model-00028-of-00061.safetensors +3 -0
  32. model-00029-of-00061.safetensors +3 -0
  33. model-00030-of-00061.safetensors +3 -0
  34. model-00031-of-00061.safetensors +3 -0
  35. model-00032-of-00061.safetensors +3 -0
  36. model-00033-of-00061.safetensors +3 -0
  37. model-00034-of-00061.safetensors +3 -0
  38. model-00035-of-00061.safetensors +3 -0
  39. model-00036-of-00061.safetensors +3 -0
  40. model-00037-of-00061.safetensors +3 -0
  41. model-00038-of-00061.safetensors +3 -0
  42. model-00039-of-00061.safetensors +3 -0
  43. model-00040-of-00061.safetensors +3 -0
  44. model-00041-of-00061.safetensors +3 -0
  45. model-00042-of-00061.safetensors +3 -0
  46. model-00043-of-00061.safetensors +3 -0
  47. model-00044-of-00061.safetensors +3 -0
  48. model-00045-of-00061.safetensors +3 -0
  49. model-00046-of-00061.safetensors +3 -0
  50. model-00047-of-00061.safetensors +3 -0
README.md CHANGED
@@ -6,6 +6,7 @@ tags:
6
  - unsloth
7
  - llama
8
  - trl
 
9
  license: apache-2.0
10
  language:
11
  - en
 
6
  - unsloth
7
  - llama
8
  - trl
9
+ - sft
10
  license: apache-2.0
11
  language:
12
  - en
config.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "unsloth/Llama-3.3-70B-Instruct-bnb-4bit",
3
+ "architectures": [
4
+ "LlamaForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 128000,
9
+ "eos_token_id": [
10
+ 128001,
11
+ 128008,
12
+ 128009
13
+ ],
14
+ "head_dim": 128,
15
+ "hidden_act": "silu",
16
+ "hidden_size": 8192,
17
+ "initializer_range": 0.02,
18
+ "intermediate_size": 28672,
19
+ "max_position_embeddings": 131072,
20
+ "mlp_bias": false,
21
+ "model_type": "llama",
22
+ "num_attention_heads": 64,
23
+ "num_hidden_layers": 80,
24
+ "num_key_value_heads": 8,
25
+ "pad_token_id": 128004,
26
+ "pretraining_tp": 1,
27
+ "rms_norm_eps": 1e-05,
28
+ "rope_scaling": {
29
+ "factor": 8.0,
30
+ "high_freq_factor": 4.0,
31
+ "low_freq_factor": 1.0,
32
+ "original_max_position_embeddings": 8192,
33
+ "rope_type": "llama3"
34
+ },
35
+ "rope_theta": 500000.0,
36
+ "tie_word_embeddings": false,
37
+ "torch_dtype": "bfloat16",
38
+ "transformers_version": "4.46.3",
39
+ "unsloth_fixed": true,
40
+ "unsloth_version": "2024.12.4",
41
+ "use_cache": true,
42
+ "vocab_size": 128256
43
+ }
generation_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "bos_token_id": 128000,
3
+ "do_sample": true,
4
+ "eos_token_id": [
5
+ 128001,
6
+ 128008,
7
+ 128009
8
+ ],
9
+ "max_length": 131072,
10
+ "pad_token_id": 128004,
11
+ "temperature": 0.6,
12
+ "top_p": 0.9,
13
+ "transformers_version": "4.46.3"
14
+ }
model-00001-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:59f06c3445375fa31d92fde9cf3d2c5a176377d3b7d5556ffbbc6f068926abef
3
+ size 4584375104
model-00002-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:600a10bd2c756f57ec7ff2260b44466ceac32fe686e62058898b51f4bb8e883b
3
+ size 4966123352
model-00003-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3b6c6fb29eca0081d83015c38e01f5f8982cc450e3d0c20f73582245691259f
3
+ size 4362110112
model-00004-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d95518c033a3db3432bdbbee30db94f6d9b03b5609044be81cab93d65702c406
3
+ size 4362110104
model-00005-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:16f03ea61c140c0fa0eb8b1c72291efa81c4cdd79ab2d1915309bf1f0beab917
3
+ size 4966123352
model-00006-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dae7fd27a478f158fc571747165e0c910c23370710a37deb949ac6c5333dca58
3
+ size 4362110112
model-00007-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6ca9153770626b5c2d310db809fe36629a614541d1e1776b8e4d5c0fc1816bb
3
+ size 4362110104
model-00008-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf180ca16e8811fd716d4361f66646649176a4a0f1fb62185c12dfc640f1cbe6
3
+ size 4966123344
model-00009-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c3eafede44f0b32ab45323219f10596227b02bc6435f224d55347cd6e1132f84
3
+ size 4362110120
model-00010-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d923fbd5c0bc207346307c52d7634f08a4fcd4457ea350779c670c34c2529d60
3
+ size 4362110120
model-00011-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d092d302a0ad2934df30d9044a8fd3fcaa952e8d4ba8ab9ba6c434d39d6b1ae4
3
+ size 4966123368
model-00012-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b29f86f8927a5b2f9d3cb82a6cafc1f7234527e691e350dc81da6e7512313cc
3
+ size 4362110120
model-00013-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:817c94af6dc7b6f062af3898f0faabb36e57a87915d8188521f25b126fe13924
3
+ size 4362110120
model-00014-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf21c80e158af52d90ead220fd267bfd8828f718cabf79f73b626a9f243c486f
3
+ size 4966123368
model-00015-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:202f5bcfb5420fae56b4e4e893dbb52d36d3e87f041fdf036bad0e76d4dfdda2
3
+ size 4362110120
model-00016-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83ccd01dc18787c1f72309905c4d620e18833a1a2588eec598b77d003c45b1ca
3
+ size 4362110120
model-00017-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c3a31d44ce9b32a4086b46558cc7e70eed25b45ab3bd4c09ca0464838285ffd
3
+ size 4966123368
model-00018-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7e615257ea1f9223e127482397a37e4d1e0d1c09e705c37b9ba9afa257a17d2
3
+ size 4362110120
model-00019-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db8844e7d26de9d76ee6e02e1a2681cd433910b7f012d9c9865d8cccbb9f4ff3
3
+ size 4362110120
model-00020-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:47c336c46aca34e6ce677a7d7a94eadfbe18cca3c2f84d24f8ad1afa23237552
3
+ size 4966123368
model-00021-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8ee4db0091248a838ad8586a0122dbd2c59967bd544197f8cc6bd8c452de172d
3
+ size 4362110120
model-00022-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:de6cc6b562906b459fc1fc630437c378d85328bcee3ca315689cb212cb0cb0c5
3
+ size 4362110120
model-00023-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a51a597d1f5814c21fc439bcc0d1e2184ba3c436331a2627ca67032fc6898ba
3
+ size 4966123368
model-00024-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:878737db20f26f179a27bd70ccca8b61a33e4698158ab345372383cbe5ce9dae
3
+ size 4362110120
model-00025-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4213ee4d985a1f53eca503ace2af0c3c2873ca45a66ab5e861d0bdec12c6a7a8
3
+ size 4362110120
model-00026-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c644a1dbb4b63cd6dd7e773b56d059879e2ce604ab9476347c1e1452e9dee76e
3
+ size 4966123368
model-00027-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8d01101a7797fde2b463c3b165258db23ff947a19f8813b7815281ba9637369
3
+ size 4362110120
model-00028-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f6cc99e8fd0f02a6a3af3035c9e8ef0e314c4e7fbc3943cf6a6ea9027766dd4
3
+ size 4362110120
model-00029-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c291f214bd9efe020cbccc7981456166c86900ae6d05e98081623d9e5c446c9
3
+ size 4966123368
model-00030-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6a136cf6116d74ff28a53463c2773e2e4c42f57f50eb64c75c5d5d6dbe324b1d
3
+ size 4362110120
model-00031-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0877c94c5aebeafd0d8bfb9bafba66876fea5fa5ddd9b61fd4f4450505d33d24
3
+ size 4362110120
model-00032-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66553bdd47ae92b4cfeb66ce69ee0b219ca7bc010080135253df26c19a1942f6
3
+ size 4966123368
model-00033-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc1144165098eaf0ceb72b9e460cd98b01dd8046d7ebbb68ceb2adcb4ad1706c
3
+ size 4362110120
model-00034-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b67f276ce200477adbf93204ec099b6d2322abfaf7bd57ae1290a0b32051831d
3
+ size 4362110120
model-00035-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ad70bbe2ce2e5bae8d1984db6ed1e6e9ec7438b6b094078de393996b5fc371e
3
+ size 4966123368
model-00036-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:007ec2a21e83a1d6e2a040bfa5657f044ea4076f4f66c01f1635df0d1dd6d4a2
3
+ size 4362110120
model-00037-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52abefa32d54233fe2712882b391bf33138e69bcb96e114df23a9f78abf71b37
3
+ size 4362110120
model-00038-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4682a32d9d9d58b76c0ceeaaa045f67a1e2eef41438b7e17f91f6502e6908281
3
+ size 4966123368
model-00039-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c5b2e3b5bb7ceb72ac94e1ffd20e456d6a07559d47f26bb1f536223cc67a957
3
+ size 4362110120
model-00040-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3b8fd64e15db0f6277afc54959fc2cab21bbba6d219adfef480ef9347d946ea
3
+ size 4362110120
model-00041-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d29e896662b19b2416ea05b0f67ae34a1696fb039d3f8ddd86eaf7db9fe7856c
3
+ size 4966123368
model-00042-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2c3d420305fb40590aeac15f4f9078584b046e0913420a57363b1c1be81c57e0
3
+ size 4362110120
model-00043-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c5172c70c5dfdbef12779ba0d5c9cb26769cf532172bee288eca182ab8fdfec
3
+ size 4362110120
model-00044-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7f65ba0834720ec1e33c26e2addf38572338e0305dd925121b7c3f70abe51b6
3
+ size 4966123368
model-00045-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd14a3d853f8f00e8e25eae0a94d70aee8619cc6a5d5dec742dab2d06b0d5586
3
+ size 4362110120
model-00046-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd3a3fdd9739853866ca0b2fb414acb2c509a486ae5cdc6bc7d32afd77baac8
3
+ size 4362110120
model-00047-of-00061.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4e53e7a8566c184933834abecdaac9a7b3af7b0e70930b5067c0ce235f0f020
3
+ size 4966123368