Trained with Unsloth
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +1 -0
- config.json +43 -0
- generation_config.json +14 -0
- model-00001-of-00061.safetensors +3 -0
- model-00002-of-00061.safetensors +3 -0
- model-00003-of-00061.safetensors +3 -0
- model-00004-of-00061.safetensors +3 -0
- model-00005-of-00061.safetensors +3 -0
- model-00006-of-00061.safetensors +3 -0
- model-00007-of-00061.safetensors +3 -0
- model-00008-of-00061.safetensors +3 -0
- model-00009-of-00061.safetensors +3 -0
- model-00010-of-00061.safetensors +3 -0
- model-00011-of-00061.safetensors +3 -0
- model-00012-of-00061.safetensors +3 -0
- model-00013-of-00061.safetensors +3 -0
- model-00014-of-00061.safetensors +3 -0
- model-00015-of-00061.safetensors +3 -0
- model-00016-of-00061.safetensors +3 -0
- model-00017-of-00061.safetensors +3 -0
- model-00018-of-00061.safetensors +3 -0
- model-00019-of-00061.safetensors +3 -0
- model-00020-of-00061.safetensors +3 -0
- model-00021-of-00061.safetensors +3 -0
- model-00022-of-00061.safetensors +3 -0
- model-00023-of-00061.safetensors +3 -0
- model-00024-of-00061.safetensors +3 -0
- model-00025-of-00061.safetensors +3 -0
- model-00026-of-00061.safetensors +3 -0
- model-00027-of-00061.safetensors +3 -0
- model-00028-of-00061.safetensors +3 -0
- model-00029-of-00061.safetensors +3 -0
- model-00030-of-00061.safetensors +3 -0
- model-00031-of-00061.safetensors +3 -0
- model-00032-of-00061.safetensors +3 -0
- model-00033-of-00061.safetensors +3 -0
- model-00034-of-00061.safetensors +3 -0
- model-00035-of-00061.safetensors +3 -0
- model-00036-of-00061.safetensors +3 -0
- model-00037-of-00061.safetensors +3 -0
- model-00038-of-00061.safetensors +3 -0
- model-00039-of-00061.safetensors +3 -0
- model-00040-of-00061.safetensors +3 -0
- model-00041-of-00061.safetensors +3 -0
- model-00042-of-00061.safetensors +3 -0
- model-00043-of-00061.safetensors +3 -0
- model-00044-of-00061.safetensors +3 -0
- model-00045-of-00061.safetensors +3 -0
- model-00046-of-00061.safetensors +3 -0
- model-00047-of-00061.safetensors +3 -0
README.md
CHANGED
@@ -6,6 +6,7 @@ tags:
|
|
6 |
- unsloth
|
7 |
- llama
|
8 |
- trl
|
|
|
9 |
license: apache-2.0
|
10 |
language:
|
11 |
- en
|
|
|
6 |
- unsloth
|
7 |
- llama
|
8 |
- trl
|
9 |
+
- sft
|
10 |
license: apache-2.0
|
11 |
language:
|
12 |
- en
|
config.json
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "unsloth/Llama-3.3-70B-Instruct-bnb-4bit",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 128000,
|
9 |
+
"eos_token_id": [
|
10 |
+
128001,
|
11 |
+
128008,
|
12 |
+
128009
|
13 |
+
],
|
14 |
+
"head_dim": 128,
|
15 |
+
"hidden_act": "silu",
|
16 |
+
"hidden_size": 8192,
|
17 |
+
"initializer_range": 0.02,
|
18 |
+
"intermediate_size": 28672,
|
19 |
+
"max_position_embeddings": 131072,
|
20 |
+
"mlp_bias": false,
|
21 |
+
"model_type": "llama",
|
22 |
+
"num_attention_heads": 64,
|
23 |
+
"num_hidden_layers": 80,
|
24 |
+
"num_key_value_heads": 8,
|
25 |
+
"pad_token_id": 128004,
|
26 |
+
"pretraining_tp": 1,
|
27 |
+
"rms_norm_eps": 1e-05,
|
28 |
+
"rope_scaling": {
|
29 |
+
"factor": 8.0,
|
30 |
+
"high_freq_factor": 4.0,
|
31 |
+
"low_freq_factor": 1.0,
|
32 |
+
"original_max_position_embeddings": 8192,
|
33 |
+
"rope_type": "llama3"
|
34 |
+
},
|
35 |
+
"rope_theta": 500000.0,
|
36 |
+
"tie_word_embeddings": false,
|
37 |
+
"torch_dtype": "bfloat16",
|
38 |
+
"transformers_version": "4.46.3",
|
39 |
+
"unsloth_fixed": true,
|
40 |
+
"unsloth_version": "2024.12.4",
|
41 |
+
"use_cache": true,
|
42 |
+
"vocab_size": 128256
|
43 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 128000,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
128001,
|
6 |
+
128008,
|
7 |
+
128009
|
8 |
+
],
|
9 |
+
"max_length": 131072,
|
10 |
+
"pad_token_id": 128004,
|
11 |
+
"temperature": 0.6,
|
12 |
+
"top_p": 0.9,
|
13 |
+
"transformers_version": "4.46.3"
|
14 |
+
}
|
model-00001-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:59f06c3445375fa31d92fde9cf3d2c5a176377d3b7d5556ffbbc6f068926abef
|
3 |
+
size 4584375104
|
model-00002-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:600a10bd2c756f57ec7ff2260b44466ceac32fe686e62058898b51f4bb8e883b
|
3 |
+
size 4966123352
|
model-00003-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3b6c6fb29eca0081d83015c38e01f5f8982cc450e3d0c20f73582245691259f
|
3 |
+
size 4362110112
|
model-00004-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d95518c033a3db3432bdbbee30db94f6d9b03b5609044be81cab93d65702c406
|
3 |
+
size 4362110104
|
model-00005-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16f03ea61c140c0fa0eb8b1c72291efa81c4cdd79ab2d1915309bf1f0beab917
|
3 |
+
size 4966123352
|
model-00006-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dae7fd27a478f158fc571747165e0c910c23370710a37deb949ac6c5333dca58
|
3 |
+
size 4362110112
|
model-00007-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a6ca9153770626b5c2d310db809fe36629a614541d1e1776b8e4d5c0fc1816bb
|
3 |
+
size 4362110104
|
model-00008-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf180ca16e8811fd716d4361f66646649176a4a0f1fb62185c12dfc640f1cbe6
|
3 |
+
size 4966123344
|
model-00009-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c3eafede44f0b32ab45323219f10596227b02bc6435f224d55347cd6e1132f84
|
3 |
+
size 4362110120
|
model-00010-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d923fbd5c0bc207346307c52d7634f08a4fcd4457ea350779c670c34c2529d60
|
3 |
+
size 4362110120
|
model-00011-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d092d302a0ad2934df30d9044a8fd3fcaa952e8d4ba8ab9ba6c434d39d6b1ae4
|
3 |
+
size 4966123368
|
model-00012-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b29f86f8927a5b2f9d3cb82a6cafc1f7234527e691e350dc81da6e7512313cc
|
3 |
+
size 4362110120
|
model-00013-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:817c94af6dc7b6f062af3898f0faabb36e57a87915d8188521f25b126fe13924
|
3 |
+
size 4362110120
|
model-00014-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf21c80e158af52d90ead220fd267bfd8828f718cabf79f73b626a9f243c486f
|
3 |
+
size 4966123368
|
model-00015-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:202f5bcfb5420fae56b4e4e893dbb52d36d3e87f041fdf036bad0e76d4dfdda2
|
3 |
+
size 4362110120
|
model-00016-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83ccd01dc18787c1f72309905c4d620e18833a1a2588eec598b77d003c45b1ca
|
3 |
+
size 4362110120
|
model-00017-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c3a31d44ce9b32a4086b46558cc7e70eed25b45ab3bd4c09ca0464838285ffd
|
3 |
+
size 4966123368
|
model-00018-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7e615257ea1f9223e127482397a37e4d1e0d1c09e705c37b9ba9afa257a17d2
|
3 |
+
size 4362110120
|
model-00019-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db8844e7d26de9d76ee6e02e1a2681cd433910b7f012d9c9865d8cccbb9f4ff3
|
3 |
+
size 4362110120
|
model-00020-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:47c336c46aca34e6ce677a7d7a94eadfbe18cca3c2f84d24f8ad1afa23237552
|
3 |
+
size 4966123368
|
model-00021-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8ee4db0091248a838ad8586a0122dbd2c59967bd544197f8cc6bd8c452de172d
|
3 |
+
size 4362110120
|
model-00022-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:de6cc6b562906b459fc1fc630437c378d85328bcee3ca315689cb212cb0cb0c5
|
3 |
+
size 4362110120
|
model-00023-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a51a597d1f5814c21fc439bcc0d1e2184ba3c436331a2627ca67032fc6898ba
|
3 |
+
size 4966123368
|
model-00024-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:878737db20f26f179a27bd70ccca8b61a33e4698158ab345372383cbe5ce9dae
|
3 |
+
size 4362110120
|
model-00025-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4213ee4d985a1f53eca503ace2af0c3c2873ca45a66ab5e861d0bdec12c6a7a8
|
3 |
+
size 4362110120
|
model-00026-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c644a1dbb4b63cd6dd7e773b56d059879e2ce604ab9476347c1e1452e9dee76e
|
3 |
+
size 4966123368
|
model-00027-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8d01101a7797fde2b463c3b165258db23ff947a19f8813b7815281ba9637369
|
3 |
+
size 4362110120
|
model-00028-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f6cc99e8fd0f02a6a3af3035c9e8ef0e314c4e7fbc3943cf6a6ea9027766dd4
|
3 |
+
size 4362110120
|
model-00029-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c291f214bd9efe020cbccc7981456166c86900ae6d05e98081623d9e5c446c9
|
3 |
+
size 4966123368
|
model-00030-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6a136cf6116d74ff28a53463c2773e2e4c42f57f50eb64c75c5d5d6dbe324b1d
|
3 |
+
size 4362110120
|
model-00031-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0877c94c5aebeafd0d8bfb9bafba66876fea5fa5ddd9b61fd4f4450505d33d24
|
3 |
+
size 4362110120
|
model-00032-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66553bdd47ae92b4cfeb66ce69ee0b219ca7bc010080135253df26c19a1942f6
|
3 |
+
size 4966123368
|
model-00033-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc1144165098eaf0ceb72b9e460cd98b01dd8046d7ebbb68ceb2adcb4ad1706c
|
3 |
+
size 4362110120
|
model-00034-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b67f276ce200477adbf93204ec099b6d2322abfaf7bd57ae1290a0b32051831d
|
3 |
+
size 4362110120
|
model-00035-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ad70bbe2ce2e5bae8d1984db6ed1e6e9ec7438b6b094078de393996b5fc371e
|
3 |
+
size 4966123368
|
model-00036-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:007ec2a21e83a1d6e2a040bfa5657f044ea4076f4f66c01f1635df0d1dd6d4a2
|
3 |
+
size 4362110120
|
model-00037-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52abefa32d54233fe2712882b391bf33138e69bcb96e114df23a9f78abf71b37
|
3 |
+
size 4362110120
|
model-00038-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4682a32d9d9d58b76c0ceeaaa045f67a1e2eef41438b7e17f91f6502e6908281
|
3 |
+
size 4966123368
|
model-00039-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c5b2e3b5bb7ceb72ac94e1ffd20e456d6a07559d47f26bb1f536223cc67a957
|
3 |
+
size 4362110120
|
model-00040-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3b8fd64e15db0f6277afc54959fc2cab21bbba6d219adfef480ef9347d946ea
|
3 |
+
size 4362110120
|
model-00041-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d29e896662b19b2416ea05b0f67ae34a1696fb039d3f8ddd86eaf7db9fe7856c
|
3 |
+
size 4966123368
|
model-00042-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c3d420305fb40590aeac15f4f9078584b046e0913420a57363b1c1be81c57e0
|
3 |
+
size 4362110120
|
model-00043-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9c5172c70c5dfdbef12779ba0d5c9cb26769cf532172bee288eca182ab8fdfec
|
3 |
+
size 4362110120
|
model-00044-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d7f65ba0834720ec1e33c26e2addf38572338e0305dd925121b7c3f70abe51b6
|
3 |
+
size 4966123368
|
model-00045-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd14a3d853f8f00e8e25eae0a94d70aee8619cc6a5d5dec742dab2d06b0d5586
|
3 |
+
size 4362110120
|
model-00046-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bd3a3fdd9739853866ca0b2fb414acb2c509a486ae5cdc6bc7d32afd77baac8
|
3 |
+
size 4362110120
|
model-00047-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4e53e7a8566c184933834abecdaac9a7b3af7b0e70930b5067c0ce235f0f020
|
3 |
+
size 4966123368
|