Upload LlamaForCausalLM
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +29 -0
- generation_config.json +8 -0
- model-00001-of-00061.safetensors +3 -0
- model-00002-of-00061.safetensors +3 -0
- model-00003-of-00061.safetensors +3 -0
- model-00004-of-00061.safetensors +3 -0
- model-00005-of-00061.safetensors +3 -0
- model-00006-of-00061.safetensors +3 -0
- model-00007-of-00061.safetensors +3 -0
- model-00008-of-00061.safetensors +3 -0
- model-00009-of-00061.safetensors +3 -0
- model-00010-of-00061.safetensors +3 -0
- model-00011-of-00061.safetensors +3 -0
- model-00012-of-00061.safetensors +3 -0
- model-00013-of-00061.safetensors +3 -0
- model-00014-of-00061.safetensors +3 -0
- model-00015-of-00061.safetensors +3 -0
- model-00016-of-00061.safetensors +3 -0
- model-00017-of-00061.safetensors +3 -0
- model-00018-of-00061.safetensors +3 -0
- model-00019-of-00061.safetensors +3 -0
- model-00020-of-00061.safetensors +3 -0
- model-00021-of-00061.safetensors +3 -0
- model-00022-of-00061.safetensors +3 -0
- model-00023-of-00061.safetensors +3 -0
- model-00024-of-00061.safetensors +3 -0
- model-00025-of-00061.safetensors +3 -0
- model-00026-of-00061.safetensors +3 -0
- model-00027-of-00061.safetensors +3 -0
- model-00028-of-00061.safetensors +3 -0
- model-00029-of-00061.safetensors +3 -0
- model-00030-of-00061.safetensors +3 -0
- model-00031-of-00061.safetensors +3 -0
- model-00032-of-00061.safetensors +3 -0
- model-00033-of-00061.safetensors +3 -0
- model-00034-of-00061.safetensors +3 -0
- model-00035-of-00061.safetensors +3 -0
- model-00036-of-00061.safetensors +3 -0
- model-00037-of-00061.safetensors +3 -0
- model-00038-of-00061.safetensors +3 -0
- model-00039-of-00061.safetensors +3 -0
- model-00040-of-00061.safetensors +3 -0
- model-00041-of-00061.safetensors +3 -0
- model-00042-of-00061.safetensors +3 -0
- model-00043-of-00061.safetensors +3 -0
- model-00044-of-00061.safetensors +3 -0
- model-00045-of-00061.safetensors +3 -0
- model-00046-of-00061.safetensors +3 -0
- model-00047-of-00061.safetensors +3 -0
- model-00048-of-00061.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "merged_marcoroni70b",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 8192,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 28672,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"num_attention_heads": 64,
|
17 |
+
"num_hidden_layers": 80,
|
18 |
+
"num_key_value_heads": 8,
|
19 |
+
"pad_token_id": 0,
|
20 |
+
"pretraining_tp": 1,
|
21 |
+
"rms_norm_eps": 1e-05,
|
22 |
+
"rope_scaling": null,
|
23 |
+
"rope_theta": 10000.0,
|
24 |
+
"tie_word_embeddings": false,
|
25 |
+
"torch_dtype": "float32",
|
26 |
+
"transformers_version": "4.36.2",
|
27 |
+
"use_cache": false,
|
28 |
+
"vocab_size": 32000
|
29 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,8 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 0,
|
6 |
+
"transformers_version": "4.36.2",
|
7 |
+
"use_cache": false
|
8 |
+
}
|
model-00001-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c921454a21d2c14b80ee950a05f42ecc36f2b44a382dcaa58f627911d4cfc78
|
3 |
+
size 4806739440
|
model-00002-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc6a497911d6e54cf79fe48a19d88a1874e123e1382f8b0825f80f86d94bf67a
|
3 |
+
size 4630578440
|
model-00003-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bb7cdf4b22b39aea4aec8a4545d137b271ff58ed20f0e416cdf9f516b1f5638
|
3 |
+
size 4362142864
|
model-00004-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3acaaeb105328a6cd1beb6dbbec05a8e206faaa507afa92186bf0dfe620dca9a
|
3 |
+
size 4966188864
|
model-00005-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d3a07113797690bcd5b09ebd0e5091415734730e1073a519d0ad868cf32fb018
|
3 |
+
size 4362142864
|
model-00006-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f685a6bec89b561abeed2d2d50a048f6360e18d41da6096c76c921c01d0a7726
|
3 |
+
size 4362142864
|
model-00007-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7879bf679306240982de17b19d7d1b5c8a61f502a6755814cf838e2344f7076
|
3 |
+
size 4966188864
|
model-00008-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:acc9d683a48d957473b7190e2fc19438cd42114e815afa74ff11d5761cc31a44
|
3 |
+
size 4362142880
|
model-00009-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8e65c0be11c75254b5a72851119a5c378c6cbde9f775c6395b592fef1ec5b933
|
3 |
+
size 4362142872
|
model-00010-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:833b9629fd2797930dab0ea203cddbbb5fa1dc146e402fbaf53b4b342dd5b9c9
|
3 |
+
size 4966188880
|
model-00011-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec8d428c5af18e27350d237b9042370fdf2503ec7acc6494e3b44a7c14da622e
|
3 |
+
size 4362142872
|
model-00012-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2af8795d69ed71e1a06d2dbbfd5b48439a46141bb90b795553cc758a0c562ea4
|
3 |
+
size 4362142872
|
model-00013-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ee7401f22503919607e109185c270e34d2f3ca723eb09e263a0f9bd94e66c94
|
3 |
+
size 4966188880
|
model-00014-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8603add4dd9382107bb77c6bd04b365e32a3ce2a6ef154d0c7a06a8131fce16
|
3 |
+
size 4362142872
|
model-00015-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:007854ada89f3f97a2d7281c8903dbb471751391dfb0f99bc2f441609f0c8309
|
3 |
+
size 4362142872
|
model-00016-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c5359e3fbe06ac2c5f4226367b9862bbe9ec52f023a2b3903abc47f7ebf94a6
|
3 |
+
size 4966188880
|
model-00017-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11c1ff4222fc0bfc7384d9d786402aeb78de40f4233691be91a702aadcb2d7d0
|
3 |
+
size 4362142872
|
model-00018-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c37be7fc13e5be411457381725b07effdff88ed3eb8cfa2ddfd73b24a818df57
|
3 |
+
size 4362142872
|
model-00019-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:699f5e55ab8af815a8077bdfcd799cbde6d32cd2a8eed998aae0dedf878b7e41
|
3 |
+
size 4966188880
|
model-00020-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7bfed75586618d1423e0d85b030ef09758ecf68ce3d287c43324dc281e2977e5
|
3 |
+
size 4362142872
|
model-00021-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3dc977d1e3642cf1d09c9359a8c09333a3960ef6ef1c96b47086472ceedbde5
|
3 |
+
size 4362142872
|
model-00022-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a48af4b56cb5f36ae09912a4aea1999522b80faf83eaf987e4a96e1cac763e01
|
3 |
+
size 4966188880
|
model-00023-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:84dd5e109fedaa08bd68da7ff92c3ae47a14f902c04d249a6ba79240bcab2374
|
3 |
+
size 4362142872
|
model-00024-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50a71a3b20c05490d0ebfa4705bba954162ddca20d61fbdb434ee8ed03effe47
|
3 |
+
size 4362142872
|
model-00025-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:150f593b91b8e37d3f1534dc7fa08929dec9296f50e949977dcda9f9e4ebe8e5
|
3 |
+
size 4966188880
|
model-00026-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2deffdd7aa5fd025f13634d2185c4831bb7a1d2eb895fd446604b1def0b08484
|
3 |
+
size 4362142872
|
model-00027-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ebb73f23107966e39d94d4ba043166d9e9e83320818b33d9f4ea0440eb72113
|
3 |
+
size 4362142872
|
model-00028-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3181d787fa6a9c47741d7c70375cfd4566ac5275deb85b80cc9680b2c6b4f54
|
3 |
+
size 4966188880
|
model-00029-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a30b9d4e0f70d6a7737d975dd6539dbdda47a270748c1c0b2cb843cf9fa98aba
|
3 |
+
size 4362142872
|
model-00030-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:38b2d4a4ca167ef885d2e6347c018f45f0ab247ebf434a0f4c7590c683dba96c
|
3 |
+
size 4362142872
|
model-00031-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:634c36e9b3bf11f9a0705a2b218d769c5ecc457227aa0b1b69ec3ea9185e7721
|
3 |
+
size 4966188880
|
model-00032-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d730cb66474233b5da031179301133298e5e2e40ec1a8b5c6583187a0042932d
|
3 |
+
size 4362142872
|
model-00033-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0fb9a14b0ad587092fa350b2e2ba70ab689030e5de5136f9435f195cc219f78d
|
3 |
+
size 4362142872
|
model-00034-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e99c2e241a386b946dfa9de6c2f2b80ec80f99733a586bda62b2d2ff83d0a977
|
3 |
+
size 4966188880
|
model-00035-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1487c296ecf3c1955d32c5b8d36c768830a14919958bd734f4f60993e787bfbe
|
3 |
+
size 4362142872
|
model-00036-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c92b2d0eeb416f96052a7eb82a84065193d6b76b209a6b32767066c81da2fe08
|
3 |
+
size 4362142872
|
model-00037-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1f6941e407b38a38999e9eb16b823760e75654704c3c9632cdb63954f91f6597
|
3 |
+
size 4966188880
|
model-00038-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ba77213ae35e9e785ac16d74ee8eb5cbdbef1b03ba8f7f2fb6a8711ff58df3e
|
3 |
+
size 4362142872
|
model-00039-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50bfdbcbcc0253f1d755599bbc777a1e90c1995924d776299bbcf6b9005f3f40
|
3 |
+
size 4362142872
|
model-00040-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7548698a52f67879ed7333e01296f59d0924756faf718e13f7cc6af0e35672d4
|
3 |
+
size 4966188880
|
model-00041-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c062571485cd736c62d949f2fabc4deecc80ed7192e3cd59b815331ea8ce13eb
|
3 |
+
size 4362142872
|
model-00042-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7e712a14133c9a2e1a7ed50edc4163712431df86d944a227b1acafde74da6cb
|
3 |
+
size 4362142872
|
model-00043-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6943e2137d3da0eed59ada7bf8dadac1c05016835d199d83ce6d3bac7ee6c3e2
|
3 |
+
size 4966188880
|
model-00044-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2207531330d874f2fd3f2d9971ef4f6847355ce5c655a5a5ea65b5df5dad8022
|
3 |
+
size 4362142872
|
model-00045-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7267b73fce2a4d4f63643c2ef281e91157aac7e4cde784eb875b431d8813ef9
|
3 |
+
size 4362142872
|
model-00046-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2bddfc5288852364407679c384bf7fcfc6a81638ccd03b0c1fc63367cae1a9d
|
3 |
+
size 4966188880
|
model-00047-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9bf30fb3f82c73ac064c826e888cde87fb6c07722ba139fa07a570bf4a037a2e
|
3 |
+
size 4362142872
|
model-00048-of-00061.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81da0ee7520aa5feec78297401a97a877a796c4a70c92e04b72c7cc5c7fbafe0
|
3 |
+
size 4362142872
|