Dampfinchen
/

Llama-3-8B-Ultra-Instruct

@@ -1,6 +1,11 @@
 ---
 base_model:
 - Undi95/Meta-Llama-3-8B-Instruct-hf
 library_name: transformers
 tags:
 - mergekit
@@ -33,8 +38,12 @@ This model was merged using the [DARE](https://arxiv.org/abs/2311.03099) [TIES](
 ### Models Merged
 The following models were included in the merge:
-* llama-3-8B-ultra-instruct/InstructPart
-* llama-3-8B-ultra-instruct/RPPart
 ### Configuration
@@ -56,6 +65,7 @@ dtype: bfloat16
 base_model: Undi95/Meta-Llama-3-8B-hf
 name: RPPart
 ---
 models:
   - model: Weyaxi/Einstein-v6.1-Llama3-8B
     parameters:
@@ -71,6 +81,7 @@ base_model: Undi95/Meta-Llama-3-8B-hf
 dtype: bfloat16
 name: InstructPart
 ---
 models:
   - model: RPPart
     parameters:
@@ -106,4 +117,4 @@ Detailed results can be found [here](https://huggingface.co/datasets/open-llm-le
 |MMLU (5-Shot)                    |68.32|
 |TruthfulQA (0-shot)              |52.80|
 |Winogrande (5-shot)              |76.95|
-|GSM8k (5-shot)                   |70.36|

 ---
 base_model:
 - Undi95/Meta-Llama-3-8B-Instruct-hf
+- Undi95/Llama-3-LewdPlay-8B-evo
+- jondurbin/bagel-8b-v1.0
+- Weyaxi/Einstein-v6.1-Llama3-8B
+- VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
+- aaditya/OpenBioLLM-Llama3-8B
 library_name: transformers
 tags:
 - mergekit
 ### Models Merged
 The following models were included in the merge:
+* Undi95/Meta-Llama-3-8B-Instruct-hf
+* Undi95/Llama-3-LewdPlay-8B-evo
+* jondurbin/bagel-8b-v1.0
+* Weyaxi/Einstein-v6.1-Llama3-8B
+* VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
+* aaditya/OpenBioLLM-Llama3-8B
 ### Configuration
 base_model: Undi95/Meta-Llama-3-8B-hf
 name: RPPart
 ---
 models:
   - model: Weyaxi/Einstein-v6.1-Llama3-8B
     parameters:
 dtype: bfloat16
 name: InstructPart
 ---
 models:
   - model: RPPart
     parameters:
 |MMLU (5-Shot)                    |68.32|
 |TruthfulQA (0-shot)              |52.80|
 |Winogrande (5-shot)              |76.95|
+|GSM8k (5-shot)                   |70.36|

mergekit_config.yml CHANGED Viewed

@@ -1,15 +1,43 @@
-base_model: Undi95/Meta-Llama-3-8B-Instruct-hf
 dtype: bfloat16
 merge_method: dare_ties
-slices:
-- sources:
-  - layer_range: [0, 32]
-    model: llama-3-8B-ultra-instruct/RPPart
     parameters:
       weight: 0.39
-  - layer_range: [0, 32]
-    model: llama-3-8B-ultra-instruct/InstructPart
     parameters:
       weight: 0.26
-  - layer_range: [0, 32]
-    model: Undi95/Meta-Llama-3-8B-Instruct-hf

+models:
+  - model: ChaoticNeutrals/Poppy_Porpoise-v0.7-L3-8B
+    parameters:
+      weight: 0.4
+  - model: Undi95/Llama-3-LewdPlay-8B-evo
+    parameters:
+      weight: 0.5
+  - model: jondurbin/bagel-8b-v1.0
+    parameters:
+      weight: 0.1
+merge_method: dare_ties
 dtype: bfloat16
+base_model: Undi95/Meta-Llama-3-8B-hf
+name: RPPart
+---
+models:
+  - model: Weyaxi/Einstein-v6.1-Llama3-8B
+    parameters:
+      weight: 0.6
+  - model: VAGOsolutions/Llama-3-SauerkrautLM-8b-Instruct
+    parameters:
+      weight: 0.3
+  - model: aaditya/OpenBioLLM-Llama3-8B
+    parameters:
+      weight: 0.1
 merge_method: dare_ties
+base_model: Undi95/Meta-Llama-3-8B-hf
+dtype: bfloat16
+name: InstructPart
+---
+models:
+  - model: RPPart
     parameters:
       weight: 0.39
+  - model: InstructPart
     parameters:
       weight: 0.26
+merge_method: dare_ties
+base_model: Undi95/Meta-Llama-3-8B-Instruct-hf
+dtype: bfloat16
+name: Llama-3-8B-Ultra-Instruct