LoneStriker committed on
Commit
dcda9da
1 Parent(s): 700a289

Upload 3 files

Browse files
Files changed (3) hide show
  1. README.md +19 -0
  2. adapter_config.json +2 -2
  3. config.json +1 -1
README.md ADDED
@@ -0,0 +1,19 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ inference: false
3
+ language:
4
+ - en
5
+ library_name: transformers
6
+ pipeline_tag: text-generation
7
+ tags:
8
+ - mixtral
9
+ license: apache-2.0
10
+ datasets:
11
+ - jondurbin/airoboros-3.2
12
+ ---
13
+
14
+ # Air-Striker-Mixtral-8x7B-ZLoss
15
+
16
+ Experimental model, trained using config and [Transformers/Axolotl](https://github.com/DocShotgun/axolotl) forks provided by [Doctor-Shotgun](https://huggingface.co/Doctor-Shotgun).
17
+
18
+ The model was trained on the airoboros-3.2 dataset for 4 epochs, using the ChatML prompt format at 8K context length.
19
+
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": "/users/hngo/models/Mixtral-8x7B-v0.1",
5
  "bias": "none",
6
  "fan_in_fan_out": null,
7
  "inference_mode": true,
@@ -29,4 +29,4 @@
29
  "w2"
30
  ],
31
  "task_type": "CAUSAL_LM"
32
- }
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "/users/ubuntu/models/Mixtral-8x7B-v0.1",
5
  "bias": "none",
6
  "fan_in_fan_out": null,
7
  "inference_mode": true,
 
29
  "w2"
30
  ],
31
  "task_type": "CAUSAL_LM"
32
+ }
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/users/hngo/models/Mixtral-8x7B-v0.1",
3
  "architectures": [
4
  "MixtralForCausalLM"
5
  ],
 
1
  {
2
+ "_name_or_path": "/users/ubuntu/models/Mixtral-8x7B-v0.1",
3
  "architectures": [
4
  "MixtralForCausalLM"
5
  ],