DrNicefellow committed on
Commit
0495aad
1 Parent(s): 57eae2c

Upload 3 files

Browse files
Files changed (2) hide show
  1. config.json +2 -1
  2. model.safetensors +3 -0
config.json CHANGED
@@ -1,4 +1,5 @@
1
  {
 
2
  "activation_function": "gelu_new",
3
  "architectures": [
4
  "GPT2LMHeadModel"
@@ -25,7 +26,7 @@
25
  "summary_proj_to_labels": true,
26
  "summary_type": "cls_index",
27
  "summary_use_proj": true,
28
- "torch_dtype": "float32",
29
  "transformers_version": "4.43.1",
30
  "use_cache": true,
31
  "vocab_size": 50304
 
1
  {
2
+ "_name_or_path": "DrNicefellow/Nano-GPT2-500m-29k_steps",
3
  "activation_function": "gelu_new",
4
  "architectures": [
5
  "GPT2LMHeadModel"
 
26
  "summary_proj_to_labels": true,
27
  "summary_type": "cls_index",
28
  "summary_use_proj": true,
29
+ "torch_dtype": "bfloat16",
30
  "transformers_version": "4.43.1",
31
  "use_cache": true,
32
  "vocab_size": 50304
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1962b57e8ae4ccc40ab13366944b811242f3a2ac13b0ce89eaf10c420141d51
3
+ size 1012097368