minpeter committed on
Commit
0ded438
·
verified ·
1 Parent(s): 6759ac3

Upload LlamaForCausalLM

Browse files
Files changed (2) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
config.json CHANGED
@@ -6,7 +6,7 @@
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 32001,
9
- "head_dim": 32,
10
  "hidden_act": "silu",
11
  "hidden_size": 256,
12
  "initializer_range": 0.02,
@@ -14,7 +14,7 @@
14
  "max_position_embeddings": 8192,
15
  "mlp_bias": false,
16
  "model_type": "llama",
17
- "num_attention_heads": 8,
18
  "num_hidden_layers": 12,
19
  "num_key_value_heads": 2,
20
  "pad_token_id": 32003,
 
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 32001,
9
+ "head_dim": 64,
10
  "hidden_act": "silu",
11
  "hidden_size": 256,
12
  "initializer_range": 0.02,
 
14
  "max_position_embeddings": 8192,
15
  "mlp_bias": false,
16
  "model_type": "llama",
17
+ "num_attention_heads": 4,
18
  "num_hidden_layers": 12,
19
  "num_key_value_heads": 2,
20
  "pad_token_id": 32003,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4189ae9393a4f793766021a2f8bd6d7f8bf58d19a953a44bc2608197cddbc315
3
- size 78437072
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f23c6c722d233179e227519b00ef0b46e8209102e60f735fcf8be37ad23c5fc7
3
+ size 80009960