Text Generation
Transformers
Safetensors
English
llama
conversational
text-generation-inference
lucifertrj committed
Commit eb999fa · verified · 1 Parent(s): 768371f

Upload folder using huggingface_hub

config.json CHANGED
@@ -1,5 +1,5 @@
 {
-  "_name_or_path": "meta-llama/Llama-2-7b-hf",
+  "_name_or_path": "codellama/CodeLlama-13b-Instruct-hf",
   "architectures": [
     "LlamaForCausalLM"
   ],
@@ -8,14 +8,14 @@
   "bos_token_id": 1,
   "eos_token_id": 2,
   "hidden_act": "silu",
-  "hidden_size": 4096,
+  "hidden_size": 5120,
   "initializer_range": 0.02,
-  "intermediate_size": 11008,
-  "max_position_embeddings": 4096,
+  "intermediate_size": 13824,
+  "max_position_embeddings": 16384,
   "model_type": "llama",
-  "num_attention_heads": 32,
-  "num_hidden_layers": 32,
-  "num_key_value_heads": 32,
+  "num_attention_heads": 40,
+  "num_hidden_layers": 40,
+  "num_key_value_heads": 40,
   "pretraining_tp": 1,
   "quantization_config": {
     "_load_in_4bit": true,
@@ -33,10 +33,10 @@
   },
   "rms_norm_eps": 1e-05,
   "rope_scaling": null,
-  "rope_theta": 10000.0,
+  "rope_theta": 1000000,
   "tie_word_embeddings": false,
   "torch_dtype": "float16",
   "transformers_version": "4.38.2",
-  "use_cache": true,
-  "vocab_size": 32000
+  "use_cache": false,
+  "vocab_size": 32016
 }
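
Taken together, this swaps the Llama-2-7B geometry for CodeLlama-13B-Instruct: wider hidden states (5120 vs. 4096), 40 layers and attention heads instead of 32, a 16K context window backed by a larger RoPE base (1e6 vs. 1e4), and 16 extra vocabulary slots for the infilling tokens; the embedded 4-bit quantization block is unchanged. A minimal sketch to confirm the new shape without downloading any weights, using the base-model id recorded in `_name_or_path`:

```python
from transformers import AutoConfig

# Sketch: inspect the updated architecture without loading weights.
cfg = AutoConfig.from_pretrained("codellama/CodeLlama-13b-Instruct-hf")

assert cfg.hidden_size == 5120               # was 4096 on Llama-2-7b
assert cfg.num_hidden_layers == 40           # was 32
assert cfg.num_key_value_heads == 40         # full multi-head attention, no GQA
assert cfg.max_position_embeddings == 16384  # 16K context window
assert cfg.rope_theta == 1_000_000           # larger RoPE base for the longer context
assert cfg.vocab_size == 32016               # +16 slots for the infilling tokens
```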
generation_config.json CHANGED
@@ -1,10 +1,6 @@
 {
+  "_from_model_config": true,
   "bos_token_id": 1,
-  "do_sample": true,
   "eos_token_id": 2,
-  "max_length": 4096,
-  "pad_token_id": 0,
-  "temperature": 0.6,
-  "top_p": 0.9,
   "transformers_version": "4.38.2"
 }
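
With `do_sample`, `temperature`, `top_p`, `max_length`, and `pad_token_id` dropped, the repo no longer ships decoding defaults; `_from_model_config: true` marks the file as merely mirroring the token ids in config.json. Sampling settings now have to be passed per call. A sketch that reuses the old defaults explicitly (requires `accelerate` for `device_map="auto"`):

```python
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "codellama/CodeLlama-13b-Instruct-hf"  # base model named in config.json
tok = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")

inputs = tok("def fibonacci(n):", return_tensors="pt").to(model.device)
out = model.generate(
    **inputs,
    max_new_tokens=128,   # max_length is gone, so bound generation per call
    do_sample=True,       # previously a repo-level default
    temperature=0.6,      # ditto
    top_p=0.9,            # ditto
)
print(tok.decode(out[0], skip_special_tokens=True))
```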
pytorch_model-00001-of-00002.bin ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:de8c0ae9cd517ee4a0feeee0886a3e5f90ebee6ff7285977bd0340c4956f6875
+size 5000268830

pytorch_model-00002-of-00002.bin ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:24d4212eb7bbb0eaae609e9507e036efa2414e4ecb7b7f6e1ccd324ee2660723
+size 2202469569
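
The two weight shards are stored through Git LFS, so the repo tracks only pointer files; per the LFS spec, the `oid` is the SHA-256 of the actual payload, which makes a local integrity check straightforward once a shard is downloaded. A sketch:

```python
import hashlib

def sha256sum(path: str) -> str:
    """Stream-hash a file so multi-GB shards need not fit in memory."""
    h = hashlib.sha256()
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):
            h.update(chunk)
    return h.hexdigest()

# oid copied from the LFS pointer above
expected = "de8c0ae9cd517ee4a0feeee0886a3e5f90ebee6ff7285977bd0340c4956f6875"
assert sha256sum("pytorch_model-00001-of-00002.bin") == expected
```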
pytorch_model.bin.index.json ADDED
The diff for this file is too large to render. See raw diff
 
special_tokens_map.json CHANGED
@@ -1,4 +1,10 @@
 {
+  "additional_special_tokens": [
+    "▁<PRE>",
+    "▁<MID>",
+    "▁<SUF>",
+    "▁<EOT>"
+  ],
   "bos_token": {
     "content": "<s>",
     "lstrip": false,
@@ -13,6 +19,7 @@
     "rstrip": false,
     "single_word": false
   },
+  "pad_token": "</s>",
   "unk_token": {
     "content": "<unk>",
     "lstrip": false,
tokenizer.json CHANGED
@@ -1,7 +1,21 @@
 {
   "version": "1.0",
-  "truncation": null,
-  "padding": null,
+  "truncation": {
+    "direction": "Right",
+    "max_length": 512,
+    "strategy": "LongestFirst",
+    "stride": 0
+  },
+  "padding": {
+    "strategy": {
+      "Fixed": 512
+    },
+    "direction": "Right",
+    "pad_to_multiple_of": null,
+    "pad_id": 2,
+    "pad_type_id": 0,
+    "pad_token": "</s>"
+  },
   "added_tokens": [
     {
       "id": 0,
@@ -29,6 +43,42 @@
       "rstrip": false,
       "normalized": false,
       "special": true
+    },
+    {
+      "id": 32007,
+      "content": "▁<PRE>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32008,
+      "content": "▁<SUF>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32009,
+      "content": "▁<MID>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
+    },
+    {
+      "id": 32010,
+      "content": "▁<EOT>",
+      "single_word": false,
+      "lstrip": false,
+      "rstrip": false,
+      "normalized": false,
+      "special": true
     }
   ],
   "normalizer": {
@@ -32134,7 +32184,23 @@
     "왕": 31996,
     "收": 31997,
     "弘": 31998,
-    "给": 31999
+    "给": 31999,
+    "▁<SU": 32000,
+    "▁<SUF": 32001,
+    "▁<PRE": 32002,
+    "▁<M": 32003,
+    "▁<MID": 32004,
+    "▁<E": 32005,
+    "▁<EOT": 32006,
+    "▁<PRE>": 32007,
+    "▁<SUF>": 32008,
+    "▁<MID>": 32009,
+    "▁<EOT>": 32010,
+    "▁<EOT><EOT>": 32011,
+    "▁<EOT><EOT><EOT>": 32012,
+    "▁<EOT><EOT><EOT><EOT>": 32013,
+    "▁<EOT><EOT><EOT><EOT><EOT>": 32014,
+    "▁<EOT><EOT><EOT><EOT><EOT><EOT>": 32015
   },
   "merges": [
     "▁ t",
@@ -93385,7 +93451,18 @@
     "▁▁▁▁▁▁▁▁▁ ▁▁▁▁▁▁",
     "▁▁▁▁▁▁▁ ▁▁▁▁▁▁▁▁",
     "▁▁▁▁▁▁▁▁▁▁▁ ▁▁▁▁",
-    "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁"
+    "▁ ▁▁▁▁▁▁▁▁▁▁▁▁▁▁",
+    "▁< SU",
+    "▁<SU F",
+    "▁< PRE",
+    "▁< M",
+    "▁<M ID",
+    "▁< E",
+    "▁<E OT",
+    "▁<PRE >",
+    "▁<SUF >",
+    "▁<MID >",
+    "▁<EOT >"
   ]
   }
 }
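
Besides registering the infilling sentinels as added tokens and filling vocab slots 32000-32015 (including the merged runs of `▁<EOT>` used to pack consecutive end-of-infill markers), the new tokenizer.json bakes in right-side truncation and fixed-length padding to 512 with `pad_id` 2 (`</s>`), presumably left over from a fine-tuning setup; consumers loading tokenizer.json directly via the `tokenizers` library will pick up that fixed 512 setting. The new ids are easy to confirm (sketch):

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("codellama/CodeLlama-13b-Instruct-hf")
for t in ["▁<PRE>", "▁<SUF>", "▁<MID>", "▁<EOT>"]:
    print(t, tok.convert_tokens_to_ids(t))
# expected ids: 32007, 32008, 32009, 32010
```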
tokenizer.model CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9e556afd44213b6bd1be2b850ebbbd98f5481437a8021afaf58ee7fb1818d347
-size 499723
+oid sha256:45ccb9c8b6b561889acea59191d66986d314e7cbd6a78abc6e49b139ca91c1e6
+size 500058
tokenizer_config.json CHANGED
@@ -25,17 +25,60 @@
       "rstrip": false,
       "single_word": false,
       "special": true
+    },
+    "32007": {
+      "content": "▁<PRE>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32008": {
+      "content": "▁<SUF>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32009": {
+      "content": "▁<MID>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "32010": {
+      "content": "▁<EOT>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
     }
   },
+  "additional_special_tokens": [
+    "▁<PRE>",
+    "▁<MID>",
+    "▁<SUF>",
+    "▁<EOT>"
+  ],
   "bos_token": "<s>",
+  "chat_template": "{% if messages[0]['role'] == 'system' %}{% set loop_messages = messages[1:] %}{% set system_message = messages[0]['content'] %}{% else %}{% set loop_messages = messages %}{% set system_message = false %}{% endif %}{% for message in loop_messages %}{% if (message['role'] == 'user') != (loop.index0 % 2 == 0) %}{{ raise_exception('Conversation roles must alternate user/assistant/user/assistant/...') }}{% endif %}{% if loop.index0 == 0 and system_message != false %}{% set content = '<<SYS>>\\n' + system_message + '\\n<</SYS>>\\n\\n' + message['content'] %}{% else %}{% set content = message['content'] %}{% endif %}{% if message['role'] == 'user' %}{{ bos_token + '[INST] ' + content | trim + ' [/INST]' }}{% elif message['role'] == 'assistant' %}{{ ' ' + content | trim + ' ' + eos_token }}{% endif %}{% endfor %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "</s>",
-  "legacy": false,
+  "eot_token": "▁<EOT>",
+  "fill_token": "<FILL_ME>",
+  "legacy": null,
+  "middle_token": "▁<MID>",
   "model_max_length": 1000000000000000019884624838656,
-  "pad_token": null,
-  "padding_side": "right",
+  "pad_token": "</s>",
+  "prefix_token": "▁<PRE>",
   "sp_model_kwargs": {},
-  "tokenizer_class": "LlamaTokenizer",
+  "suffix_token": "▁<SUF>",
+  "tokenizer_class": "CodeLlamaTokenizer",
   "unk_token": "<unk>",
   "use_default_system_prompt": false
 }
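
Switching `tokenizer_class` from LlamaTokenizer to CodeLlamaTokenizer activates the two behaviours declared here: the Llama-2-style `chat_template` (bos + `[INST] ... [/INST]` turns with an optional `<<SYS>>` block) and fill-in-the-middle via the `<FILL_ME>` marker, which the tokenizer expands into the prefix/suffix/middle token layout. A usage sketch:

```python
from transformers import AutoTokenizer

tok = AutoTokenizer.from_pretrained("codellama/CodeLlama-13b-Instruct-hf")

# 1) Chat formatting through the new chat_template:
messages = [
    {"role": "system", "content": "You are a careful Python reviewer."},
    {"role": "user", "content": "Write a function that reverses a string."},
]
prompt = tok.apply_chat_template(messages, tokenize=False)
print(prompt)  # <s>[INST] <<SYS>>\n...\n<</SYS>>\n\n... [/INST]

# 2) Infilling: <FILL_ME> is rewritten into the ▁<PRE> prefix ▁<SUF> suffix ▁<MID> layout
ids = tok("def add(a, b):\n    <FILL_ME>\n", return_tensors="pt").input_ids
print(ids)
```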