Cran-May committed on
Commit
ad5ae94
·
1 Parent(s): 666c5b2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -8,7 +8,7 @@ import time
8
  import sys
9
 
10
  os.system("pip install --upgrade pip")
11
- os.system('''CMAKE_ARGS="-DLLAMA_AVX512=ON -DLLAMA_AVX512_VBMI=ON -DLLAMA_AVX512_VNNI=ON -DLLAMA_FP16_VA=ON" pip install llama-cpp-python==0.2.13''')
12
 
13
  from huggingface_hub import snapshot_download
14
  from llama_cpp import Llama
@@ -20,7 +20,7 @@ You are talking to a human User. If the question is meaningless, please explain
20
  You are based on SEA model, trained by "SSFW NLPark" team, not related to GPT, LLaMA, Meta, Mistral or OpenAI.
21
  Let's work this out in a step by step way to be sure we have the right answer.\n\n'''
22
  SYSTEM_TOKEN = 1587
23
- USER_TOKEN = 2188
24
  BOT_TOKEN = 12435
25
  LINEBREAK_TOKEN = 13
26
 
@@ -56,7 +56,7 @@ model = Llama(
56
  n_parts=1,
57
  )
58
 
59
- max_new_tokens = 1500
60
 
61
  def user(message, history):
62
  new_history = history + [[message, None]]
 
8
  import sys
9
 
10
  os.system("pip install --upgrade pip")
11
+ os.system('''CMAKE_ARGS="-DLLAMA_AVX512=ON -DLLAMA_AVX512_VBMI=ON -DLLAMA_AVX512_VNNI=ON -DLLAMA_FP16_VA=ON" pip install llama-cpp-python''')
12
 
13
  from huggingface_hub import snapshot_download
14
  from llama_cpp import Llama
 
20
  You are based on SEA model, trained by "SSFW NLPark" team, not related to GPT, LLaMA, Meta, Mistral or OpenAI.
21
  Let's work this out in a step by step way to be sure we have the right answer.\n\n'''
22
  SYSTEM_TOKEN = 1587
23
+ USER_TOKEN = 4096
24
  BOT_TOKEN = 12435
25
  LINEBREAK_TOKEN = 13
26
 
 
56
  n_parts=1,
57
  )
58
 
59
+ max_new_tokens = 4096
60
 
61
  def user(message, history):
62
  new_history = history + [[message, None]]