Update app.py
Browse files
app.py
CHANGED
@@ -16,19 +16,27 @@ def respond(message):
|
|
16 |
# Record the start time
|
17 |
start_time = time.time()
|
18 |
|
19 |
-
#
|
20 |
-
|
21 |
-
|
|
|
22 |
# Generate response
|
23 |
response = pipe(
|
24 |
input_text,
|
25 |
-
max_length=
|
26 |
truncation=True,
|
27 |
num_return_sequences=1,
|
28 |
temperature=0.2, # 控制生成多样性
|
29 |
top_p=0.1, # 控制生成质量
|
30 |
)
|
31 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
32 |
|
33 |
# Calculate inference time
|
34 |
inference_time = time.time() - start_time
|
|
|
16 |
# Record the start time
|
17 |
start_time = time.time()
|
18 |
|
19 |
+
# 修改 prompt:在對話中加入指令,要求只輸出最終答案,不顯示推理過程
|
20 |
+
instruction = "請只輸出最終答案,不要展示任何中間推理過程。"
|
21 |
+
input_text = f"User: {message}\nAssistant: {instruction}\nAssistant:"
|
22 |
+
|
23 |
# Generate response
|
24 |
response = pipe(
|
25 |
input_text,
|
26 |
+
max_length=1024,
|
27 |
truncation=True,
|
28 |
num_return_sequences=1,
|
29 |
temperature=0.2, # 控制生成多样性
|
30 |
top_p=0.1, # 控制生成质量
|
31 |
)
|
32 |
+
generated_text = response[0]['generated_text'].strip()
|
33 |
+
|
34 |
+
# 提取模型輸出中最後一次出現 "Assistant:" 之後的部分(假設模型按照格式輸出)
|
35 |
+
# 若模型輸出格式不同,可根據實際情況進行調整
|
36 |
+
if "Assistant:" in generated_text:
|
37 |
+
reply = generated_text.split("Assistant:")[-1].strip()
|
38 |
+
else:
|
39 |
+
reply = generated_text
|
40 |
|
41 |
# Calculate inference time
|
42 |
inference_time = time.time() - start_time
|