Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -22,16 +22,20 @@ def generate_response(prompt):
|
|
22 |
try:
|
23 |
generated = pipe.generate([prompt], max_length=1024)
|
24 |
tokenpersec=f'{generated.perf_metrics.get_throughput().mean:.2f}'
|
|
|
25 |
match = re.search(r"<think>(.*?)</think>(.*)", generated, re.DOTALL)
|
26 |
-
|
|
|
27 |
if match:
|
28 |
thinking = match.group(1).strip()
|
29 |
content = match.group(2).strip()
|
30 |
else:
|
31 |
thinking = "模型沒有提供思考過程"
|
32 |
content = generated # 或者 generated.text， 取決於 generated 物件的屬性
|
33 |
-
|
34 |
return tokenpersec, thinking, content
|
|
|
|
|
35 |
except Exception as e:
|
36 |
return "發生錯誤", "發生錯誤", f"生成回應時發生錯誤：{e}"
|
37 |
|
@@ -42,8 +46,9 @@ demo = gr.Interface(
|
|
42 |
inputs=gr.Textbox(lines=5, label="輸入提示 (Prompt)"),
|
43 |
outputs=[
|
44 |
gr.Textbox(label="tokens/sec"),
|
45 |
-
gr.Textbox(label="思考過程"),
|
46 |
-
gr.Textbox(label="最終回應")
|
|
|
47 |
],
|
48 |
title="Qwen3-0.6B-int4-ov ",
|
49 |
description="基於 Qwen3-0.6B-int4-ov 推理應用，支援思考過程分離與 GUI。"
|
|
|
22 |
try:
|
23 |
generated = pipe.generate([prompt], max_length=1024)
|
24 |
tokenpersec=f'{generated.perf_metrics.get_throughput().mean:.2f}'
|
25 |
+
'''
|
26 |
match = re.search(r"<think>(.*?)</think>(.*)", generated, re.DOTALL)
|
27 |
+
thinking = ""
|
28 |
+
content = ""
|
29 |
if match:
|
30 |
thinking = match.group(1).strip()
|
31 |
content = match.group(2).strip()
|
32 |
else:
|
33 |
thinking = "模型沒有提供思考過程"
|
34 |
content = generated # 或者 generated.text， 取決於 generated 物件的屬性
|
35 |
+
|
36 |
return tokenpersec, thinking, content
|
37 |
+
'''
|
38 |
+
return tokenpersec, generated
|
39 |
except Exception as e:
|
40 |
return "發生錯誤", "發生錯誤", f"生成回應時發生錯誤：{e}"
|
41 |
|
|
|
46 |
inputs=gr.Textbox(lines=5, label="輸入提示 (Prompt)"),
|
47 |
outputs=[
|
48 |
gr.Textbox(label="tokens/sec"),
|
49 |
+
#gr.Textbox(label="思考過程"),
|
50 |
+
#gr.Textbox(label="最終回應")
|
51 |
+
gr.Textbox(label="回應")
|
52 |
],
|
53 |
title="Qwen3-0.6B-int4-ov ",
|
54 |
description="基於 Qwen3-0.6B-int4-ov 推理應用，支援思考過程分離與 GUI。"
|