Spaces:
Paused
Paused
Commit
·
de1f6e0
1
Parent(s):
a939eac
Update app.py
Browse files
app.py
CHANGED
|
@@ -26,5 +26,14 @@ model = AutoGPTQForCausalLM.from_quantized(quantized_model_dir,
|
|
| 26 |
use_triton=use_triton,
|
| 27 |
quantize_config=quantize_config)
|
| 28 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 29 |
|
| 30 |
demo.launch()
|
|
|
|
| 26 |
use_triton=use_triton,
|
| 27 |
quantize_config=quantize_config)
|
| 28 |
|
| 29 |
+
pipe = pipeline(
|
| 30 |
+
"text-generation",
|
| 31 |
+
model=model,
|
| 32 |
+
tokenizer=tokenizer,
|
| 33 |
+
max_new_tokens=512,
|
| 34 |
+
temperature=0.1,
|
| 35 |
+
top_p=0.95,
|
| 36 |
+
repetition_penalty=1.15
|
| 37 |
+
)
|
| 38 |
|
| 39 |
demo.launch()
|