Spaces:
Building
on
CPU Upgrade
Building
on
CPU Upgrade
Update app.py
Browse files
Remove unsupported optimizations
app.py
CHANGED
@@ -29,7 +29,6 @@ import gradio as gr
|
|
29 |
|
30 |
import torch
|
31 |
from transformers import TorchAoConfig, AutoModelForCausalLM, AutoTokenizer
|
32 |
-
import torchao.quantization.pt2e as pt2e
|
33 |
from torchao.quantization import Float8DynamicActivationFloat8WeightConfig, Float8WeightOnlyConfig
|
34 |
|
35 |
# quant_config = Float8WeightOnlyConfig()
|
@@ -47,9 +46,6 @@ model = AutoModelForCausalLM.from_pretrained(
|
|
47 |
|
48 |
gc.collect()
|
49 |
|
50 |
-
pt2e.move_exported_model_to_eval(model)
|
51 |
-
|
52 |
-
gc.collect()
|
53 |
|
54 |
#########
|
55 |
|
|
|
29 |
|
30 |
import torch
|
31 |
from transformers import TorchAoConfig, AutoModelForCausalLM, AutoTokenizer
|
|
|
32 |
from torchao.quantization import Float8DynamicActivationFloat8WeightConfig, Float8WeightOnlyConfig
|
33 |
|
34 |
# quant_config = Float8WeightOnlyConfig()
|
|
|
46 |
|
47 |
gc.collect()
|
48 |
|
|
|
|
|
|
|
49 |
|
50 |
#########
|
51 |
|