hsuwill000 committed on
Commit
de22364
·
verified ·
1 Parent(s): 5202755

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -3
app.py CHANGED
@@ -39,13 +39,15 @@ model_path = "ov"
39
  pipe = ov_genai.LLMPipeline(model_path, "CPU")
40
  '''
41
 
42
- model = OVModelForCausalLM.from_pretrained(
43
  model_id,
44
- quantization_config=OVWeightQuantizationConfig(bits=4, asym=True, ratio=0.8, dataset="ptb"),
 
45
  )
46
 
 
47
  # save the model after optimization
48
- model.save_pretrained(model_path)
49
 
50
  #pipe.start_chat()
51
 
 
39
  pipe = ov_genai.LLMPipeline(model_path, "CPU")
40
  '''
41
 
42
+ pipe = OVModelForCausalLM.from_pretrained(
43
  model_id,
44
+ export=True,
45
+ quantization_config=OVWeightQuantizationConfig(bits=4),
46
  )
47
 
48
+
49
  # save the model after optimization
50
+ #pipe.save_pretrained(model_path)
51
 
52
  #pipe.start_chat()
53