Update app.py
Browse files
app.py
CHANGED
@@ -1,17 +1,17 @@
|
|
1 |
import gradio as gr
|
2 |
-
|
3 |
import torch
|
4 |
from peft import PeftModel, PeftConfig
|
5 |
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, AutoTokenizer, GenerationConfig
|
6 |
-
|
7 |
from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig, GemmaTokenizer, StoppingCriteria, StoppingCriteriaList, GenerationConfig
|
8 |
-
|
9 |
import os
|
10 |
|
|
|
|
|
|
|
11 |
peft_model_id = "daqc/kuntur-peru-legal-es-gemma-2b-it"
|
12 |
config = PeftConfig.from_pretrained(peft_model_id)
|
13 |
-
model = AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path, return_dict=True, load_in_8bit=True, device_map={"":0})
|
14 |
-
tokenizer = AutoTokenizer.from_pretrained(peft_model_id)
|
15 |
|
16 |
model = PeftModel.from_pretrained(model, peft_model_id)
|
17 |
model.eval()
|
|
|
1 |
import gradio as gr
|
|
|
2 |
import torch
|
3 |
from peft import PeftModel, PeftConfig
|
4 |
from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, AutoTokenizer, GenerationConfig
|
|
|
5 |
from transformers import AutoTokenizer, AutoModelForCausalLM, BitsAndBytesConfig, GemmaTokenizer, StoppingCriteria, StoppingCriteriaList, GenerationConfig
|
|
|
6 |
import os
|
7 |
|
8 |
+
# Hugging Face access token read from the "hf_token" environment variable (None when unset); the from_pretrained calls below reference it as `hf_token`.
hf_token = os.getenv("hf_token")
|
9 |
+
|
10 |
+
|
11 |
peft_model_id = "daqc/kuntur-peru-legal-es-gemma-2b-it"
|
12 |
config = PeftConfig.from_pretrained(peft_model_id)
|
13 |
+
model = AutoModelForCausalLM.from_pretrained(config.base_model_name_or_path, return_dict=True, load_in_8bit=True, device_map={"":0}, token=hf_token)
|
14 |
+
tokenizer = AutoTokenizer.from_pretrained(peft_model_id, token=hf_token)
|
15 |
|
16 |
model = PeftModel.from_pretrained(model, peft_model_id)
|
17 |
model.eval()
|