Spaces:
Running
on
Zero
Running
on
Zero
Commit
·
2fae289
1
Parent(s):
04a10c7
update
Browse files
- src/attribution/attntrace.py +1 -0
- src/models/Llama.py +1 -0
src/attribution/attntrace.py
CHANGED
@@ -36,6 +36,7 @@ class AttnTraceAttribution(Attribution):
|
|
36 |
#print(last_group,group, last_group_label,group_label)
|
37 |
importances[feature_index[0]]+=(last_group_loss-group_loss)
|
38 |
return importances
|
|
|
39 |
def attribute(self, question: str, contexts: list, answer: str,explained_answer: str, customized_template: str = None):
|
40 |
start_time = time.time()
|
41 |
if self.llm.model!=None:
|
|
|
36 |
#print(last_group,group, last_group_label,group_label)
|
37 |
importances[feature_index[0]]+=(last_group_loss-group_loss)
|
38 |
return importances
|
39 |
+ @spaces.GPU
|
40 |
def attribute(self, question: str, contexts: list, answer: str,explained_answer: str, customized_template: str = None):
|
41 |
start_time = time.time()
|
42 |
if self.llm.model!=None:
|
src/models/Llama.py
CHANGED
@@ -34,6 +34,7 @@ class Llama(Model):
|
|
34 |
self.model = model
|
35 |
return self.model
|
36 |
|
|
|
37 |
def query(self, msg, max_tokens=128000):
|
38 |
model = self._load_model_if_needed().to("cuda")
|
39 |
messages = self.messages
|
|
|
34 |
self.model = model
|
35 |
return self.model
|
36 |
|
37 |
+ @spaces.GPU
|
38 |
def query(self, msg, max_tokens=128000):
|
39 |
model = self._load_model_if_needed().to("cuda")
|
40 |
messages = self.messages
|