Spaces:
Running
on
T4
Running
on
T4
Update auditqa/reader.py
Browse files- auditqa/reader.py +15 -0
auditqa/reader.py
CHANGED
@@ -11,6 +11,21 @@ model_config = getconfig("model_params.cfg")
|
|
11 |
NVIDIA_SERVER = os.environ["NVIDIA_SERVERLESS"]
|
12 |
HF_token = os.environ["LLAMA_3_1"]
|
13 |
INF_SERVERLESS = os.environ["INF_SERVERLESS"]
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
14 |
|
15 |
|
16 |
def nvidia_client():
|
|
|
11 |
NVIDIA_SERVER = os.environ["NVIDIA_SERVERLESS"]
|
12 |
HF_token = os.environ["LLAMA_3_1"]
|
13 |
INF_SERVERLESS = os.environ["INF_SERVERLESS"]
|
14 |
+
NEBIUS_LLAMA3_1_8B = os.environ["NEBIUS"]
|
15 |
+
|
16 |
+
|
17 |
+
|
18 |
+
def Inf_provider():
    """Return an inference client for the configured service provider.

    The provider name is read from the ``INF_PROVIDER`` option in the
    ``reader`` section of the module-level ``model_config``; the API key is
    the module-level ``NEBIUS_LLAMA3_1_8B`` value.

    Returns:
        The ``InferenceClient`` instance built for that provider.
    """
    # Bind the provider name once: it is needed both as the constructor
    # argument and in the log message below (the original referenced an
    # undefined ``provider`` name in the f-string).
    # NOTE(review): InferenceClient is presumably huggingface_hub's client,
    # imported elsewhere in this file - confirm the installed version
    # accepts the ``provider`` keyword.
    provider = model_config.get('reader', 'INF_PROVIDER')
    client = InferenceClient(
        provider=provider,
        api_key=NEBIUS_LLAMA3_1_8B,
    )
    print(f"getting {provider} client")

    return client
|
28 |
+
|
29 |
|
30 |
|
31 |
def nvidia_client():
|