Colin Dablain
committed on
feat: factor out HF_API_ROOT to allow different inference endpoints (#332)
Browse files
- .env +1 -0
- src/lib/server/modelEndpoint.ts +2 -2
.env
CHANGED
|
@@ -7,6 +7,7 @@ MONGODB_DIRECT_CONNECTION=false
|
|
| 7 |
|
| 8 |
COOKIE_NAME=hf-chat
|
| 9 |
HF_ACCESS_TOKEN=#hf_<token> from https://huggingface.co/settings/token
|
|
|
|
| 10 |
|
| 11 |
# used to activate search with web functionality. disabled if none are defined. choose one of the following:
|
| 12 |
SERPER_API_KEY=#your serper.dev api key here
|
|
|
|
| 7 |
|
| 8 |
COOKIE_NAME=hf-chat
|
| 9 |
HF_ACCESS_TOKEN=#hf_<token> from https://huggingface.co/settings/token
|
| 10 |
+
HF_API_ROOT=https://api-inference.huggingface.co/models
|
| 11 |
|
| 12 |
# used to activate search with web functionality. disabled if none are defined. choose one of the following:
|
| 13 |
SERPER_API_KEY=#your serper.dev api key here
|
src/lib/server/modelEndpoint.ts
CHANGED
|
@@ -1,4 +1,4 @@
|
|
| 1 |
-
import { HF_ACCESS_TOKEN } from "$env/static/private";
|
| 2 |
import { sum } from "$lib/utils/sum";
|
| 3 |
import type { BackendModel } from "./models";
|
| 4 |
|
|
@@ -12,7 +12,7 @@ export function modelEndpoint(model: BackendModel): {
|
|
| 12 |
} {
|
| 13 |
if (!model.endpoints) {
|
| 14 |
return {
|
| 15 |
-
url: `https://api-inference.huggingface.co/models/${model.name}`,
|
| 16 |
authorization: `Bearer ${HF_ACCESS_TOKEN}`,
|
| 17 |
weight: 1,
|
| 18 |
};
|
|
|
|
| 1 |
+
import { HF_ACCESS_TOKEN, HF_API_ROOT } from "$env/static/private";
|
| 2 |
import { sum } from "$lib/utils/sum";
|
| 3 |
import type { BackendModel } from "./models";
|
| 4 |
|
|
|
|
| 12 |
} {
|
| 13 |
if (!model.endpoints) {
|
| 14 |
return {
|
| 15 |
+
url: `${HF_API_ROOT}/${model.name}`,
|
| 16 |
authorization: `Bearer ${HF_ACCESS_TOKEN}`,
|
| 17 |
weight: 1,
|
| 18 |
};
|