Update vertexLib.py
Browse files- vertexLib.py +102 -75
vertexLib.py
CHANGED
@@ -2,46 +2,13 @@ import json
|
|
2 |
import time
|
3 |
import requests
|
4 |
import jwt
|
5 |
-
import aiohttp
|
6 |
-
|
7 |
|
8 |
# βββββββββββββββββββββββββββββββββββββββββ
|
9 |
-
#
|
10 |
-
# "True" β μ μ
|
11 |
-
# "exceed" β μΏΌν°β§λ μ΄νΈλ¦¬λ° μ΄κ³Ό
|
12 |
-
# "False" β κ·Έ μΈ μ€ν¨
|
13 |
-
# βββββββββββββββββββββββββββββββββββββββββ
|
14 |
-
def _classify_response(resp: requests.Response) -> str:
|
15 |
-
if resp.status_code == 200:
|
16 |
-
return "True"
|
17 |
-
|
18 |
-
try:
|
19 |
-
err = resp.json().get("error", {})
|
20 |
-
code = err.get("code", 0)
|
21 |
-
msg = str(err.get("message", "")).lower()
|
22 |
-
|
23 |
-
if code == 429 or "quota" in msg or "rate" in msg or "exceed" in msg:
|
24 |
-
return "exceed"
|
25 |
-
except Exception:
|
26 |
-
pass
|
27 |
-
|
28 |
-
return "False"
|
29 |
-
|
30 |
-
|
31 |
-
def _classify_async_status(code: int, text: str) -> str:
|
32 |
-
if code == 200:
|
33 |
-
return "True"
|
34 |
-
if code == 429 or any(kw in text.lower() for kw in ("quota", "rate", "exceed")):
|
35 |
-
return "exceed"
|
36 |
-
return "False"
|
37 |
-
|
38 |
-
|
39 |
-
# βββββββββββββββββββββββββββββββββββββββββ
|
40 |
-
# 1) Service account → access token
|
41 |
# βββββββββββββββββββββββββββββββββββββββββ
|
42 |
def get_access_token(client_email, private_key):
|
43 |
current_time = int(time.time())
|
44 |
-
expiration_time = current_time + 600
|
45 |
|
46 |
claims = {
|
47 |
"iss": client_email,
|
@@ -54,9 +21,9 @@ def get_access_token(client_email, private_key):
|
|
54 |
try:
|
55 |
signed_jwt = jwt.encode(claims, private_key, algorithm="RS256")
|
56 |
except Exception as e:
|
57 |
-
return
|
58 |
|
59 |
-
|
60 |
"https://oauth2.googleapis.com/token",
|
61 |
data={
|
62 |
"grant_type": "urn:ietf:params:oauth:grant-type:jwt-bearer",
|
@@ -64,80 +31,140 @@ def get_access_token(client_email, private_key):
|
|
64 |
},
|
65 |
)
|
66 |
|
67 |
-
|
|
|
|
|
|
|
68 |
|
69 |
|
70 |
# βββββββββββββββββββββββββββββββββββββββββ
|
71 |
-
#
|
72 |
# βββββββββββββββββββββββββββββββββββββββββ
|
73 |
def get_access_token_refresh(client_id, client_secret, refresh_token):
|
74 |
-
|
75 |
-
|
76 |
-
|
77 |
-
|
78 |
-
|
79 |
-
|
80 |
-
|
81 |
-
|
82 |
-
)
|
83 |
|
84 |
-
|
|
|
|
|
|
|
85 |
|
86 |
|
87 |
# βββββββββββββββββββββββββββββββββββββββββ
|
88 |
-
#
|
89 |
-
# Returns only whether the call succeeded
|
90 |
# βββββββββββββββββββββββββββββββββββββββββ
|
91 |
-
def get_gemini_models(key):
|
92 |
-
|
93 |
-
|
94 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
95 |
|
96 |
|
97 |
# βββββββββββββββββββββββββββββββββββββββββ
|
98 |
-
#
|
99 |
# βββββββββββββββββββββββββββββββββββββββββ
|
100 |
-
def send_fake_gemini_request(key, model="gemini-1.5-flash"):
|
|
|
|
|
|
|
|
|
101 |
url = f"https://generativelanguage.googleapis.com/v1beta/models/{model}:generateContent?key={key}"
|
102 |
payload = {
|
103 |
"contents": [{"role": "user", "parts": [{"text": ""}]}],
|
104 |
"generationConfig": {"maxOutputTokens": 0},
|
105 |
}
|
106 |
-
|
107 |
try:
|
108 |
resp = requests.post(url, headers={"Content-Type": "application/json"}, json=payload)
|
109 |
-
return
|
110 |
except Exception:
|
111 |
-
return
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
112 |
|
113 |
|
114 |
# βββββββββββββββββββββββββββββββββββββββββ
|
115 |
-
#
|
116 |
# βββββββββββββββββββββββββββββββββββββββββ
|
117 |
-
def send_gemini_request(key, payload, model="gemini-1.5-flash"):
|
118 |
url = f"https://generativelanguage.googleapis.com/v1beta/models/{model}:generateContent?key={key}"
|
119 |
resp = requests.post(url, headers={"Content-Type": "application/json"}, json=payload)
|
120 |
-
|
|
|
|
|
|
|
|
|
121 |
|
122 |
|
123 |
# βββββββββββββββββββββββββββββββββββββββββ
|
124 |
-
#
|
125 |
-
# Returns only a simplified status
|
126 |
# βββββββββββββββββββββββββββββββββββββββββ
|
127 |
async def send_gcp_request(
|
128 |
-
session
|
129 |
-
project_id: str,
|
130 |
-
access_token: str,
|
131 |
-
payload: str,
|
132 |
-
region: str = "us-east5",
|
133 |
-
model: str = "claude-3-5-sonnet@20240620",
|
134 |
):
|
135 |
-
|
|
|
|
|
|
|
136 |
headers = {
|
137 |
"Authorization": f"Bearer {access_token}",
|
138 |
"Content-Type": "application/json; charset=utf-8",
|
139 |
}
|
140 |
|
141 |
-
async with session.post(url, headers=headers, data=payload) as
|
142 |
-
|
143 |
-
|
|
|
|
2 |
import time
|
3 |
import requests
|
4 |
import jwt
|
|
|
|
|
5 |
|
6 |
# βββββββββββββββββββββββββββββββββββββββββ
|
7 |
+
# 1. GCP service-account access token
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
# βββββββββββββββββββββββββββββββββββββββββ
|
9 |
def get_access_token(client_email, private_key):
|
10 |
current_time = int(time.time())
|
11 |
+
expiration_time = current_time + 600 # 10 λΆ
|
12 |
|
13 |
claims = {
|
14 |
"iss": client_email,
|
|
|
21 |
try:
|
22 |
signed_jwt = jwt.encode(claims, private_key, algorithm="RS256")
|
23 |
except Exception as e:
|
24 |
+
return False, e
|
25 |
|
26 |
+
response = requests.post(
|
27 |
"https://oauth2.googleapis.com/token",
|
28 |
data={
|
29 |
"grant_type": "urn:ietf:params:oauth:grant-type:jwt-bearer",
|
|
|
31 |
},
|
32 |
)
|
33 |
|
34 |
+
if response.status_code == 200:
|
35 |
+
return True, response.json()["access_token"]
|
36 |
+
else:
|
37 |
+
return False, response.text
|
38 |
|
39 |
|
40 |
# βββββββββββββββββββββββββββββββββββββββββ
|
41 |
+
# 2. GCP refresh-token access token
|
42 |
# βββββββββββββββββββββββββββββββββββββββββ
|
43 |
def get_access_token_refresh(client_id, client_secret, refresh_token, timeout: float = 30.0):
    """Exchange an OAuth 2.0 refresh token for an access token.

    Posts a ``refresh_token`` grant to ``https://oauth2.googleapis.com/token``.

    Args:
        client_id: OAuth client id.
        client_secret: OAuth client secret.
        refresh_token: Refresh token to exchange.
        timeout: Seconds to wait for the token endpoint before giving up.

    Returns:
        ``(True, access_token)`` on success. ``(False, detail)`` otherwise,
        where ``detail`` is the response body, or the text of the transport
        error when no response was received.
    """
    form = {
        "client_id": client_id,
        "client_secret": client_secret,
        "refresh_token": refresh_token,
        "grant_type": "refresh_token",
    }

    try:
        response = requests.post(
            "https://oauth2.googleapis.com/token", data=form, timeout=timeout
        )
    except requests.RequestException as exc:
        # Keep the (bool, value) contract instead of leaking transport errors.
        return False, str(exc)

    if response.status_code != 200:
        return False, response.text

    try:
        return True, response.json()["access_token"]
    except (ValueError, KeyError, TypeError):
        # A 200 reply that is not JSON or lacks the token is still a failure.
        return False, response.text
|
58 |
|
59 |
|
60 |
# βββββββββββββββββββββββββββββββββββββββββ
|
61 |
+
# 3. (Optional) List models — return at most 10
|
|
|
62 |
# βββββββββββββββββββββββββββββββββββββββββ
|
63 |
+
def get_gemini_models(key, max_return: int = 1):
    """Probe the Gemini model-listing endpoint with *key*.

    Args:
        key: Gemini API key, sent as the ``key`` query parameter.
        max_return: Currently unused (see the note below).

    Returns:
        ``""`` when the request fails or the HTTP status is not 200;
        ``None`` otherwise.

    NOTE(review): an earlier draft truncated the model names to
    ``max_return`` entries and appended a "...(+N)" summary, but that return
    path was commented out, so no names are returned. Confirm with callers
    before changing the return value.
    """
    try:
        response = requests.get(
            "https://generativelanguage.googleapis.com/v1beta/models",
            # Let requests escape the key instead of splicing it into the URL.
            params={"key": key, "pageSize": 1000},
            timeout=30,
        )
    except requests.RequestException:
        return ""

    if response.status_code != 200:
        return ""
    # The model names were parsed but never used; the parsing could only
    # raise on an unexpected payload, so it is no longer performed.
    return None
|
79 |
|
80 |
|
81 |
# βββββββββββββββββββββββββββββββββββββββββ
|
82 |
+
# 4. "Dummy" request that only determines the key's status
|
83 |
# βββββββββββββββββββββββββββββββββββββββββ
|
84 |
+
def send_fake_gemini_request(key, model: str = "gemini-1.5-flash", timeout: float = 30.0):
    """Send an empty-prompt ``generateContent`` call to probe *key*.

    Args:
        key: Gemini API key, sent as the ``key`` query parameter.
        model: Model name placed in the request path.
        timeout: Seconds to wait for the API before giving up.

    Returns:
        The value of the ``error`` field of the JSON reply when present,
        ``""`` when the reply has no ``error`` field, or ``None`` when the
        request fails or the reply is not a JSON object.
    """
    url = f"https://generativelanguage.googleapis.com/v1beta/models/{model}:generateContent?key={key}"
    payload = {
        "contents": [{"role": "user", "parts": [{"text": ""}]}],
        "generationConfig": {"maxOutputTokens": 0},
    }
    try:
        resp = requests.post(
            url,
            headers={"Content-Type": "application/json"},
            json=payload,
            timeout=timeout,
        )
        return resp.json().get("error", "")
    except (requests.RequestException, ValueError, AttributeError):
        # Transport failure, non-JSON body, or a JSON body that is not an object.
        return None
|
99 |
+
|
100 |
+
|
101 |
+
def check_key_gemini_availability(key):
    """Check whether a Gemini API key is usable.

    Sends a probe via ``send_fake_gemini_request`` and interprets the error
    object it returns.

    Returns:
        A ``(bool, str)`` tuple:
            (True, "ok")       -- key is valid and usable.
            (False, "exceed")  -- quota / rate limit exceeded.
            (False, "invalid") -- bad key or missing permission.
            (False, "error")   -- network failure or unrecognised error.
    """
    err = send_fake_gemini_request(key)

    # Network failure.
    if err is None:
        return False, "error"

    # No error field in the reply means the key works.
    if err == "":
        return True, "ok"

    # Anything other than an error object cannot be analysed.
    if not isinstance(err, dict):
        return False, "error"

    code = err.get("code", 0)
    status = err.get("status", "")
    message = str(err.get("message", "")).lower()
    details = err.get("details")
    if not isinstance(details, list):
        details = []
    reasons = {item.get("reason") for item in details if isinstance(item, dict)}

    # A rejected key is also reported as INVALID_ARGUMENT, so it has to be
    # recognised before the empty-prompt case below.
    if "API_KEY_INVALID" in reasons or "api key not valid" in message:
        return False, "invalid"

    # INVALID_ARGUMENT caused by the empty prompt means the key itself is fine.
    if status == "INVALID_ARGUMENT":
        return True, "ok"

    # Quota exceeded.
    if code == 429 or status == "RESOURCE_EXHAUSTED":
        return False, "exceed"

    # Permission / authentication problem.
    if code in (401, 403) or status in ("PERMISSION_DENIED", "UNAUTHENTICATED"):
        return False, "invalid"

    # Anything else.
    return False, "error"
|
137 |
|
138 |
|
139 |
# βββββββββββββββββββββββββββββββββββββββββ
|
140 |
+
# 5. Actual Gemini request
|
141 |
# βββββββββββββββββββββββββββββββββββββββββ
|
142 |
+
def send_gemini_request(key, payload, model: str = "gemini-1.5-flash"):
    """POST *payload* to the Gemini ``generateContent`` endpoint.

    Args:
        key: Gemini API key, sent as the ``key`` query parameter.
        payload: JSON-serialisable request body.
        model: Model name placed in the request path.

    Returns:
        ``(True, parsed_json)`` when the HTTP status is 200, otherwise
        ``(False, response_text)``.
    """
    endpoint = f"https://generativelanguage.googleapis.com/v1beta/models/{model}:generateContent?key={key}"
    reply = requests.post(endpoint, headers={"Content-Type": "application/json"}, json=payload)

    succeeded = reply.status_code == 200
    return (True, reply.json()) if succeeded else (False, reply.text)
|
150 |
|
151 |
|
152 |
# βββββββββββββββββββββββββββββββββββββββββ
|
153 |
+
# 6. Vertex AI (Anthropic) request — asynchronous
|
|
|
154 |
# βββββββββββββββββββββββββββββββββββββββββ
|
155 |
async def send_gcp_request(
    session, project_id, access_token, payload, region="us-east5", model="claude-3-5-sonnet@20240620"
):
    """POST *payload* to the Vertex AI Anthropic ``streamRawPredict`` endpoint.

    Args:
        session: Object whose ``post(url=..., headers=..., data=...)`` returns
            an async context manager yielding a response with ``status``,
            ``text()`` and ``json()`` (presumably an aiohttp session -- confirm
            against the caller).
        project_id: GCP project id placed in the URL path.
        access_token: OAuth bearer token for the ``Authorization`` header.
        payload: Request body, passed through unchanged as ``data``.
        region: Region used for both the host name and the location path.
        model: Publisher model id.

    Returns:
        The parsed JSON body. For a non-200 reply whose body is not JSON, a
        dict of the form ``{"error": {"code": <status>, "message": <body>}}``
        so the HTTP status is not lost.
    """
    vertex_url = (
        f"https://{region}-aiplatform.googleapis.com/v1/projects/"
        f"{project_id}/locations/{region}/publishers/anthropic/models/{model}:streamRawPredict"
    )
    headers = {
        "Authorization": f"Bearer {access_token}",
        "Content-Type": "application/json; charset=utf-8",
    }

    async with session.post(url=vertex_url, headers=headers, data=payload) as response:
        if response.status == 200:
            return await response.json()

        body = await response.text()
        try:
            return json.loads(body)
        except ValueError:
            # Gateways and proxies may answer with HTML or plain text.
            return {"error": {"code": response.status, "message": body}}
|