Spaces:
Paused
Paused
Upload 3 files
Browse files
app.py
CHANGED
|
@@ -1124,22 +1124,37 @@ def index():
|
|
| 1124 |
|
| 1125 |
def num_tokens_from_string(string, model=""):
|
| 1126 |
try:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1127 |
response = requests.post(
|
| 1128 |
TOKENIZER_SERVICE_URL,
|
| 1129 |
-
json=
|
| 1130 |
timeout=10
|
| 1131 |
)
|
| 1132 |
|
|
|
|
|
|
|
|
|
|
| 1133 |
if response.status_code == 200:
|
| 1134 |
result = response.json()
|
| 1135 |
input_tokens = result.get("input_tokens", 0)
|
| 1136 |
-
|
|
|
|
| 1137 |
else:
|
|
|
|
| 1138 |
print(f"Tokenizer服务错误: {response.status_code} - {response.text}")
|
| 1139 |
-
|
|
|
|
| 1140 |
except Exception as e:
|
|
|
|
| 1141 |
print(f"计算token错误: {e}")
|
| 1142 |
-
|
|
|
|
| 1143 |
|
| 1144 |
|
| 1145 |
# 更新模型使用统计
|
|
|
|
| 1124 |
|
| 1125 |
def _estimate_token_count(text):
    """Return a rough token count for *text*: one token per four characters.

    ``None`` is treated as empty text so that the fallback path can never
    raise on its own.
    """
    return len(text or "") // 4


def num_tokens_from_string(string, model=""):
    """Count the tokens in *string* using the tokenizer service.

    Posts ``string`` as a single user message, together with ``model``, to
    ``TOKENIZER_SERVICE_URL`` and reads ``input_tokens`` from the JSON reply.
    Whenever the service cannot supply a count (non-200 status, a reply
    without ``input_tokens``, or any exception raised while calling it), the
    count is estimated locally as ``len(string) // 4`` instead.

    Args:
        string: Text whose tokens should be counted.
        model: Model name forwarded to the tokenizer service.

    Returns:
        A ``(token_count, method)`` tuple, where ``method`` is ``"精确"``
        (exact, reported by the service) or ``"估算"`` (estimated locally).
    """
    try:
        print(f"\n开始计算token: model={model}")
        request_data = {
            "model": model,
            "messages": [{"role": "user", "content": string}],
        }
        # NOTE(review): this writes the full text being counted to stdout;
        # confirm that is acceptable for the deployment's logs.
        print(f"请求数据: {json.dumps(request_data, ensure_ascii=False)}")

        response = requests.post(
            TOKENIZER_SERVICE_URL,
            json=request_data,
            timeout=10,
        )

        print(f"Tokenizer响应状态码: {response.status_code}")
        print(f"Tokenizer响应内容: {response.text}")

        if response.status_code == 200:
            result = response.json()
            input_tokens = result.get("input_tokens")
            if input_tokens is not None:
                print(f"成功获取token数: {input_tokens},返回计算方法: 精确")
                return input_tokens, "精确"
            # A 200 reply without the field must not be reported as an exact
            # count of zero; fall through to the local estimate instead.
            print(f"Tokenizer响应缺少input_tokens字段: {response.text}")
        else:
            print(f"Tokenizer服务错误: {response.status_code} - {response.text}")
    except Exception as e:
        # Deliberate best-effort boundary: token counting must never break
        # the caller, so every failure degrades to the estimate below.
        print(f"计算token错误: {e}")

    # Single fallback path, kept outside the try/except so that computing the
    # estimate cannot raise from inside the exception handler.
    estimated_tokens = _estimate_token_count(string)
    print(f"使用估算token数: {estimated_tokens},返回计算方法: 估算")
    return estimated_tokens, "估算"
|
| 1158 |
|
| 1159 |
|
| 1160 |
# 更新模型使用统计
|