Spaces:

caidaohz
/

dp

Paused

App Files Files Community

caidaohz committed on Jun 24, 2025

Commit

dad2a85

1 Parent(s): 2c89095

✨ 更新性能指标，优化内存使用和错误率显示，确保精度提升至两位小数；增加API超时时间配置以支持长时间流式响应

Browse files

Files changed (3) hide show

.gitignore +1 -0
main.go +39 -17
stats.go +7 -3

.gitignore CHANGED Viewed

@@ -108,3 +108,4 @@ api-proxy
 # Go coverage files
 *.out
 proxy-server

 # Go coverage files
 *.out
 proxy-server
+deno-proxy

main.go CHANGED Viewed

@@ -44,11 +44,12 @@ var (
 		"/cerebras":    "https://api.cerebras.ai",
 	}
 	httpClient = &http.Client{
-		Timeout: 30 * time.Second,
 		Transport: &http.Transport{
-			MaxIdleConns:        100,
-			MaxIdleConnsPerHost: 100,
-			IdleConnTimeout:     90 * time.Second,
 		},
 	}
 )
@@ -140,12 +141,6 @@ func (apc *AsyncProxyContext) StreamData(data []byte) error {
 // handleAPIProxy 处理API代理请求（异步优化版）
 func handleAPIProxy(c *gin.Context) {
-	// 创建异步代理上下文
-	asyncCtx := NewAsyncProxyContext(c, 60*time.Second) // 60秒超时
-	defer asyncCtx.cancel()
-	atomic.AddInt64(&requestCount, 1)
 	path := c.Request.URL.Path
 	prefix, rest := extractPrefixAndRest(path)
 	if prefix == "" {
@@ -154,6 +149,13 @@ func handleAPIProxy(c *gin.Context) {
 		return
 	}
 	// 异步记录请求，避免阻塞主流程
 	go stats.recordRequest(prefix)
@@ -299,13 +301,7 @@ func apc_streamResponseBody(asyncCtx *AsyncProxyContext, resp *http.Response) er
 		case <-asyncCtx.ctx.Done():
 			return asyncCtx.ctx.Err()
 		default:
-			// 设置读取超时
-			if deadline, ok := asyncCtx.ctx.Deadline(); ok {
-				if tcpConn, ok := resp.Body.(interface{ SetReadDeadline(time.Time) error }); ok {
-					tcpConn.SetReadDeadline(deadline)
-				}
-			}
 			n, err := resp.Body.Read(buffer)
 			if n > 0 {
 				if streamErr := asyncCtx.StreamData(buffer[:n]); streamErr != nil {
@@ -612,6 +608,31 @@ func fastJSONPatch(bodyBytes []byte) ([]byte, error) {
 	return json.Marshal(bodyJSON)
 }
 // main 主函数
 func main() {
 	// 设置生产模式
@@ -671,6 +692,7 @@ func main() {
 	log.Printf("🚀 API代理服务器已启动 (Go优化版) 端口:%s", port)
 	log.Printf("🕒 统计数据每分钟自动刷新页面")
 	log.Printf("⚡ 性能优化：异步统计、内存优化、锁竞争减少")
 	log.Printf("📊 访问 http://localhost:%s 查看统计信息", port)
 	// 使用自定义HTTP服务器以更好地控制

 		"/cerebras":    "https://api.cerebras.ai",
 	}
 	httpClient = &http.Client{
+		Timeout: 1800 * time.Second, // 增加到30分钟，适合长时间AI流式响应
 		Transport: &http.Transport{
+			MaxIdleConns:          100,
+			MaxIdleConnsPerHost:   100,
+			IdleConnTimeout:       90 * time.Second,
+			ResponseHeaderTimeout: 30 * time.Second, // 只对响应头设置30秒超时
 		},
 	}
 )
 // handleAPIProxy 处理API代理请求（异步优化版）
 func handleAPIProxy(c *gin.Context) {
 	path := c.Request.URL.Path
 	prefix, rest := extractPrefixAndRest(path)
 	if prefix == "" {
 		return
 	}
+	// 根据API端点设置合适的超时时间
+	timeout := getTimeoutForEndpoint(prefix)
+	asyncCtx := NewAsyncProxyContext(c, timeout)
+	defer asyncCtx.cancel()
+	atomic.AddInt64(&requestCount, 1)
 	// 异步记录请求，避免阻塞主流程
 	go stats.recordRequest(prefix)
 		case <-asyncCtx.ctx.Done():
 			return asyncCtx.ctx.Err()
 		default:
+			// 对于流式响应，不设置严格的读取超时，让context控制整体超时
 			n, err := resp.Body.Read(buffer)
 			if n > 0 {
 				if streamErr := asyncCtx.StreamData(buffer[:n]); streamErr != nil {
 	return json.Marshal(bodyJSON)
 }
// getTimeoutForEndpoint returns the per-request timeout for the given route
// prefix.
//
// prefix is matched exactly (case-sensitive, including the leading slash)
// against the known AI provider prefixes. Those get a 30-minute budget so
// that long-running streaming responses are not cut off; any other prefix,
// including the empty string, gets 60 seconds.
//
// The lookup is a switch over constant strings rather than a map literal:
// this function runs once per proxied request, and a map literal would be
// rebuilt on every call just to look up a single constant key.
func getTimeoutForEndpoint(prefix string) time.Duration {
	const (
		// aiTimeout is the budget for AI streaming APIs (30 minutes).
		aiTimeout = 30 * time.Minute
		// defaultTimeout is the shorter budget used for all other APIs.
		defaultTimeout = 60 * time.Second
	)

	switch prefix {
	case "/openai",
		"/claude",
		"/gemini",
		"/gnothink",
		"/groq",
		"/xai",
		"/cohere",
		"/together",
		"/fireworks",
		"/openrouter",
		"/cerebras":
		return aiTimeout
	default:
		return defaultTimeout
	}
}
 // main 主函数
 func main() {
 	// 设置生产模式
 	log.Printf("🚀 API代理服务器已启动 (Go优化版) 端口:%s", port)
 	log.Printf("🕒 统计数据每分钟自动刷新页面")
 	log.Printf("⚡ 性能优化：异步统计、内存优化、锁竞争减少")
+	log.Printf("⏱️  超时配置：AI API 30分钟，其他API 1分钟，HTTP客户端 30分钟")
 	log.Printf("📊 访问 http://localhost:%s 查看统计信息", port)
 	// 使用自定义HTTP服务器以更好地控制

stats.go CHANGED Viewed

@@ -1,6 +1,7 @@
 package main
 import (
 	"runtime"
 	"sync"
 	"sync/atomic"
@@ -241,7 +242,7 @@ func updatePerformanceMetrics() {
 	var m runtime.MemStats
 	runtime.ReadMemStats(&m)
-	perfMetrics.MemoryUsageMB = float64(m.Alloc) / 1024 / 1024
 	perfMetrics.GoroutineCount = runtime.NumGoroutine()
 	perfMetrics.LastUpdated = now.UnixMilli()
@@ -281,6 +282,9 @@ func updatePerformanceMetrics() {
 				perfMetrics.RequestsPerSec = 0.3*qps + 0.7*perfMetrics.RequestsPerSec
 			}
 			// 更新记录
 			atomic.StoreInt64(&lastQPSUpdate, currentTime)
 			atomic.StoreInt64(&lastRequestCount, currentRequests)
@@ -291,8 +295,8 @@ func updatePerformanceMetrics() {
 	totalErrors := atomic.LoadInt64(&errorCount)
 	if totalReqs > 0 {
 		errorRate := float64(totalErrors) / float64(totalReqs) * 100
-		// 四舍五入到2位小数
-		perfMetrics.ErrorRate = float64(int(errorRate*100+0.5)) / 100
 	}
 	// 计算平均响应时间

 package main
 import (
+	"math"
 	"runtime"
 	"sync"
 	"sync/atomic"
 	var m runtime.MemStats
 	runtime.ReadMemStats(&m)
+	perfMetrics.MemoryUsageMB = math.Round(float64(m.Alloc)/1024/1024*100) / 100
 	perfMetrics.GoroutineCount = runtime.NumGoroutine()
 	perfMetrics.LastUpdated = now.UnixMilli()
 				perfMetrics.RequestsPerSec = 0.3*qps + 0.7*perfMetrics.RequestsPerSec
 			}
+			// 保留2位小数
+			perfMetrics.RequestsPerSec = math.Round(perfMetrics.RequestsPerSec*100) / 100
 			// 更新记录
 			atomic.StoreInt64(&lastQPSUpdate, currentTime)
 			atomic.StoreInt64(&lastRequestCount, currentRequests)
 	totalErrors := atomic.LoadInt64(&errorCount)
 	if totalReqs > 0 {
 		errorRate := float64(totalErrors) / float64(totalReqs) * 100
+		// 使用math.Round保证精确的2位小数
+		perfMetrics.ErrorRate = math.Round(errorRate*100) / 100
 	}
 	// 计算平均响应时间