Spaces:

owlninjam
/

spacecs3b

Sleeping

App Files Files Community

owlninjam committed on Aug 7, 2025

Commit

bde8af9

verified ·

1 Parent(s): 526f112

Delete app.py

Browse files

Files changed (1) hide show

app.py +0 -200

app.py DELETED Viewed

@@ -1,200 +0,0 @@
-import streamlit as st
-import subprocess
-import threading
-import time
-import requests
-import json
-from typing import List, Dict
-import sys
-import os
-# Keys offered in the sidebar selector and sent as the Bearer token.
-# NOTE(review): these are hard-coded in source; confirm they are demo-only values.
-API_KEYS = [
-    "sk-adminkey02",
-    "sk-testkey123",
-    "sk-userkey456",
-    "sk-demokey789",
-]
-# The first listed key doubles as the default used by call_api().
-DEFAULT_API_KEY = API_KEYS[0]
-def start_fastapi():
-    """Launch the FastAPI app ``api:app`` under uvicorn as a child process.
-    The server is started with ``sys.executable -m uvicorn`` on 0.0.0.0:8000
-    with a single worker. ``Popen`` returns immediately, so this function
-    does not wait for the server to become ready.
-    """
-    command = [
-        sys.executable, "-m", "uvicorn", "api:app",
-        "--host", "0.0.0.0",
-        "--port", "8000",
-        "--workers", "1",
-    ]
-    try:
-        subprocess.Popen(command)
-    except Exception as e:
-        # This function is run from a background thread by the module-level
-        # startup code, where Streamlit may not render UI calls, so the
-        # failure is also written to stderr to keep it visible in the logs.
-        print(f"Failed to start API server: {e}", file=sys.stderr)
-        st.error(f"Failed to start API server: {e}")
-    else:
-        print("🚀 FastAPI server starting on port 8000...")
-# st.session_state is per browser session, so guarding on it alone would spawn
-# another uvicorn process (and another 8 s wait) for every new visitor while
-# port 8000 is already taken. The cached helper runs once per server process.
-# show_spinner=False keeps the cache from emitting UI before main() runs
-# st.set_page_config().
-@st.cache_resource(show_spinner=False)
-def _launch_api_once():
-    """Start the API server in a daemon thread once and give it a head start."""
-    threading.Thread(target=start_fastapi, daemon=True).start()
-    # Fixed grace period before the first health check in main().
-    time.sleep(8)
-    return True
-if 'api_started' not in st.session_state:
-    st.session_state.api_started = _launch_api_once()
-def call_api(messages: List[Dict], max_tokens: int = 512, temperature: float = 0.7, api_key: str = DEFAULT_API_KEY):
-    """Send a chat-completion request to the local API server.
-    Args:
-        messages: Chat history as dicts with ``role`` and ``content`` keys.
-        max_tokens: Value forwarded as ``max_tokens`` in the request body.
-        temperature: Value forwarded as ``temperature`` in the request body.
-        api_key: Key sent in the ``Authorization: Bearer`` header.
-    Returns:
-        The decoded JSON body on HTTP 200. On any failure the problem is
-        reported with ``st.error`` and ``None`` is returned.
-    """
-    payload = {
-        "model": "zephyr-quiklang-3b-4k",
-        "messages": messages,
-        "max_tokens": max_tokens,
-        "temperature": temperature
-    }
-    try:
-        response = requests.post(
-            "http://localhost:8000/v1/chat/completions",
-            headers={"Authorization": f"Bearer {api_key}"},
-            json=payload,
-            timeout=120
-        )
-    except requests.exceptions.RequestException as e:
-        st.error(f"Failed to connect to API: {e}")
-        return None
-    if response.status_code == 401:
-        st.error("❌ Invalid API key")
-        return None
-    if response.status_code != 200:
-        st.error(f"API Error: {response.status_code} - {response.text}")
-        return None
-    try:
-        return response.json()
-    except ValueError as e:
-        # A 200 response with a non-JSON body is a server problem, not a
-        # connection failure, so report it separately instead of letting it
-        # escape or be mislabelled.
-        st.error(f"API returned an invalid JSON response: {e}")
-        return None
-def check_api_health() -> bool:
-    """Return True when the local ``/v1/health`` endpoint answers HTTP 200."""
-    try:
-        response = requests.get("http://localhost:8000/v1/health", timeout=10)
-    except requests.exceptions.RequestException:
-        # Unreachable or timed out: report unhealthy. Only request errors are
-        # caught so KeyboardInterrupt/SystemExit still propagate.
-        return False
-    return response.status_code == 200
-def get_api_info():
-    """Fetch the JSON document served at the local ``/v1`` endpoint.
-    Returns:
-        The decoded JSON body on HTTP 200, otherwise ``None`` (non-200
-        status, request failure, or a body that is not valid JSON).
-    """
-    try:
-        response = requests.get("http://localhost:8000/v1", timeout=5)
-        if response.status_code == 200:
-            return response.json()
-    except (requests.exceptions.RequestException, ValueError):
-        # Best-effort lookup: request and decode errors mean "no info", but
-        # interpreter-level exceptions are no longer swallowed.
-        return None
-    return None
-def _build_api_messages(history: List[Dict]) -> List[Dict]:
-    """Reduce stored chat entries to the ``role``/``content`` pairs sent to the API."""
-    # Assistant entries carry an extra "stats" key for display. Only that key
-    # is dropped here; the assistant turns themselves stay in the history.
-    return [{"role": msg["role"], "content": msg["content"]} for msg in history]
-def main():
-    """Render the Streamlit chat UI for the local chat-completions API.
-    Draws the page header and API status row, stops early while the health
-    check fails, then renders the settings sidebar, the chat tab and the
-    code-examples tab.
-    """
-    st.set_page_config(
-        page_title="🧠 Zephyr Quiklang 3B-4K Chat",
-        page_icon="🧠",
-        layout="wide",
-        initial_sidebar_state="expanded"
-    )
-    st.title("🧠 Zephyr Quiklang 3B-4K")
-    st.markdown("*3B parameter model with OpenAI-compatible API (Q4_K_M quantized)*")
-    space_url = st.text_input(
-        "🌐 Your Space URL",
-        placeholder="https://your-username-your-space.hf.space",
-        help="Enter your Hugging Face Space URL for API examples"
-    )
-    # Normalise once so surrounding spaces or a trailing slash in the pasted
-    # URL do not produce a malformed ".../ /v1" or "...//v1" base URL.
-    space_root = (space_url or "").strip().rstrip("/") or "https://your-space.hf.space"
-    base_url = f"{space_root}/v1"
-    api_healthy = check_api_health()
-    col1, col2, col3 = st.columns([2, 1, 1])
-    with col1:
-        if api_healthy:
-            st.success("✅ API Server is running")
-        else:
-            st.warning("⏳ API Server is starting...")
-    with col2:
-        if st.button("🔄 Refresh"):
-            st.rerun()
-    with col3:
-        if st.button("📊 API Info"):
-            info = get_api_info()
-            if info:
-                st.json(info)
-    if not api_healthy:
-        st.info("🕐 The model is loading in the background. First startup may take 2-3 minutes.")
-        st.stop()
-    with st.sidebar:
-        st.header("⚙️ Settings")
-        selected_api_key = st.selectbox("🔑 API Key", API_KEYS, index=0)
-        max_tokens = st.slider("Max Tokens", 50, 1024, 512)
-        temperature = st.slider("Temperature", 0.0, 1.0, 0.7, 0.1)
-        st.divider()
-        st.header("📡 API Access")
-        st.markdown(f"**Base URL:** `{base_url}`")
-        st.code("/v1/models")
-        st.code("/v1/chat/completions")
-        st.code("/v1/health")
-        st.code("/v1/docs")
-        st.markdown("**Authentication Header:**")
-        st.code(f"Authorization: Bearer {selected_api_key}")
-    tab1, tab2 = st.tabs(["💬 Chat", "🔗 Code Examples"])
-    with tab1:
-        if "messages" not in st.session_state:
-            st.session_state.messages = []
-        # Replay the stored conversation on every rerun.
-        for message in st.session_state.messages:
-            with st.chat_message(message["role"]):
-                st.markdown(message["content"])
-                if "stats" in message:
-                    st.caption(message["stats"])
-        if prompt := st.chat_input("Ask me anything..."):
-            st.session_state.messages.append({"role": "user", "content": prompt})
-            with st.chat_message("user"):
-                st.markdown(prompt)
-            with st.chat_message("assistant"):
-                with st.spinner("🤔 Thinking..."):
-                    api_messages = _build_api_messages(st.session_state.messages)
-                    # Measure the real round-trip time instead of deriving a
-                    # figure from the token count.
-                    started = time.perf_counter()
-                    result = call_api(api_messages, max_tokens, temperature, selected_api_key)
-                    generation_time = time.perf_counter() - started
-                    # call_api returns None on failure; also tolerate a reply
-                    # with a missing or empty "choices" list.
-                    choices = result.get('choices') if isinstance(result, dict) else None
-                    if choices:
-                        response = choices[0]['message']['content']
-                        usage = result.get('usage') or {}
-                        completion_tokens = usage.get('completion_tokens', 0)
-                        stats = f"📊 {completion_tokens} tokens • ~{generation_time:.1f}s • API: {selected_api_key[:12]}..."
-                        st.markdown(response)
-                        st.caption(stats)
-                        st.session_state.messages.append({
-                            "role": "assistant",
-                            "content": response,
-                            "stats": stats
-                        })
-        col1, col2 = st.columns(2)
-        with col1:
-            if st.button("🗑️ Clear Chat"):
-                st.session_state.messages = []
-                st.rerun()
-        with col2:
-            # NOTE(review): the download button only exists on the run in which
-            # "Export Chat" was clicked; confirm this two-step flow is intended.
-            if st.button("💾 Export Chat"):
-                chat_json = json.dumps(st.session_state.messages, indent=2)
-                st.download_button("📥 Download JSON", chat_json, "chat_export.json", "application/json")
-    with tab2:
-        st.subheader("🐍 Python Example")
-        python_code = f"""from openai import OpenAI
-client = OpenAI(
-    base_url="{base_url}",
-    api_key="{selected_api_key}"
-)
-response = client.chat.completions.create(
-    model="zephyr-quiklang-3b-4k",
-    messages=[{{"role": "user", "content": "Hello!"}}],
-    max_tokens=512,
-    temperature=0.7
-)
-print(response.choices[0].message.content)
-"""
-        st.code(python_code, language="python")
-# Build the UI only when this file is run as the main script, not on import.
-if __name__ == "__main__":
-    main()