Point app to org model repo
Browse files
README.md
CHANGED
|
@@ -12,7 +12,7 @@ header: mini
|
|
| 12 |
short_description: "Dense Gradio lab console for probing a Phase-3 Q8 GGUF."
|
| 13 |
suggested_hardware: zero-a10g
|
| 14 |
models:
|
| 15 |
-
- owenisas/Phase-3-GGUF
|
| 16 |
tags:
|
| 17 |
- gradio
|
| 18 |
- zerogpu
|
|
@@ -27,7 +27,7 @@ license: mit
|
|
| 27 |
# First-Principle AI
|
| 28 |
|
| 29 |
First-Principle AI is a compact Gradio console for probing the
|
| 30 |
-
`owenisas/Phase-3-GGUF` Q8 GGUF model through
|
| 31 |
`llama-cpp-python`.
|
| 32 |
|
| 33 |
The UI is intentionally dense: chat, sampling controls, system prompt,
|
|
@@ -36,7 +36,7 @@ one screen.
|
|
| 36 |
|
| 37 |
## Runtime Notes
|
| 38 |
|
| 39 |
-
- Model repo: `owenisas/Phase-3-GGUF`
|
| 40 |
- Model file: `model-Q8_0.gguf`
|
| 41 |
- Runtime: `llama-cpp-python`
|
| 42 |
- Hardware target: ZeroGPU
|
|
|
|
| 12 |
short_description: "Dense Gradio lab console for probing a Phase-3 Q8 GGUF."
|
| 13 |
suggested_hardware: zero-a10g
|
| 14 |
models:
|
| 15 |
+
- build-small-hackathon/phase-3-gguf
|
| 16 |
tags:
|
| 17 |
- gradio
|
| 18 |
- zerogpu
|
|
|
|
| 27 |
# First-Principle AI
|
| 28 |
|
| 29 |
First-Principle AI is a compact Gradio console for probing the
|
| 30 |
+
`build-small-hackathon/phase-3-gguf` Q8 GGUF model through
|
| 31 |
`llama-cpp-python`.
|
| 32 |
|
| 33 |
The UI is intentionally dense: chat, sampling controls, system prompt,
|
|
|
|
| 36 |
|
| 37 |
## Runtime Notes
|
| 38 |
|
| 39 |
+
- Model repo: `build-small-hackathon/phase-3-gguf`
|
| 40 |
- Model file: `model-Q8_0.gguf`
|
| 41 |
- Runtime: `llama-cpp-python`
|
| 42 |
- Hardware target: ZeroGPU
|
app.py
CHANGED
|
@@ -25,7 +25,7 @@ else:
|
|
| 25 |
LLAMA_IMPORT_ERROR = None
|
| 26 |
|
| 27 |
|
| 28 |
-
MODEL_REPO = os.getenv("PHASE3_MODEL_REPO", "owenisas/Phase-3-GGUF")
|
| 29 |
MODEL_FILE = os.getenv("PHASE3_MODEL_FILE", "model-Q8_0.gguf")
|
| 30 |
MODEL_LABEL = "First-Principle AI"
|
| 31 |
LOCAL_MODEL_PATH = Path("/Users/user/.lmstudio/models/owenisas/Phase-3-GGUF/model-Q8_0.gguf")
|
|
@@ -424,7 +424,7 @@ with gr.Blocks(title="First-Principle AI", fill_width=True) as demo:
|
|
| 424 |
<h1>First-Principle AI</h1>
|
| 425 |
<p>A dense Gradio console for probing the Phase-3 Q8 GGUF with visible runtime diagnostics.</p>
|
| 426 |
<div class="phase-badge-row">
|
| 427 |
-
<span class="phase-badge"><strong>Model</strong> owenisas/Phase-3-GGUF</span>
|
| 428 |
<span class="phase-badge"><strong>Runtime</strong> llama.cpp via llama-cpp-python</span>
|
| 429 |
<span class="phase-badge"><strong>Hardware target</strong> ZeroGPU with guarded fallback</span>
|
| 430 |
</div>
|
|
|
|
| 25 |
LLAMA_IMPORT_ERROR = None
|
| 26 |
|
| 27 |
|
| 28 |
+
MODEL_REPO = os.getenv("PHASE3_MODEL_REPO", "build-small-hackathon/phase-3-gguf")
|
| 29 |
MODEL_FILE = os.getenv("PHASE3_MODEL_FILE", "model-Q8_0.gguf")
|
| 30 |
MODEL_LABEL = "First-Principle AI"
|
| 31 |
LOCAL_MODEL_PATH = Path("/Users/user/.lmstudio/models/owenisas/Phase-3-GGUF/model-Q8_0.gguf")
|
|
|
|
| 424 |
<h1>First-Principle AI</h1>
|
| 425 |
<p>A dense Gradio console for probing the Phase-3 Q8 GGUF with visible runtime diagnostics.</p>
|
| 426 |
<div class="phase-badge-row">
|
| 427 |
+
<span class="phase-badge"><strong>Model</strong> build-small-hackathon/phase-3-gguf</span>
|
| 428 |
<span class="phase-badge"><strong>Runtime</strong> llama.cpp via llama-cpp-python</span>
|
| 429 |
<span class="phase-badge"><strong>Hardware target</strong> ZeroGPU with guarded fallback</span>
|
| 430 |
</div>
|