vedaco committed · Commit d7c8b67 (verified) · 1 Parent(s): cc1f992

Create app.py

Files changed (1): app.py +1092 -0
app.py ADDED
@@ -0,0 +1,1092 @@
"""
Visible LLM - A Language Model built with TensorFlow
Trained on veda.txt
"""

import os
import json
import numpy as np
import tensorflow as tf
from tensorflow import keras
from tensorflow.keras import layers
from flask import Flask, request, jsonify, render_template_string
import re
import pickle
from datetime import datetime

# ============================================================
# CONFIGURATION
# ============================================================

class VisibleConfig:
    """Configuration for Visible LLM"""
    MODEL_NAME = "Visible"
    VERSION = "1.0.0"

    # Model Architecture
    VOCAB_SIZE = 10000
    EMBEDDING_DIM = 256
    NUM_HEADS = 8
    NUM_LAYERS = 6
    FF_DIM = 512
    MAX_SEQ_LENGTH = 128
    DROPOUT_RATE = 0.1

    # Training
    BATCH_SIZE = 32
    EPOCHS = 50
    LEARNING_RATE = 0.0001
    WARMUP_STEPS = 4000

    # Paths
    DATA_FILE = "veda.txt"
    MODEL_DIR = "models"
    MODEL_PATH = "models/visible_model"
    TOKENIZER_PATH = "models/visible_tokenizer.pkl"
    CONFIG_PATH = "models/visible_config.json"

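# Note: WARMUP_STEPS is declared above but never consumed; the compile step
# below uses plain Adam with a fixed LEARNING_RATE. If warmup were wired in,
# one minimal sketch (an illustration, not part of the original design) is a
# custom schedule that ramps the learning rate linearly over WARMUP_STEPS:
class LinearWarmup(keras.optimizers.schedules.LearningRateSchedule):
    """Hypothetical helper: linear warmup to a peak learning rate."""

    def __init__(self, peak_lr, warmup_steps):
        self.peak_lr = peak_lr
        self.warmup_steps = warmup_steps

    def __call__(self, step):
        # Ramp from 0 to peak_lr over warmup_steps, then hold flat
        step = tf.cast(step, tf.float32)
        return self.peak_lr * tf.minimum(1.0, step / float(self.warmup_steps))

    def get_config(self):
        return {'peak_lr': self.peak_lr, 'warmup_steps': self.warmup_steps}

# e.g. keras.optimizers.Adam(
#          learning_rate=LinearWarmup(VisibleConfig.LEARNING_RATE,
#                                     VisibleConfig.WARMUP_STEPS))
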

# ============================================================
# CUSTOM TOKENIZER
# ============================================================

class VisibleTokenizer:
    """Custom tokenizer for Visible LLM"""

    def __init__(self, vocab_size=10000):
        self.vocab_size = vocab_size
        self.word_to_idx = {}
        self.idx_to_word = {}
        self.vocab = []

        # Special tokens
        self.pad_token = "<PAD>"
        self.unk_token = "<UNK>"
        self.start_token = "<START>"
        self.end_token = "<END>"

        self.pad_token_id = 0
        self.unk_token_id = 1
        self.start_token_id = 2
        self.end_token_id = 3

    def _preprocess_text(self, text):
        """Clean and preprocess text"""
        text = text.lower()
        text = re.sub(r'[^\w\s\.\,\!\?\;\:\'\"\-]', '', text)
        text = re.sub(r'\s+', ' ', text)
        return text.strip()

    def _tokenize(self, text):
        """Split text into tokens"""
        text = self._preprocess_text(text)
        # Simple word-level tokenization with punctuation handling
        tokens = re.findall(r'\w+|[^\w\s]', text)
        return tokens

    def fit(self, texts):
        """Build vocabulary from texts"""
        print("Building vocabulary...")
        word_counts = {}

        for text in texts:
            tokens = self._tokenize(text)
            for token in tokens:
                word_counts[token] = word_counts.get(token, 0) + 1

        # Sort by frequency
        sorted_words = sorted(word_counts.items(), key=lambda x: x[1], reverse=True)

        # Build vocabulary with special tokens
        self.vocab = [self.pad_token, self.unk_token, self.start_token, self.end_token]
        self.vocab.extend([word for word, _ in sorted_words[:self.vocab_size - 4]])

        self.word_to_idx = {word: idx for idx, word in enumerate(self.vocab)}
        self.idx_to_word = {idx: word for idx, word in enumerate(self.vocab)}

        print(f"Vocabulary size: {len(self.vocab)}")
        return self

    def encode(self, text, max_length=None, add_special_tokens=True):
        """Encode text to token ids"""
        tokens = self._tokenize(text)

        if add_special_tokens:
            tokens = [self.start_token] + tokens + [self.end_token]

        token_ids = [self.word_to_idx.get(token, self.unk_token_id) for token in tokens]

        if max_length:
            if len(token_ids) > max_length:
                token_ids = token_ids[:max_length]
            else:
                token_ids.extend([self.pad_token_id] * (max_length - len(token_ids)))

        return token_ids

    def decode(self, token_ids, skip_special_tokens=True):
        """Decode token ids to text"""
        special_ids = {self.pad_token_id, self.start_token_id, self.end_token_id}

        tokens = []
        for idx in token_ids:
            if skip_special_tokens and idx in special_ids:
                continue
            if idx == self.unk_token_id and skip_special_tokens:
                tokens.append("<?>")
            else:
                tokens.append(self.idx_to_word.get(idx, self.unk_token))

        # Join tokens properly
        text = ' '.join(tokens)
        # Fix punctuation spacing
        text = re.sub(r'\s+([.,!?;:])', r'\1', text)
        return text

    def save(self, path):
        """Save tokenizer to file"""
        with open(path, 'wb') as f:
            pickle.dump({
                'vocab': self.vocab,
                'vocab_size': self.vocab_size
            }, f)
        print(f"Tokenizer saved to {path}")

    def load(self, path):
        """Load tokenizer from file"""
        with open(path, 'rb') as f:
            data = pickle.load(f)
        self.vocab = data['vocab']
        self.vocab_size = data['vocab_size']
        self.word_to_idx = {word: idx for idx, word in enumerate(self.vocab)}
        self.idx_to_word = {idx: word for idx, word in enumerate(self.vocab)}
        print(f"Tokenizer loaded from {path}")
        return self

    def __len__(self):
        return len(self.vocab)

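# Expected round-trip behavior (a sketch of the tokenizer's contract; the
# literal ids depend on the fitted corpus, so the values shown are only
# illustrative):
#
#   tok = VisibleTokenizer(vocab_size=100)
#   tok.fit(["The hymn begins. The hymn ends."])
#   ids = tok.encode("the hymn", add_special_tokens=True)
#   # -> [2, ..., 3]  i.e. <START> the hymn <END>
#   tok.decode(ids)
#   # -> "the hymn"
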
# ============================================================
# TRANSFORMER COMPONENTS
# ============================================================

class PositionalEncoding(layers.Layer):
    """Positional encoding layer"""

    def __init__(self, max_seq_length, embed_dim, **kwargs):
        super().__init__(**kwargs)
        self.max_seq_length = max_seq_length
        self.embed_dim = embed_dim

        # Create positional encoding matrix
        position = np.arange(max_seq_length)[:, np.newaxis]
        div_term = np.exp(np.arange(0, embed_dim, 2) * -(np.log(10000.0) / embed_dim))

        pe = np.zeros((max_seq_length, embed_dim))
        pe[:, 0::2] = np.sin(position * div_term)
        pe[:, 1::2] = np.cos(position * div_term)

        self.positional_encoding = tf.constant(pe, dtype=tf.float32)

    def call(self, x):
        seq_length = tf.shape(x)[1]
        return x + self.positional_encoding[:seq_length, :]

    def get_config(self):
        config = super().get_config()
        config.update({
            'max_seq_length': self.max_seq_length,
            'embed_dim': self.embed_dim
        })
        return config

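# The layer above implements the standard sinusoidal encoding from
# "Attention Is All You Need":
#
#   PE(pos, 2i)   = sin(pos / 10000^(2i / d_model))
#   PE(pos, 2i+1) = cos(pos / 10000^(2i / d_model))
#
# Each embedding dimension oscillates at a different wavelength, so relative
# positions become recoverable without any learned parameters.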

class TransformerBlock(layers.Layer):
    """Transformer decoder block"""

    def __init__(self, embed_dim, num_heads, ff_dim, dropout_rate=0.1, **kwargs):
        super().__init__(**kwargs)
        self.embed_dim = embed_dim
        self.num_heads = num_heads
        self.ff_dim = ff_dim
        self.dropout_rate = dropout_rate

        self.attention = layers.MultiHeadAttention(
            num_heads=num_heads,
            key_dim=embed_dim // num_heads,
            dropout=dropout_rate
        )
        self.ffn = keras.Sequential([
            layers.Dense(ff_dim, activation='gelu'),
            layers.Dropout(dropout_rate),
            layers.Dense(embed_dim)
        ])
        self.layernorm1 = layers.LayerNormalization(epsilon=1e-6)
        self.layernorm2 = layers.LayerNormalization(epsilon=1e-6)
        self.dropout1 = layers.Dropout(dropout_rate)
        self.dropout2 = layers.Dropout(dropout_rate)

    def causal_attention_mask(self, seq_length):
        """Create causal mask for autoregressive attention"""
        mask = tf.linalg.band_part(tf.ones((seq_length, seq_length)), -1, 0)
        return mask

    def call(self, x, training=False):
        seq_length = tf.shape(x)[1]
        causal_mask = self.causal_attention_mask(seq_length)

        # Self-attention with causal mask
        attention_output = self.attention(
            query=x,
            value=x,
            key=x,
            attention_mask=causal_mask,
            training=training
        )
        attention_output = self.dropout1(attention_output, training=training)
        x = self.layernorm1(x + attention_output)

        # Feed-forward network
        ffn_output = self.ffn(x)
        ffn_output = self.dropout2(ffn_output, training=training)
        x = self.layernorm2(x + ffn_output)

        return x

    def get_config(self):
        config = super().get_config()
        config.update({
            'embed_dim': self.embed_dim,
            'num_heads': self.num_heads,
            'ff_dim': self.ff_dim,
            'dropout_rate': self.dropout_rate
        })
        return config

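# causal_attention_mask() returns a lower-triangular matrix; for
# seq_length = 4 it is
#
#   [[1, 0, 0, 0],
#    [1, 1, 0, 0],
#    [1, 1, 1, 0],
#    [1, 1, 1, 1]]
#
# so position t may only attend to positions <= t. Keras's
# MultiHeadAttention broadcasts this (T, T) mask across the batch and head
# dimensions.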

# ============================================================
# VISIBLE LLM MODEL
# ============================================================

class VisibleLLM:
    """Visible Language Model"""

    def __init__(self, config=None):
        self.config = config or VisibleConfig()
        self.tokenizer = None
        self.model = None
        self.history = None

    def build_model(self, vocab_size=None):
        """Build the Transformer model"""
        vocab_size = vocab_size or self.config.VOCAB_SIZE

        print(f"\n{'='*50}")
        print(f"Building {self.config.MODEL_NAME} LLM")
        print(f"{'='*50}")

        # Input layer
        inputs = layers.Input(shape=(None,), dtype=tf.int32, name="input_ids")

        # Token embedding
        token_embedding = layers.Embedding(
            input_dim=vocab_size,
            output_dim=self.config.EMBEDDING_DIM,
            name="token_embedding"
        )(inputs)

        # Positional encoding
        x = PositionalEncoding(
            self.config.MAX_SEQ_LENGTH,
            self.config.EMBEDDING_DIM,
            name="positional_encoding"
        )(token_embedding)

        # Dropout
        x = layers.Dropout(self.config.DROPOUT_RATE)(x)

        # Transformer blocks
        for i in range(self.config.NUM_LAYERS):
            x = TransformerBlock(
                embed_dim=self.config.EMBEDDING_DIM,
                num_heads=self.config.NUM_HEADS,
                ff_dim=self.config.FF_DIM,
                dropout_rate=self.config.DROPOUT_RATE,
                name=f"transformer_block_{i}"
            )(x)

        # Final layer normalization
        x = layers.LayerNormalization(epsilon=1e-6, name="final_layernorm")(x)

        # Output projection
        outputs = layers.Dense(vocab_size, name="output_projection")(x)

        self.model = keras.Model(inputs=inputs, outputs=outputs, name=self.config.MODEL_NAME)

        # Compile model
        self.model.compile(
            optimizer=keras.optimizers.Adam(learning_rate=self.config.LEARNING_RATE),
            loss=keras.losses.SparseCategoricalCrossentropy(from_logits=True),
            metrics=['accuracy']
        )

        self.model.summary()
        return self.model

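    # Rough parameter budget for the default config (an estimate; the exact
    # count comes from model.summary()): token embedding 10000 * 256 = 2.56M,
    # per block ~4 * 256^2 = 0.26M attention projections plus
    # 2 * 256 * 512 = 0.26M FFN weights, times 6 blocks = ~3.1M, and the
    # output projection 256 * 10000 = 2.56M, i.e. roughly 8-9M parameters.
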
    def load_data(self, file_path=None):
        """Load and preprocess training data"""
        file_path = file_path or self.config.DATA_FILE

        print(f"\nLoading data from {file_path}...")

        if not os.path.exists(file_path):
            raise FileNotFoundError(f"Data file not found: {file_path}")

        with open(file_path, 'r', encoding='utf-8') as f:
            text = f.read()

        # Split into sentences/chunks
        sentences = re.split(r'[.!?]+', text)
        sentences = [s.strip() for s in sentences if len(s.strip()) > 10]

        print(f"Loaded {len(sentences)} text segments")
        return sentences

    def prepare_training_data(self, texts):
        """Prepare data for training"""
        print("\nPreparing training data...")

        # Initialize and fit tokenizer
        self.tokenizer = VisibleTokenizer(vocab_size=self.config.VOCAB_SIZE)
        self.tokenizer.fit(texts)

        # Create training sequences
        input_sequences = []
        target_sequences = []

        for text in texts:
            token_ids = self.tokenizer.encode(
                text,
                max_length=self.config.MAX_SEQ_LENGTH + 1,
                add_special_tokens=True
            )

            if len([t for t in token_ids if t != 0]) > 3:  # Skip very short sequences
                input_sequences.append(token_ids[:-1])
                target_sequences.append(token_ids[1:])

        X = np.array(input_sequences)
        y = np.array(target_sequences)

        print(f"Training samples: {len(X)}")
        print(f"Input shape: {X.shape}")
        print(f"Target shape: {y.shape}")

        return X, y

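    # The slicing above is the usual next-token shift. For a tokenized
    # segment [<START>, the, hymn, begins, <END>]:
    #   input  = [<START>, the, hymn, begins]
    #   target = [the, hymn, begins, <END>]
    # so every position is trained to predict its successor. Note that <PAD>
    # positions still contribute to the loss as written; masking them out
    # (e.g. with sample weights) would be a possible refinement.
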
    def train(self, data_file=None, epochs=None, batch_size=None):
        """Train the model"""
        epochs = epochs or self.config.EPOCHS
        batch_size = batch_size or self.config.BATCH_SIZE

        # Load and prepare data
        texts = self.load_data(data_file)
        X, y = self.prepare_training_data(texts)

        # Build model
        self.build_model(vocab_size=len(self.tokenizer))

        # Create model directory
        os.makedirs(self.config.MODEL_DIR, exist_ok=True)

        # Callbacks
        callbacks = [
            keras.callbacks.ModelCheckpoint(
                filepath=self.config.MODEL_PATH,
                save_best_only=True,
                monitor='loss',
                mode='min'
            ),
            keras.callbacks.EarlyStopping(
                monitor='loss',
                patience=5,
                restore_best_weights=True
            ),
            keras.callbacks.ReduceLROnPlateau(
                monitor='loss',
                factor=0.5,
                patience=3,
                min_lr=1e-7
            ),
            keras.callbacks.TensorBoard(
                log_dir=f'logs/{datetime.now().strftime("%Y%m%d-%H%M%S")}'
            )
        ]

        print(f"\n{'='*50}")
        print(f"Training {self.config.MODEL_NAME}")
        print(f"{'='*50}")
        print(f"Epochs: {epochs}")
        print(f"Batch Size: {batch_size}")
        print(f"{'='*50}\n")

        # Train
        self.history = self.model.fit(
            X, y,
            epochs=epochs,
            batch_size=batch_size,
            callbacks=callbacks,
            validation_split=0.1
        )

        # Save tokenizer
        self.tokenizer.save(self.config.TOKENIZER_PATH)

        # Save config
        self.save_config()

        print(f"\n{'='*50}")
        print(f"Training Complete!")
        print(f"Model saved to: {self.config.MODEL_PATH}")
        print(f"Tokenizer saved to: {self.config.TOKENIZER_PATH}")
        print(f"{'='*50}\n")

        return self.history

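    # Portability note: MODEL_PATH has no file extension, which under TF 2.x
    # Keras makes ModelCheckpoint write the SavedModel directory format.
    # Keras 3 instead requires an explicit ".keras" or ".h5" suffix, so the
    # path may need adjusting depending on the installed version.
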
    def save_config(self):
        """Save model configuration"""
        config_dict = {
            'model_name': self.config.MODEL_NAME,
            'version': self.config.VERSION,
            'vocab_size': len(self.tokenizer),
            'embedding_dim': self.config.EMBEDDING_DIM,
            'num_heads': self.config.NUM_HEADS,
            'num_layers': self.config.NUM_LAYERS,
            'ff_dim': self.config.FF_DIM,
            'max_seq_length': self.config.MAX_SEQ_LENGTH,
            'trained_on': datetime.now().isoformat()
        }

        with open(self.config.CONFIG_PATH, 'w') as f:
            json.dump(config_dict, f, indent=2)

    def load_model(self, model_path=None, tokenizer_path=None):
        """Load a trained model"""
        model_path = model_path or self.config.MODEL_PATH
        tokenizer_path = tokenizer_path or self.config.TOKENIZER_PATH

        print(f"Loading model from {model_path}...")

        # Load tokenizer
        self.tokenizer = VisibleTokenizer()
        self.tokenizer.load(tokenizer_path)

        # Load model with custom objects
        custom_objects = {
            'PositionalEncoding': PositionalEncoding,
            'TransformerBlock': TransformerBlock
        }

        self.model = keras.models.load_model(model_path, custom_objects=custom_objects)
        print("Model loaded successfully!")

        return self

    def generate(self, prompt, max_length=100, temperature=0.7, top_k=50, top_p=0.9):
        """Generate text from a prompt"""
        if self.model is None or self.tokenizer is None:
            raise ValueError("Model not loaded. Call load_model() first.")

        # Encode prompt
        input_ids = self.tokenizer.encode(prompt, add_special_tokens=True)
        input_ids = input_ids[:-1]  # Remove end token for generation

        generated_ids = list(input_ids)

        for _ in range(max_length):
            # Prepare input
            current_input = np.array([generated_ids[-self.config.MAX_SEQ_LENGTH:]])

            # Get predictions
            predictions = self.model.predict(current_input, verbose=0)
            next_token_logits = predictions[0, -1, :]

            # Apply temperature
            next_token_logits = next_token_logits / temperature

            # Apply top-k filtering
            if top_k > 0:
                indices_to_remove = np.argsort(next_token_logits)[:-top_k]
                next_token_logits[indices_to_remove] = float('-inf')

            # Apply top-p (nucleus) filtering
            if top_p < 1.0:
                sorted_indices = np.argsort(next_token_logits)[::-1]
                sorted_logits = next_token_logits[sorted_indices]
                cumulative_probs = np.cumsum(tf.nn.softmax(sorted_logits).numpy())

                sorted_indices_to_remove = cumulative_probs > top_p
                sorted_indices_to_remove[1:] = sorted_indices_to_remove[:-1].copy()
                sorted_indices_to_remove[0] = False

                indices_to_remove = sorted_indices[sorted_indices_to_remove]
                next_token_logits[indices_to_remove] = float('-inf')

            # Sample from distribution (renormalized in float64 so tiny
            # softmax rounding errors don't trip np.random.choice's
            # sum-to-one check)
            probs = tf.nn.softmax(next_token_logits).numpy().astype(np.float64)
            probs /= probs.sum()
            next_token_id = np.random.choice(len(probs), p=probs)

            # Stop if end token
            if next_token_id == self.tokenizer.end_token_id:
                break

            generated_ids.append(next_token_id)

        # Decode generated text
        generated_text = self.tokenizer.decode(generated_ids, skip_special_tokens=True)

        return generated_text

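    # Worked sampling example (illustrative numbers): suppose, after the
    # temperature division, the softmax over four surviving tokens is
    # [0.5, 0.3, 0.15, 0.05]. The cumulative sums are [0.5, 0.8, 0.95, 1.0];
    # with top_p = 0.9 the mask (cumsum > 0.9) is [F, F, T, T], and the
    # one-position shift keeps the first token that crosses the threshold,
    # so only the 0.05 token is dropped before renormalizing and sampling.
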
    def chat(self, user_input, max_length=100, temperature=0.7):
        """Interactive chat with the model"""
        response = self.generate(
            prompt=user_input,
            max_length=max_length,
            temperature=temperature
        )
        return response


# ============================================================
# FLASK WEB APPLICATION
# ============================================================

app = Flask(__name__)
visible_llm = None

# HTML Template
HTML_TEMPLATE = """
<!DOCTYPE html>
<html lang="en">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Visible LLM</title>
    <style>
        * {
            margin: 0;
            padding: 0;
            box-sizing: border-box;
        }

        body {
            font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
            background: linear-gradient(135deg, #1a1a2e 0%, #16213e 100%);
            min-height: 100vh;
            color: #fff;
        }

        .container {
            max-width: 900px;
            margin: 0 auto;
            padding: 20px;
        }

        header {
            text-align: center;
            padding: 40px 0;
        }

        h1 {
            font-size: 3em;
            background: linear-gradient(90deg, #00d2ff, #3a7bd5);
            -webkit-background-clip: text;
            -webkit-text-fill-color: transparent;
            margin-bottom: 10px;
        }

        .subtitle {
            color: #888;
            font-size: 1.1em;
        }

        .chat-container {
            background: rgba(255, 255, 255, 0.05);
            border-radius: 20px;
            padding: 30px;
            margin-top: 20px;
            backdrop-filter: blur(10px);
            border: 1px solid rgba(255, 255, 255, 0.1);
        }

        .messages {
            height: 400px;
            overflow-y: auto;
            padding: 20px;
            margin-bottom: 20px;
            border-radius: 15px;
            background: rgba(0, 0, 0, 0.3);
        }

        .message {
            margin-bottom: 15px;
            padding: 15px 20px;
            border-radius: 15px;
            max-width: 80%;
            animation: fadeIn 0.3s ease;
        }

        @keyframes fadeIn {
            from { opacity: 0; transform: translateY(10px); }
            to { opacity: 1; transform: translateY(0); }
        }

        .user-message {
            background: linear-gradient(135deg, #3a7bd5, #00d2ff);
            margin-left: auto;
            text-align: right;
        }

        .bot-message {
            background: rgba(255, 255, 255, 0.1);
            margin-right: auto;
        }

        .input-area {
            display: flex;
            gap: 15px;
        }

        #userInput {
            flex: 1;
            padding: 15px 20px;
            border: none;
            border-radius: 15px;
            background: rgba(255, 255, 255, 0.1);
            color: #fff;
            font-size: 1em;
            outline: none;
            transition: all 0.3s ease;
        }

        #userInput:focus {
            background: rgba(255, 255, 255, 0.15);
            box-shadow: 0 0 20px rgba(0, 210, 255, 0.2);
        }

        #userInput::placeholder {
            color: #888;
        }

        button {
            padding: 15px 30px;
            border: none;
            border-radius: 15px;
            background: linear-gradient(135deg, #3a7bd5, #00d2ff);
            color: #fff;
            font-size: 1em;
            cursor: pointer;
            transition: all 0.3s ease;
        }

        button:hover {
            transform: translateY(-2px);
            box-shadow: 0 10px 30px rgba(0, 210, 255, 0.3);
        }

        button:disabled {
            opacity: 0.5;
            cursor: not-allowed;
            transform: none;
        }

        .settings {
            display: grid;
            grid-template-columns: repeat(auto-fit, minmax(150px, 1fr));
            gap: 15px;
            margin-bottom: 20px;
            padding: 20px;
            background: rgba(0, 0, 0, 0.2);
            border-radius: 15px;
        }

        .setting-group {
            display: flex;
            flex-direction: column;
            gap: 5px;
        }

        .setting-group label {
            font-size: 0.9em;
            color: #888;
        }

        .setting-group input[type="range"] {
            width: 100%;
        }

        .setting-value {
            text-align: center;
            font-size: 0.9em;
            color: #00d2ff;
        }

        .status {
            text-align: center;
            padding: 10px;
            border-radius: 10px;
            margin-bottom: 20px;
        }

        .status.ready {
            background: rgba(0, 255, 0, 0.1);
            color: #00ff00;
        }

        .status.loading {
            background: rgba(255, 255, 0, 0.1);
            color: #ffff00;
        }

        .status.error {
            background: rgba(255, 0, 0, 0.1);
            color: #ff0000;
        }

        .loading-spinner {
            display: inline-block;
            width: 20px;
            height: 20px;
            border: 2px solid #fff;
            border-radius: 50%;
            border-top-color: transparent;
            animation: spin 1s linear infinite;
        }

        @keyframes spin {
            to { transform: rotate(360deg); }
        }
    </style>
</head>
<body>
    <div class="container">
        <header>
            <h1>🔮 Visible</h1>
            <p class="subtitle">Intelligent Language Model powered by TensorFlow</p>
        </header>

        <div class="chat-container">
            <div id="status" class="status loading">Checking model status...</div>

            <div class="settings">
                <div class="setting-group">
                    <label>Temperature</label>
                    <input type="range" id="temperature" min="0.1" max="2" step="0.1" value="0.7">
                    <span class="setting-value" id="tempValue">0.7</span>
                </div>
                <div class="setting-group">
                    <label>Max Length</label>
                    <input type="range" id="maxLength" min="10" max="200" step="10" value="100">
                    <span class="setting-value" id="lengthValue">100</span>
                </div>
                <div class="setting-group">
                    <label>Top-K</label>
                    <input type="range" id="topK" min="1" max="100" step="1" value="50">
                    <span class="setting-value" id="topKValue">50</span>
                </div>
                <div class="setting-group">
                    <label>Top-P</label>
                    <input type="range" id="topP" min="0.1" max="1" step="0.1" value="0.9">
                    <span class="setting-value" id="topPValue">0.9</span>
                </div>
            </div>

            <div class="messages" id="messages">
                <div class="message bot-message">
                    Hello! I am Visible, your AI assistant. Ask me anything!
                </div>
            </div>

            <div class="input-area">
                <input type="text" id="userInput" placeholder="Type your message..." autocomplete="off">
                <button id="sendBtn" onclick="sendMessage()">Send</button>
            </div>
        </div>
    </div>

    <script>
        // Keep each slider's value display in sync with its input
        document.getElementById('temperature').addEventListener('input', function() {
            document.getElementById('tempValue').textContent = this.value;
        });
        document.getElementById('maxLength').addEventListener('input', function() {
            document.getElementById('lengthValue').textContent = this.value;
        });
        document.getElementById('topK').addEventListener('input', function() {
            document.getElementById('topKValue').textContent = this.value;
        });
        document.getElementById('topP').addEventListener('input', function() {
            document.getElementById('topPValue').textContent = this.value;
        });

        // Check status
        async function checkStatus() {
            try {
                const response = await fetch('/api/status');
                const data = await response.json();
                const statusEl = document.getElementById('status');

                if (data.model_loaded) {
                    statusEl.className = 'status ready';
                    statusEl.textContent = '✓ Model Ready - ' + data.model_name;
                } else {
                    statusEl.className = 'status error';
                    statusEl.textContent = '✗ Model not loaded. Please train the model first.';
                }
            } catch (e) {
                document.getElementById('status').className = 'status error';
                document.getElementById('status').textContent = '✗ Server connection failed';
            }
        }

        checkStatus();

        // Send message
        async function sendMessage() {
            const input = document.getElementById('userInput');
            const message = input.value.trim();

            if (!message) return;

            const messagesDiv = document.getElementById('messages');
            const sendBtn = document.getElementById('sendBtn');

            // Add user message
            messagesDiv.innerHTML += `<div class="message user-message">${message}</div>`;
            input.value = '';

            // Disable button and show loading
            sendBtn.disabled = true;
            sendBtn.innerHTML = '<span class="loading-spinner"></span>';

            // Scroll to bottom
            messagesDiv.scrollTop = messagesDiv.scrollHeight;

            try {
                const response = await fetch('/api/generate', {
                    method: 'POST',
                    headers: { 'Content-Type': 'application/json' },
                    body: JSON.stringify({
                        prompt: message,
                        max_length: parseInt(document.getElementById('maxLength').value),
                        temperature: parseFloat(document.getElementById('temperature').value),
                        top_k: parseInt(document.getElementById('topK').value),
                        top_p: parseFloat(document.getElementById('topP').value)
                    })
                });

                const data = await response.json();

                if (data.success) {
                    messagesDiv.innerHTML += `<div class="message bot-message">${data.response}</div>`;
                } else {
                    messagesDiv.innerHTML += `<div class="message bot-message" style="color: #ff6b6b">Error: ${data.error}</div>`;
                }
            } catch (e) {
                messagesDiv.innerHTML += `<div class="message bot-message" style="color: #ff6b6b">Error: Failed to connect to server</div>`;
            }

            // Re-enable button
            sendBtn.disabled = false;
            sendBtn.innerHTML = 'Send';

            // Scroll to bottom
            messagesDiv.scrollTop = messagesDiv.scrollHeight;
        }

        // Handle Enter key
        document.getElementById('userInput').addEventListener('keypress', function(e) {
            if (e.key === 'Enter') {
                sendMessage();
            }
        });
    </script>
</body>
</html>
"""


@app.route('/')
def home():
    """Render the main chat interface"""
    return render_template_string(HTML_TEMPLATE)


@app.route('/api/status')
def status():
    """Get model status"""
    global visible_llm
    return jsonify({
        'model_loaded': visible_llm is not None and visible_llm.model is not None,
        'model_name': VisibleConfig.MODEL_NAME,
        'version': VisibleConfig.VERSION
    })


@app.route('/api/generate', methods=['POST'])
def generate():
    """Generate text from prompt"""
    global visible_llm

    if visible_llm is None or visible_llm.model is None:
        return jsonify({
            'success': False,
            'error': 'Model not loaded. Please train the model first.'
        })

    try:
        data = request.json
        prompt = data.get('prompt', '')
        max_length = data.get('max_length', 100)
        temperature = data.get('temperature', 0.7)
        top_k = data.get('top_k', 50)
        top_p = data.get('top_p', 0.9)

        response = visible_llm.generate(
            prompt=prompt,
            max_length=max_length,
            temperature=temperature,
            top_k=top_k,
            top_p=top_p
        )

        return jsonify({
            'success': True,
            'response': response,
            'prompt': prompt
        })

    except Exception as e:
        return jsonify({
            'success': False,
            'error': str(e)
        })

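# Example request against the endpoint above, assuming the server runs on
# the default port 5000 (the response fields mirror the jsonify() calls):
#
#   curl -X POST http://localhost:5000/api/generate \
#        -H "Content-Type: application/json" \
#        -d '{"prompt": "the hymn", "max_length": 50, "temperature": 0.7}'
#
#   -> {"success": true, "prompt": "the hymn", "response": "..."}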

@app.route('/api/train', methods=['POST'])
def train_model():
    """Train the model (API endpoint)"""
    global visible_llm

    try:
        data = request.json or {}
        epochs = data.get('epochs', 50)
        batch_size = data.get('batch_size', 32)

        visible_llm = VisibleLLM()
        visible_llm.train(epochs=epochs, batch_size=batch_size)

        return jsonify({
            'success': True,
            'message': 'Training complete!'
        })

    except Exception as e:
        return jsonify({
            'success': False,
            'error': str(e)
        })


# ============================================================
# COMMAND LINE INTERFACE
# ============================================================

def main():
    """Main entry point"""
    import argparse

    parser = argparse.ArgumentParser(description='Visible LLM - Language Model')
    parser.add_argument('--train', action='store_true', help='Train the model')
    parser.add_argument('--serve', action='store_true', help='Start web server')
    parser.add_argument('--chat', action='store_true', help='Interactive chat mode')
    parser.add_argument('--epochs', type=int, default=50, help='Number of training epochs')
    parser.add_argument('--batch-size', type=int, default=32, help='Batch size')
    parser.add_argument('--data', type=str, default='veda.txt', help='Training data file')
    parser.add_argument('--port', type=int, default=5000, help='Server port')

    args = parser.parse_args()

    global visible_llm

    if args.train:
        print("\n" + "="*60)
        print("VISIBLE LLM - TRAINING MODE")
        print("="*60 + "\n")

        visible_llm = VisibleLLM()
        VisibleConfig.DATA_FILE = args.data
        visible_llm.train(epochs=args.epochs, batch_size=args.batch_size)

    elif args.chat:
        print("\n" + "="*60)
        print("VISIBLE LLM - CHAT MODE")
        print("="*60 + "\n")

        visible_llm = VisibleLLM()
        visible_llm.load_model()

        print("Chat with Visible (type 'quit' to exit)\n")

        while True:
            user_input = input("You: ").strip()
            if user_input.lower() in ['quit', 'exit', 'q']:
                print("Goodbye!")
                break

            if user_input:
                response = visible_llm.chat(user_input)
                print(f"Visible: {response}\n")

    elif args.serve:
        print("\n" + "="*60)
        print("VISIBLE LLM - WEB SERVER MODE")
        print("="*60 + "\n")

        # Try to load existing model
        visible_llm = VisibleLLM()
        try:
            visible_llm.load_model()
            print("Model loaded successfully!")
        except Exception as e:
            print(f"Could not load model: {e}")
            print("Please train the model first with: python app.py --train")
            visible_llm = None

        print(f"\nStarting server on http://localhost:{args.port}")
        app.run(host='0.0.0.0', port=args.port, debug=False)

    else:
        # Default: show help
        parser.print_help()
        print("\n" + "="*60)
        print("QUICK START:")
        print("="*60)
        print("1. Train the model: python app.py --train --data veda.txt")
        print("2. Start web server: python app.py --serve")
        print("3. Interactive chat: python app.py --chat")
        print("="*60 + "\n")


if __name__ == '__main__':
    main()