Or4cl3-2 committed on
Commit
b2be7e9
·
verified ·
1 Parent(s): ef57b75

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +717 -137
app.py CHANGED
@@ -1059,7 +1059,571 @@ What would you like to do?"""
1059
  history.append((user_msg, bot_msg))
1060
  return history
1061
 
1062
- repo_chat = RepositoryChat()# ==================== GRADIO INTERFACE ====================
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1063
 
1064
  def create_gradio_interface():
1065
  agent = ArchitechAgent()
@@ -1236,6 +1800,157 @@ def create_gradio_interface():
1236
  outputs=test_output
1237
  )
1238
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1239
  # Repository Chat Tab
1240
  with gr.Tab("💬 Repository Chat"):
1241
  gr.Markdown("""
@@ -1315,139 +2030,4 @@ def create_gradio_interface():
1315
  history.append((message, bot_response))
1316
  return history, ""
1317
 
1318
- send_btn.click(
1319
- fn=chat_respond,
1320
- inputs=[chat_input, chatbot],
1321
- outputs=[chatbot, chat_input]
1322
- )
1323
-
1324
- chat_input.submit(
1325
- fn=chat_respond,
1326
- inputs=[chat_input, chatbot],
1327
- outputs=[chatbot, chat_input]
1328
- )
1329
-
1330
- # Model Management Tab
1331
- with gr.Tab("💾 Model Management"):
1332
- gr.Markdown("""
1333
- ### Manage Your Models
1334
- Upload, download, and organize your trained models
1335
- """)
1336
-
1337
- with gr.Row():
1338
- # Upload Section
1339
- with gr.Column():
1340
- gr.Markdown("### 📤 Upload Model")
1341
-
1342
- upload_file = gr.File(
1343
- label="Upload Model ZIP",
1344
- file_types=[".zip"],
1345
- type="filepath"
1346
- )
1347
-
1348
- upload_btn = gr.Button("📦 Extract and Save", variant="primary")
1349
- upload_output = gr.Markdown()
1350
-
1351
- upload_btn.click(
1352
- fn=model_manager.extract_model_zip,
1353
- inputs=[upload_file],
1354
- outputs=upload_output
1355
- )
1356
-
1357
- # Download Section
1358
- with gr.Column():
1359
- gr.Markdown("### 📥 Download Model")
1360
-
1361
- model_path_input = gr.Textbox(
1362
- label="Model Path",
1363
- placeholder="e.g., ./trained_my-model",
1364
- info="Path to the model directory"
1365
- )
1366
-
1367
- model_name_input = gr.Textbox(
1368
- label="Archive Name",
1369
- placeholder="e.g., my-awesome-model",
1370
- info="Name for the zip file"
1371
- )
1372
-
1373
- download_btn = gr.Button("📦 Create ZIP", variant="primary")
1374
- download_file = gr.File(label="Download")
1375
- download_output = gr.Markdown()
1376
-
1377
- def create_and_return_zip(model_path, model_name):
1378
- zip_path, message = model_manager.create_model_zip(model_path, model_name)
1379
- return zip_path, message
1380
-
1381
- download_btn.click(
1382
- fn=create_and_return_zip,
1383
- inputs=[model_path_input, model_name_input],
1384
- outputs=[download_file, download_output]
1385
- )
1386
-
1387
- gr.Markdown("---")
1388
-
1389
- # List Models
1390
- with gr.Row():
1391
- with gr.Column():
1392
- gr.Markdown("### 📋 Your Models")
1393
- refresh_btn = gr.Button("🔄 Refresh List", variant="secondary")
1394
- models_list = gr.Markdown()
1395
-
1396
- refresh_btn.click(
1397
- fn=model_manager.list_local_models,
1398
- outputs=models_list
1399
- )
1400
-
1401
- with gr.Column():
1402
- gr.Markdown("### 🗑️ Delete Model")
1403
- delete_path = gr.Textbox(
1404
- label="Model Path to Delete",
1405
- placeholder="e.g., ./trained_my-model"
1406
- )
1407
- delete_btn = gr.Button("🗑️ Delete", variant="stop")
1408
- delete_output = gr.Markdown()
1409
-
1410
- delete_btn.click(
1411
- fn=model_manager.delete_model,
1412
- inputs=[delete_path],
1413
- outputs=delete_output
1414
- )
1415
-
1416
- gr.Markdown("""
1417
- ### 💡 Tips:
1418
- - Upload model zips from backups or other systems
1419
- - Download models as portable archives
1420
- - Keep your workspace organized
1421
- - Always backup before deleting!
1422
- """)
1423
-
1424
- # About
1425
- with gr.Tab("ℹ️ About"):
1426
- gr.Markdown("""
1427
- ## 🏗️ Architech - Your AI Model Architect
1428
-
1429
- ### Features:
1430
- - 🎨 **Generate Synthetic Data**: No training data? No problem!
1431
- - 🚀 **Train Custom Models**: Fine-tune models for your specific needs
1432
- - 🧪 **Test Your Models**: Load and test your models instantly
1433
- - ⚡ **Rate Limited**: Fair usage for all users
1434
- - 🔒 **Secure**: Token-based authentication
1435
-
1436
- ### How to Use:
1437
- 1. Generate synthetic training data for your task
1438
- 2. Train a custom model with your data
1439
- 3. Test and deploy your model!
1440
-
1441
- ### Rate Limits:
1442
- - Dataset Generation: 10 per hour
1443
- - Model Training: 3 per hour
1444
- - Model Inference: 50 per hour
1445
-
1446
- *Built with ❤️ using Gradio, Transformers, and HuggingFace*
1447
- """)
1448
-
1449
- return demo
1450
-
1451
- if __name__ == "__main__":
1452
- demo = create_gradio_interface()
1453
- demo.launch()
 
1059
  history.append((user_msg, bot_msg))
1060
  return history
1061
 
1062
# Single shared chat-over-repository helper used by the Gradio UI.
repo_chat = RepositoryChat()

# ==================== MODEL CARD & PAPER GENERATOR ====================
1063
+
1064
class DocumentationGenerator:
    """Generate model cards and research-paper write-ups for trained models.

    Documents are rendered from f-string templates and saved as Markdown
    files under ``./generated_docs``.
    """

    def __init__(self):
        # Output directory for all generated documents; created eagerly so
        # later writes cannot fail on a missing folder.
        self.templates_dir = Path("./generated_docs")
        self.templates_dir.mkdir(exist_ok=True)

    def generate_model_card(
        self,
        model_name: str,
        task_description: str,
        base_model: str,
        dataset_size: int,
        training_params: Dict[str, Any],
        domain: str = "general",
        intended_use: str = "",
        limitations: str = "",
        ethical_considerations: str = ""
    ) -> Tuple[str, str]:
        """Generate a comprehensive model card following HuggingFace standards.

        Args:
            model_name: Name of the fine-tuned model.
            task_description: Human-readable description of the model's task.
            base_model: Identifier of the base model that was fine-tuned.
            dataset_size: Number of training examples.
            training_params: Hyperparameters; keys like ``epochs``,
                ``learning_rate``, ``batch_size`` are read with ``.get`` so
                any may be absent.
            domain: Domain tag used in the card's metadata and prose.
            intended_use, limitations, ethical_considerations: Optional
                user-supplied text; when empty, sensible defaults are used.

        Returns:
            Tuple of (model card markdown text, path of the saved file).
            NOTE: the original annotation said ``str`` but the code has
            always returned a 2-tuple; the annotation is corrected here.
        """
        timestamp = datetime.now().strftime("%Y-%m-%d")

        model_card = f"""---
language: en
license: mit
tags:
- text-generation
- custom-model
- architech
- {domain}
datasets:
- synthetic-data
metrics:
- perplexity
model-index:
- name: {model_name}
  results: []
---

# {model_name}

## Model Description

**{model_name}** is a fine-tuned language model created using Architech AI Model Architect.

### Model Details

- **Developed by:** Architech User
- **Model type:** Causal Language Model
- **Language(s):** English
- **Base Model:** {base_model}
- **License:** MIT
- **Finetuned from:** {base_model}

### Model Purpose

{task_description}

## Training Details

### Training Data

This model was trained on a synthetic dataset specifically generated for this task:

- **Dataset Size:** {dataset_size} examples
- **Domain:** {domain.title()}
- **Data Generation:** Architech Synthetic Data Generator
- **Data Format:** Conversational pairs / Instruction-response format

The training data was synthetically generated to ensure:
- Domain-specific vocabulary and concepts
- Natural language variations
- Task-relevant examples
- Ethical and unbiased content

### Training Procedure

**Training Hyperparameters:**

- **Base Model:** {base_model}
- **Training Examples:** {dataset_size}
- **Epochs:** {training_params.get('epochs', 'N/A')}
- **Learning Rate:** {training_params.get('learning_rate', 'N/A')}
- **Batch Size:** {training_params.get('batch_size', 'N/A')}
- **Gradient Accumulation Steps:** {training_params.get('gradient_accumulation', 4)}
- **Optimizer:** AdamW
- **Training Precision:** FP16 (if GPU available)

**Training Infrastructure:**

- **Framework:** HuggingFace Transformers
- **Training Tool:** Architech AI Model Architect
- **Hardware:** {training_params.get('hardware', 'GPU/CPU auto-detected')}

## Intended Use

### Direct Use

{intended_use if intended_use else f'''This model is designed for {task_description.lower()}. It can be used directly for:

- Text generation in the {domain} domain
- Conversational AI applications
- Task-specific completion and assistance
- Research and experimentation'''}

### Downstream Use

This model can be further fine-tuned for:
- More specialized tasks within the {domain} domain
- Multi-turn conversations
- Domain-specific applications

### Out-of-Scope Use

This model should NOT be used for:
- Medical, legal, or financial advice without human oversight
- Safety-critical applications
- Decision-making without human review
- Generating harmful, biased, or unethical content

## Bias, Risks, and Limitations

{limitations if limitations else f'''### Known Limitations

- Trained on synthetic data, which may not capture all real-world nuances
- Limited to {dataset_size} training examples
- May produce inconsistent outputs on topics outside training domain
- Should not be considered a source of factual information without verification

### Recommendations

Users should:
- Validate outputs for accuracy and appropriateness
- Not rely solely on this model for critical decisions
- Be aware of potential biases in generated content
- Use human oversight for production applications'''}

## Ethical Considerations

{ethical_considerations if ethical_considerations else '''This model was developed with ethical AI principles in mind:

- Training data was synthetically generated to avoid privacy issues
- No personally identifiable information was used in training
- Content generation should be monitored for potential misuse
- Users are responsible for ensuring ethical use of generated content'''}

## How to Use

### Loading the Model

```python
from transformers import AutoTokenizer, AutoModelForCausalLM

tokenizer = AutoTokenizer.from_pretrained("{model_name}")
model = AutoModelForCausalLM.from_pretrained("{model_name}")

# Generate text
inputs = tokenizer("Your prompt here", return_tensors="pt")
outputs = model.generate(**inputs, max_length=100)
generated_text = tokenizer.decode(outputs[0], skip_special_tokens=True)
print(generated_text)
```

### Using with Pipeline

```python
from transformers import pipeline

generator = pipeline('text-generation', model='{model_name}')
result = generator("Your prompt here", max_length=100)
print(result[0]['generated_text'])
```

## Model Performance

Performance metrics will vary based on specific use case and evaluation criteria.

### Training Loss

Training completed successfully with the model converging appropriately for the given dataset size and complexity.

## Environmental Impact

- **Training Time:** Approximately {training_params.get('training_time', 'varies')} minutes
- **Hardware:** {training_params.get('hardware', 'GPU/CPU')}
- **Carbon Emissions:** Minimal due to efficient training approach

## Technical Specifications

### Model Architecture

Based on {base_model} architecture with task-specific fine-tuning.

### Compute Infrastructure

- **Training Platform:** HuggingFace Spaces / Architech
- **Framework:** PyTorch + Transformers
- **Optimization:** Gradient accumulation for memory efficiency

## Citation

If you use this model, please cite:

```bibtex
@misc{{{model_name.replace('-', '_')},
  author = {{Architech User}},
  title = {{{model_name}}},
  year = {{{datetime.now().year}}},
  publisher = {{HuggingFace}},
  howpublished = {{\\url{{https://huggingface.co/your-username/{model_name}}}}}
}}
```

## Model Card Authors

- Generated by: Architech AI Model Architect
- Date: {timestamp}

## Model Card Contact

For questions or feedback about this model, please open an issue in the model repository.

---

*This model card was automatically generated by Architech AI Model Architect. Please review and customize as needed.*
"""

        # Persist the card; explicit UTF-8 because the template contains
        # non-ASCII characters and the platform default encoding may not
        # be UTF-8 (e.g. Windows cp1252 would raise UnicodeEncodeError).
        card_path = self.templates_dir / f"{model_name}_model_card.md"
        with open(card_path, 'w', encoding='utf-8') as f:
            f.write(model_card)

        return model_card, str(card_path)

    def generate_research_paper(
        self,
        model_name: str,
        task_description: str,
        base_model: str,
        dataset_size: int,
        training_params: Dict[str, Any],
        domain: str = "general",
        methodology_notes: str = "",
        results_summary: str = ""
    ) -> Tuple[str, str]:
        """Generate a research paper documenting the model.

        Args mirror :meth:`generate_model_card`; ``methodology_notes`` and
        ``results_summary`` override the templated sections when non-empty.

        Returns:
            Tuple of (paper markdown text, path of the saved file).
            Annotation corrected from ``str`` — the code returns a 2-tuple.
        """
        timestamp = datetime.now().strftime("%B %Y")

        paper = f"""# Fine-Tuning {base_model} for {task_description}: A Synthetic Data Approach

**Authors:** Architech User
**Date:** {timestamp}
**Model:** {model_name}

---

## Abstract

We present **{model_name}**, a fine-tuned language model specifically designed for {task_description.lower()}.
This work demonstrates the effectiveness of synthetic data generation for domain-specific language model adaptation.
Using {dataset_size} synthetically generated examples, we fine-tuned {base_model} to create a specialized model
for the {domain} domain. Our approach leverages automated data generation techniques to overcome the common challenge
of limited training data availability while maintaining high-quality, task-relevant outputs.

**Keywords:** Language Models, Transfer Learning, Synthetic Data, Fine-Tuning, {domain.title()}, {base_model}

---

## 1. Introduction

### 1.1 Background

Large language models (LLMs) have demonstrated remarkable capabilities across diverse natural language processing tasks.
However, adapting these models to specific domains or tasks often requires substantial amounts of high-quality training data,
which can be expensive, time-consuming, or difficult to obtain while maintaining privacy and ethical standards.

### 1.2 Motivation

The primary motivation for this work is to address the data scarcity problem in domain-specific language model development.
Our specific use case—{task_description.lower()}—requires specialized knowledge and conversational patterns that may not
be adequately represented in general-purpose language models.

### 1.3 Contributions

This work makes the following contributions:

1. **Synthetic Data Generation Framework**: We develop and apply a domain-specific synthetic data generation approach
that creates high-quality training examples without requiring manual annotation.

2. **Efficient Fine-Tuning**: We demonstrate effective fine-tuning of {base_model} using a relatively small dataset
of {dataset_size} examples, showcasing the efficiency of modern transfer learning approaches.

3. **Practical Application**: We provide a complete, production-ready model for {task_description.lower()} that can
be deployed immediately or serve as a foundation for further specialization.

---

## 2. Related Work

### 2.1 Transfer Learning in NLP

Transfer learning has become the dominant paradigm in natural language processing, with pre-trained models like GPT,
BERT, and their variants achieving state-of-the-art results across numerous benchmarks. Our work builds on this
foundation by demonstrating efficient domain adaptation.

### 2.2 Synthetic Data Generation

Recent work has shown that synthetic data can effectively augment or even replace human-annotated data for specific tasks.
Our approach extends these findings to conversational AI and domain-specific language generation.

### 2.3 Domain Adaptation

Domain adaptation techniques allow models trained on one domain to perform well on another. Our work contributes to
this area by combining synthetic data generation with fine-tuning for efficient domain-specific model creation.

---

## 3. Methodology

### 3.1 Base Model Selection

We selected **{base_model}** as our base model for the following reasons:

- **Architecture**: Modern transformer-based architecture with proven generation capabilities
- **Size**: Appropriate balance between capability and computational efficiency
- **Compatibility**: Well-supported by the HuggingFace ecosystem
- **Performance**: Strong baseline performance on general language tasks

### 3.2 Synthetic Data Generation

{methodology_notes if methodology_notes else f'''Our synthetic data generation process consists of several key components:

**Domain Knowledge Base:**
We curated domain-specific vocabulary, concepts, and contexts relevant to the {domain} domain. This knowledge base
includes:
- Key topics and terminology
- Common question-answer patterns
- Domain-specific use cases
- Contextual scenarios

**Template-Based Generation:**
We employed template-based generation with intelligent variable substitution:
- Multiple conversation templates
- Dynamic topic and concept insertion
- Natural language variation
- Context-appropriate responses

**Quality Assurance:**
Each generated example undergoes validation:
- Coherence checking
- Domain relevance verification
- Diversity analysis
- Edge case inclusion'''}

### 3.3 Training Configuration

Our training setup utilized the following hyperparameters:

| Parameter | Value |
|-----------|-------|
| Base Model | {base_model} |
| Training Examples | {dataset_size} |
| Epochs | {training_params.get('epochs', 'N/A')} |
| Learning Rate | {training_params.get('learning_rate', 'N/A')} |
| Batch Size | {training_params.get('batch_size', 'N/A')} |
| Gradient Accumulation | {training_params.get('gradient_accumulation', 4)} steps |
| Optimizer | AdamW |
| Precision | Mixed (FP16) |

**Training Procedure:**

1. **Data Preparation**: Synthetic examples were tokenized using the base model's tokenizer
2. **Model Initialization**: Started from pre-trained {base_model} weights
3. **Fine-Tuning**: Applied supervised fine-tuning with causal language modeling objective
4. **Optimization**: Used gradient accumulation for memory efficiency
5. **Validation**: Monitored training loss for convergence

### 3.4 Implementation Details

Our implementation leverages:
- **Framework**: HuggingFace Transformers
- **Training Tool**: Architech AI Model Architect
- **Infrastructure**: Cloud-based GPU/CPU resources
- **Optimization**: Automatic mixed precision training

---

## 4. Results

### 4.1 Training Outcomes

{results_summary if results_summary else f'''The model successfully converged during training, demonstrating:

- **Stable Training**: Loss decreased consistently across epochs
- **No Overfitting**: Training remained stable without signs of overfitting to the small dataset
- **Efficient Learning**: Model adapted to domain-specific patterns effectively

**Qualitative Observations:**
- Generated text shows strong alignment with the {domain} domain
- Model produces coherent, contextually appropriate responses
- Task-specific vocabulary and concepts are properly utilized
- Conversation flow is natural and relevant to intended use case'''}

### 4.2 Model Capabilities

The fine-tuned model demonstrates:

1. **Domain Expertise**: Strong understanding of {domain}-specific concepts
2. **Task Alignment**: Outputs are well-aligned with {task_description.lower()}
3. **Coherence**: Generated text maintains logical consistency
4. **Flexibility**: Adapts to various prompts within the domain

### 4.3 Limitations

We acknowledge the following limitations:

- **Dataset Size**: With {dataset_size} examples, coverage of edge cases may be limited
- **Synthetic Origin**: Training data may not capture all real-world nuances
- **Domain Specificity**: Performance may degrade on out-of-domain inputs
- **Evaluation**: Comprehensive quantitative evaluation remains future work

---

## 5. Discussion

### 5.1 Effectiveness of Synthetic Data

Our results demonstrate that synthetically generated data can effectively fine-tune language models for specific tasks.
The quality of outputs suggests that carefully designed synthetic data can capture essential patterns needed for
domain adaptation.

### 5.2 Practical Implications

This work has several practical implications:

- **Accessibility**: Reduces barriers to creating custom language models
- **Privacy**: Eliminates need for potentially sensitive real-world data
- **Efficiency**: Enables rapid prototyping and iteration
- **Scalability**: Framework can be applied to diverse domains and tasks

### 5.3 Future Directions

Several promising directions for future work include:

1. **Quantitative Evaluation**: Comprehensive benchmarking against domain-specific metrics
2. **Dataset Scaling**: Investigation of performance vs. dataset size trade-offs
3. **Hybrid Approaches**: Combining synthetic and real data for enhanced performance
4. **Multi-Domain Transfer**: Exploring transfer learning across related domains

---

## 6. Conclusion

We presented **{model_name}**, a fine-tuned language model for {task_description.lower()}, demonstrating the
effectiveness of synthetic data generation for domain-specific model adaptation. Our approach successfully created
a specialized model using {dataset_size} synthetically generated examples, proving that efficient domain adaptation
is achievable without large-scale manual data collection.

The model shows strong task alignment and domain expertise, validating our methodology. This work contributes to
the growing body of evidence that synthetic data, when carefully designed, can serve as an effective alternative
or complement to human-annotated data for language model fine-tuning.

As language models continue to evolve, techniques for efficient, ethical, and accessible model adaptation will
become increasingly important. Our work provides a practical framework for creating custom language models that
can be applied across diverse domains and use cases.

---

## 7. References

1. HuggingFace Transformers: State-of-the-art Natural Language Processing
2. Attention Is All You Need (Vaswani et al., 2017)
3. Language Models are Few-Shot Learners (Brown et al., 2020)
4. Transfer Learning in Natural Language Processing (Ruder, 2019)

---

## Appendix A: Model Architecture

**Base Architecture:** {base_model}

The model inherits the transformer-based architecture of the base model, with all parameters fine-tuned for the
specific task.

## Appendix B: Training Logs

Training completed successfully with stable convergence. Detailed logs available in model repository.

## Appendix C: Code Availability

Model and code are available at: https://huggingface.co/your-username/{model_name}

---

## Acknowledgments

This research was conducted using Architech AI Model Architect, an open-source tool for automated language model
development. We thank the HuggingFace team for providing the infrastructure and tools that made this work possible.

---

**Contact:** For questions about this work, please open an issue in the model repository.

**Date:** {timestamp}
**Version:** 1.0

---

*This paper was automatically generated by Architech AI Model Architect. Please review and customize as needed for publication.*
"""

        # Explicit UTF-8 for the same reason as the model card: the paper
        # text contains em-dashes and other non-ASCII characters.
        paper_path = self.templates_dir / f"{model_name}_research_paper.md"
        with open(paper_path, 'w', encoding='utf-8') as f:
            f.write(paper)

        return paper, str(paper_path)

    def generate_both_documents(
        self,
        model_name: str,
        task_description: str,
        base_model: str,
        dataset_size: int,
        num_epochs: int,
        learning_rate: float,
        batch_size: int,
        domain: str = "general",
        intended_use: str = "",
        limitations: str = "",
        methodology_notes: str = "",
        results_summary: str = "",
        progress=gr.Progress()
    ) -> Tuple[str, str, str, str]:
        """Generate both model card and research paper.

        Wraps :meth:`generate_model_card` and :meth:`generate_research_paper`
        with Gradio progress reporting.

        Returns:
            (model_card_text, model_card_path, paper_text, paper_path).
        """
        progress(0.3, "📝 Generating Model Card...")

        # Flatten the scalar hyperparameters into the dict shape the two
        # template renderers expect. gradient_accumulation/hardware are
        # fixed values not exposed through this convenience entry point.
        training_params = {
            'epochs': num_epochs,
            'learning_rate': learning_rate,
            'batch_size': batch_size,
            'gradient_accumulation': 4,
            'hardware': 'GPU/CPU (auto-detected)'
        }

        model_card, card_path = self.generate_model_card(
            model_name, task_description, base_model, dataset_size,
            training_params, domain, intended_use, limitations
        )

        progress(0.7, "📄 Generating Research Paper...")

        paper, paper_path = self.generate_research_paper(
            model_name, task_description, base_model, dataset_size,
            training_params, domain, methodology_notes, results_summary
        )

        progress(1.0, "✅ Documentation Generated!")

        return model_card, card_path, paper, paper_path
1625
+
1626
# Single shared documentation generator used by the Gradio UI.
doc_generator = DocumentationGenerator()

# ==================== GRADIO INTERFACE ====================
1627
 
1628
  def create_gradio_interface():
1629
  agent = ArchitechAgent()
 
1800
  outputs=test_output
1801
  )
1802
 
1803
+ # Documentation Generation Tab
1804
+ with gr.Tab("📄 Generate Documentation"):
1805
+ gr.Markdown("""
1806
+ ### Generate Professional Model Card & Research Paper
1807
+ Automatically create comprehensive documentation for your models
1808
+ """)
1809
+
1810
+ with gr.Row():
1811
+ with gr.Column():
1812
+ gr.Markdown("### 📋 Model Information")
1813
+
1814
+ doc_model_name = gr.Textbox(
1815
+ label="Model Name",
1816
+ placeholder="my-awesome-model"
1817
+ )
1818
+
1819
+ doc_task_desc = gr.Textbox(
1820
+ label="Task Description",
1821
+ placeholder="Customer support chatbot for technical products",
1822
+ lines=2
1823
+ )
1824
+
1825
+ doc_base_model = gr.Dropdown(
1826
+ choices=["distilgpt2", "gpt2", "microsoft/DialoGPT-small", "other"],
1827
+ label="Base Model",
1828
+ value="distilgpt2"
1829
+ )
1830
+
1831
+ with gr.Row():
1832
+ doc_dataset_size = gr.Number(
1833
+ label="Dataset Size",
1834
+ value=100,
1835
+ precision=0
1836
+ )
1837
+ doc_domain = gr.Dropdown(
1838
+ choices=["technology", "healthcare", "finance", "education", "general"],
1839
+ label="Domain",
1840
+ value="general"
1841
+ )
1842
+
1843
+ with gr.Row():
1844
+ doc_epochs = gr.Number(label="Epochs", value=3, precision=0)
1845
+ doc_lr = gr.Number(label="Learning Rate", value=0.0002)
1846
+ doc_batch = gr.Number(label="Batch Size", value=2, precision=0)
1847
+
1848
+ with gr.Accordion("📝 Optional Details", open=False):
1849
+ doc_intended_use = gr.Textbox(
1850
+ label="Intended Use (optional)",
1851
+ placeholder="Describe specific use cases...",
1852
+ lines=3
1853
+ )
1854
+
1855
+ doc_limitations = gr.Textbox(
1856
+ label="Known Limitations (optional)",
1857
+ placeholder="Describe any known limitations...",
1858
+ lines=3
1859
+ )
1860
+
1861
+ doc_methodology = gr.Textbox(
1862
+ label="Methodology Notes (optional)",
1863
+ placeholder="Additional methodology details...",
1864
+ lines=3
1865
+ )
1866
+
1867
+ doc_results = gr.Textbox(
1868
+ label="Results Summary (optional)",
1869
+ placeholder="Summary of model performance...",
1870
+ lines=3
1871
+ )
1872
+
1873
+ generate_docs_btn = gr.Button("📄 Generate Documentation", variant="primary", size="lg")
1874
+
1875
+ with gr.Column():
1876
+ gr.Markdown("### 📥 Generated Documents")
1877
+
1878
+ doc_status = gr.Markdown("*Generate documents to see preview*")
1879
+
1880
+ with gr.Tabs():
1881
+ with gr.Tab("📋 Model Card"):
1882
+ model_card_output = gr.Markdown()
1883
+ model_card_file = gr.File(label="Download Model Card")
1884
+
1885
+ with gr.Tab("📄 Research Paper"):
1886
+ paper_output = gr.Markdown()
1887
+ paper_file = gr.File(label="Download Research Paper")
1888
+
1889
+ def generate_and_display_docs(
1890
+ name, task, base, size, domain, epochs, lr, batch,
1891
+ intended, limitations, methodology, results, progress=gr.Progress()
1892
+ ):
1893
+ try:
1894
+ model_card, card_path, paper, paper_path = doc_generator.generate_both_documents(
1895
+ name, task, base, int(size), int(epochs), float(lr), int(batch),
1896
+ domain, intended, limitations, methodology, results, progress
1897
+ )
1898
+
1899
+ status = f"""✅ **Documentation Generated Successfully!**
1900
+
1901
+ 📋 **Model Card:** `{Path(card_path).name}`
1902
+ 📄 **Research Paper:** `{Path(paper_path).name}`
1903
+
1904
+ **Files saved to:** `./generated_docs/`
1905
+
1906
+ **What's Next?**
1907
+ 1. Review the documents in the tabs above
1908
+ 2. Download and customize if needed
1909
+ 3. Upload to your model repository on HuggingFace
1910
+ 4. Share with the community!
1911
+ """
1912
+
1913
+ # Truncate for preview
1914
+ card_preview = model_card[:5000] + "\n\n*... (truncated for preview, download for full content)*" if len(model_card) > 5000 else model_card
1915
+ paper_preview = paper[:5000] + "\n\n*... (truncated for preview, download for full content)*" if len(paper) > 5000 else paper
1916
+
1917
+ return status, card_preview, card_path, paper_preview, paper_path
1918
+
1919
+ except Exception as e:
1920
+ error_msg = f"❌ Error generating documentation: {str(e)}"
1921
+ return error_msg, "", None, "", None
1922
+
1923
+ generate_docs_btn.click(
1924
+ fn=generate_and_display_docs,
1925
+ inputs=[
1926
+ doc_model_name, doc_task_desc, doc_base_model,
1927
+ doc_dataset_size, doc_domain, doc_epochs, doc_lr, doc_batch,
1928
+ doc_intended_use, doc_limitations, doc_methodology, doc_results
1929
+ ],
1930
+ outputs=[doc_status, model_card_output, model_card_file, paper_output, paper_file]
1931
+ )
1932
+
1933
+ gr.Markdown("""
1934
+ ---
1935
+ ### 💡 Documentation Tips
1936
+
1937
+ **Model Card:**
1938
+ - Standard format recognized by HuggingFace
1939
+ - Includes model details, training info, and usage examples
1940
+ - Ready to upload to your model repository
1941
+
1942
+ **Research Paper:**
1943
+ - Academic-style documentation
1944
+ - Describes methodology and approach
1945
+ - Great for sharing your work formally
1946
+
1947
+ **Best Practices:**
1948
+ - Fill in optional fields for more detailed documentation
1949
+ - Customize generated docs before publishing
1950
+ - Keep documentation up-to-date with model changes
1951
+ - Include ethical considerations and limitations
1952
+ """)
1953
+
1954
  # Repository Chat Tab
1955
  with gr.Tab("💬 Repository Chat"):
1956
  gr.Markdown("""
 
2030
  history.append((message, bot_response))
2031
  return history, ""
2032
 
2033
+