Spaces:

pangxiang
/

capricode-codefix

Sleeping

App Files Files Community

pangxiang committed on Oct 24, 2025

Commit

2a16183

verified ·

1 Parent(s): 20f5179

Update app.py

Browse files

Files changed (1) hide show

app.py +577 -167

app.py CHANGED Viewed

@@ -1,10 +1,11 @@
 import gradio as gr
 import json
 import os
 from datetime import datetime
 from transformers import pipeline, AutoTokenizer, AutoModelForCausalLM
-class SmartCodeFixer:
     def __init__(self):
         self.feedback_file = "user_feedback.json"
         self.model = None
@@ -15,20 +16,24 @@ class SmartCodeFixer:
     def load_model(self):
         """加载预训练模型"""
         try:
-            # 使用一个较好的代码生成模型
-            model_name = "microsoft/DialoGPT-medium"  # 或者 "codellama/CodeLlama-7b-hf"
             self.tokenizer = AutoTokenizer.from_pretrained(model_name)
             self.model = AutoModelForCausalLM.from_pretrained(model_name)
-            print("模型加载成功!")
         except Exception as e:
-            print(f"模型加载失败: {e}")
             self.model = None
     def load_feedback_data(self):
         """加载用户反馈数据用于学习"""
         if os.path.exists(self.feedback_file):
-            with open(self.feedback_file, 'r', encoding='utf-8') as f:
-                self.feedback_data = json.load(f)
         else:
             self.feedback_data = []
@@ -49,21 +54,25 @@ class SmartCodeFixer:
         with open(self.feedback_file, 'w', encoding='utf-8') as f:
             json.dump(self.feedback_data, f, ensure_ascii=False, indent=2)
-        # 定期重新训练模型（简化版）
-        if len(self.feedback_data) % 10 == 0:  # 每10个反馈重新学习
             self.retrain_from_feedback()
     def detect_language(self, code):
         """智能检测编程语言"""
-        code_lower = code.lower()
         language_indicators = {
-            'html': ['<!doctype', '<html', '<div', '<span', 'class="', 'id="'],
-            'python': ['def ', 'import ', 'print(', 'if __name__', 'lambda '],
-            'javascript': ['function ', 'console.log', 'document.', 'addEventListener'],
-            'java': ['public class', 'public static', 'System.out.println'],
-            'cpp': ['#include', 'using namespace', 'cout <<', 'std::'],
-            'css': ['{', '}', ':', ';', 'font-size', 'color:']
         }
         scores = {lang: 0 for lang in language_indicators}
@@ -73,18 +82,34 @@ class SmartCodeFixer:
                 if indicator in code_lower:
                     scores[lang] += 1
-        return max(scores.items(), key=lambda x: x[1])[0]
     def ai_fix_code(self, code, language):
         """使用AI模型修复代码"""
         if self.model is None:
-            return self.rule_based_fix(code, language)
         try:
-            # 构建修复提示
-            prompt = f"""修复以下{language}代码的错误：
-错误代码:
 ```{language}
 {code}
 """
@@ -92,228 +117,604 @@ class SmartCodeFixer:
             inputs = self.tokenizer.encode(prompt, return_tensors="pt")
             outputs = self.model.generate(
                 inputs,
-                max_length=len(inputs[0]) + 100,
                 num_return_sequences=1,
-                temperature=0.7,
-                do_sample=True
             )
             response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
             # 提取修复后的代码
             if "```" in response:
-                fixed_code = response.split("```")[2].strip()
             else:
                 fixed_code = response.replace(prompt, "").strip()
-            return fixed_code
         except Exception as e:
-            print(f"AI修复失败: {e}")
-            return self.rule_based_fix(code, language)
-    def rule_based_fix(self, code, language):
-        """基于规则的代码修复"""
-        fixes = {
-            'html': self.fix_html,
-            'python': self.fix_python,
-            'javascript': self.fix_javascript,
-            'java': self.fix_java,
-            'cpp': self.fix_cpp,
-            'css': self.fix_css
         }
-        fix_function = fixes.get(language, self.fix_generic)
-        return fix_function(code)
-    def fix_html(self, code):
-        """修复HTML代码"""
         fixes = []
-        # 检查标签闭合
-        if '<div>' in code and '</div>' not in code:
-            code += '\n</div>'
-            fixes.append("添加了缺失的 </div> 标签")
-        # 检查属性引号
-        if 'class=' in code and 'class="' not in code:
-            code = code.replace('class=', 'class="')
-            if '"' not in code[code.find('class="')+7:code.find('class="')+20]:
-                code = code.replace('class="', 'class=""')
-            fixes.append("修复了属性引号")
         # 添加基本的HTML结构
-        if '<!DOCTYPE html>' not in code and '<html>' not in code:
-            code = f"""<!DOCTYPE html>
-<html>
 <head>
     <meta charset="UTF-8">
     <title>Document</title>
 </head>
 <body>
-{code}
 </body>
 </html>"""
-            fixes.append("添加了基本的HTML结构")
-        return code, fixes
-    def fix_python(self, code):
-        """修复Python代码"""
         fixes = []
-        # 修复括号
-        if code.count('(') > code.count(')'):
-            code += ')' * (code.count('(') - code.count(')'))
-            fixes.append("修复了不匹配的括号")
-        # 修复引号
-        if code.count('"') % 2 != 0:
-            code += '"'
-            fixes.append("修复了不匹配的双引号")
-        if code.count("'") % 2 != 0:
-            code += "'"
-            fixes.append("修复了不匹配的单引号")
-        # 修复冒号
-        lines = code.split('\n')
-        for i, line in enumerate(lines):
-            if any(keyword in line for keyword in ['if ', 'for ', 'def ', 'class ', 'while ']) and not line.rstrip().endswith(':'):
-                lines[i] = line.rstrip() + ':'
-                fixes.append("在条件/函数声明后添加了冒号")
-        return '\n'.join(lines), fixes
-    def fix_javascript(self, code):
-        """修复JavaScript代码"""
         fixes = []
-        # 修复括号
-        if code.count('(') > code.count(')'):
-            code += ')' * (code.count('(') - code.count(')'))
-            fixes.append("修复了不匹配的括号")
-        # 修复花括号
-        if code.count('{') > code.count('}'):
-            code += '}' * (code.count('{') - code.count('}'))
-            fixes.append("修复了不匹配的花括号")
-        return code, fixes
-    def fix_css(self, code):
-        """修复CSS代码"""
         fixes = []
         # 修复选择器
-        if ':' in code and ';' not in code:
-            code += ';'
-            fixes.append("添加了缺失的分号")
-        return code, fixes
-    def fix_java(self, code):
-        """修复Java代码"""
         fixes = []
         # 添加基本的类结构
-        if 'public class' in code and '{' not in code:
-            code = code.replace('public class', 'public class Main {') + '\n    public static void main(String[] args) {\n        \n    }\n}'
-            fixes.append("添加了基本的类结构")
-        return code, fixes
-    def fix_cpp(self, code):
-        """修复C++代码"""
         fixes = []
-        if '#include' in code and 'int main' not in code:
-            code += '\n\nint main() {\n    return 0;\n}'
             fixes.append("添加了main函数")
-        return code, fixes
-    def fix_generic(self, code):
-        """通用修复"""
-        fixes = ["进行了通用语法检查"]
         return code, fixes
     def retrain_from_feedback(self):
-        """根据用户反馈重新训练模型（简化版）"""
-        print("正在从用户反馈中学习...")
-        # 这里可以添加增量学习的逻辑
-        # 目前先记录反馈，后续可以真正重新训练模型
 # 创建修复器实例
-fixer = SmartCodeFixer()
 def process_code(input_code, use_ai=True):
     """处理代码修复"""
-    language = fixer.detect_language(input_code)
-    if use_ai and fixer.model is not None:
-        fixed_code = fixer.ai_fix_code(input_code, language)
-        fixes = ["使用AI模型修复"]
-    else:
-        fixed_code, fixes = fixer.rule_based_fix(input_code, language)
-    # 生成修复报告
-    report = f"""🔧 修复报告
-📝 检测语言: {language}
-✅ 修复内容: {', '.join(fixes) if fixes else '代码看起来没问题'}
-修复后的代码:"""
-    return fixed_code, report
 def handle_feedback(original_code, fixed_code, user_feedback, is_correct):
     """处理用户反馈"""
     fixer.save_feedback(original_code, fixed_code, user_feedback, is_correct)
-    return "感谢您的反馈！系统正在学习改进... 💡"
 # 创建Gradio界面
-with gr.Blocks(theme=gr.themes.Soft()) as demo:
-    gr.Markdown("# 🚀 Capricode 智能代码修复助手")
-    gr.Markdown("支持 HTML, Python, JavaScript, Java, C++, CSS 等多种语言！")
-    with gr.Tab("代码修复"):
         with gr.Row():
-            with gr.Column():
                 input_code = gr.Textbox(
-                    label="📥 输入需要修复的代码",
-                    placeholder="粘贴你的代码到这里...",
-                    lines=10
                 )
-                use_ai = gr.Checkbox(label="使用AI智能修复", value=True)
-                fix_btn = gr.Button("🔧 修复代码", variant="primary")
-            with gr.Column():
                 output_code = gr.Textbox(
-                    label="📤 修复后的代码",
-                    lines=10,
                     show_copy_button=True
                 )
                 report = gr.Textbox(
-                    label="📊 修复报告",
-                    lines=3
                 )
-    with gr.Tab("反馈学习"):
-        gr.Markdown("## 💡 帮助系统变得更好")
         with gr.Row():
             with gr.Column():
-                feedback_original = gr.Textbox(label="原始代码", lines=3)
-                feedback_fixed = gr.Textbox(label="修复后的代码", lines=3)
-                user_feedback = gr.Textbox(
-                    label="您的反馈建议",
-                    placeholder="这里可以如何改进？",
-                    lines=3
-                )
-                is_correct = gr.Radio(
-                    choices=[("正确修复", True), ("需要改进", False)],
-                    label="修复是否正确？"
                 )
-                feedback_btn = gr.Button("提交反馈", variant="secondary")
-                feedback_result = gr.Textbox(label="反馈结果", interactive=False)
     # 事件处理
     fix_btn.click(
@@ -328,16 +729,25 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
         outputs=[feedback_result]
     )
-    # 示例
-    gr.Markdown("## 🎯 试试这些例子:")
     gr.Examples(
-        examples=[
-            ["<div>Hello World", True],  # HTML
-            ["print('Hello World'", True],  # Python
-            ["function test() {", True],  # JavaScript
-            ["public class MyClass", True],  # Java
-        ],
-        inputs=[input_code, use_ai]
     )
 if __name__ == "__main__":

 import gradio as gr
 import json
 import os
+import re
 from datetime import datetime
 from transformers import pipeline, AutoTokenizer, AutoModelForCausalLM
+class AdvancedCodeFixer:
     def __init__(self):
         self.feedback_file = "user_feedback.json"
         self.model = None
     def load_model(self):
         """加载预训练模型"""
         try:
+            # 使用轻量级但效果不错的模型
+            model_name = "microsoft/DialoGPT-medium"
             self.tokenizer = AutoTokenizer.from_pretrained(model_name)
             self.model = AutoModelForCausalLM.from_pretrained(model_name)
+            print("🤖 AI模型加载成功!")
         except Exception as e:
+            print(f"❌ 模型加载失败: {e}")
             self.model = None
     def load_feedback_data(self):
         """加载用户反馈数据用于学习"""
         if os.path.exists(self.feedback_file):
+            try:
+                with open(self.feedback_file, 'r', encoding='utf-8') as f:
+                    self.feedback_data = json.load(f)
+                print(f"📚 已加载 {len(self.feedback_data)} 条反馈数据")
+            except:
+                self.feedback_data = []
         else:
             self.feedback_data = []
         with open(self.feedback_file, 'w', encoding='utf-8') as f:
             json.dump(self.feedback_data, f, ensure_ascii=False, indent=2)
+        # 每5个反馈重新学习一次
+        if len(self.feedback_data) % 5 == 0:
             self.retrain_from_feedback()
     def detect_language(self, code):
         """智能检测编程语言"""
+        code_lower = code.lower().strip()
         language_indicators = {
+            'html': ['<!doctype', '<html', '<div', '<span', '<body', '<head', '<title', 'class="', 'id="'],
+            'python': ['def ', 'import ', 'print(', 'if __name__', 'lambda ', 'range(', 'len('],
+            'javascript': ['function ', 'console.log', 'document.', 'addEventListener', 'const ', 'let ', '=>'],
+            'java': ['public class', 'public static', 'system.out.println', 'void main'],
+            'cpp': ['#include', 'using namespace', 'cout <<', 'std::', 'int main()'],
+            'css': ['{', '}', ':', ';', 'font-size', 'color:', 'background:'],
+            'php': ['<?php', '$_get', '$_post', 'echo '],
+            'sql': ['select ', 'from ', 'where ', 'insert into', 'update '],
+            'ruby': ['def ', 'end', 'puts ', 'class '],
+            'go': ['package ', 'import "', 'func main()', 'fmt.println']
         }
         scores = {lang: 0 for lang in language_indicators}
                 if indicator in code_lower:
                     scores[lang] += 1
+        # 如果分数相同，优先选择更具体的语言
+        detected_lang = max(scores.items(), key=lambda x: x[1])[0]
+        # 如果所有分数都为0，根据内容特征猜测
+        if scores[detected_lang] == 0:
+            if '<' in code and '>' in code:
+                return 'html'
+            elif 'def ' in code or 'import ' in code:
+                return 'python'
+            elif 'function ' in code or 'console.log' in code:
+                return 'javascript'
+            elif 'public class' in code:
+                return 'java'
+            else:
+                return 'text'
+        return detected_lang
     def ai_fix_code(self, code, language):
         """使用AI模型修复代码"""
         if self.model is None:
+            return self.advanced_rule_based_fix(code, language)
         try:
+            # 构建更详细的修复提示
+            prompt = f"""请修复以下{language}代码中的语法错误和常见问题：
+有问题的代码:
 ```{language}
 {code}
 """
             inputs = self.tokenizer.encode(prompt, return_tensors="pt")
             outputs = self.model.generate(
                 inputs,
+                max_length=min(len(inputs[0]) + 200, 1024),
                 num_return_sequences=1,
+                temperature=0.3,
+                do_sample=True,
+                pad_token_id=self.tokenizer.eos_token_id
             )
             response = self.tokenizer.decode(outputs[0], skip_special_tokens=True)
             # 提取修复后的代码
             if "```" in response:
+                parts = response.split("```")
+                if len(parts) >= 3:
+                    fixed_code = parts[2].strip()
+                else:
+                    fixed_code = parts[-1].strip()
             else:
                 fixed_code = response.replace(prompt, "").strip()
+            return fixed_code, ["使用AI智能修复"]
         except Exception as e:
+            print(f"🤖 AI修复失败: {e}")
+            return self.advanced_rule_based_fix(code, language)
def advanced_rule_based_fix(self, code, language):
    """Repair ``code`` with rule-based heuristics.

    The language-agnostic pass (``self.apply_general_fixes``) runs first,
    then the language-specific pass ``self.fix_<language>_advanced``.
    Languages outside the supported set, and non-string ``language``
    values, fall back to ``self.fix_generic_advanced``.

    Args:
        code: Source text to repair.
        language: Language name; matched case-insensitively and ignoring
            surrounding whitespace (``"Python"`` and ``" python "`` both
            select the Python rules).

    Returns:
        ``(fixed_code, fixes)`` where ``fixes`` lists the general messages
        followed by the language-specific ones.
    """
    supported = (
        'html', 'python', 'javascript', 'java', 'cpp',
        'css', 'php', 'sql', 'ruby', 'go',
    )

    fixed_code, general_fixes = self.apply_general_fixes(code)
    fixes = list(general_fixes)

    # Normalise the key so callers need not match the exact spelling.
    key = language.strip().lower() if isinstance(language, str) else ''
    if key in supported:
        fix_function = getattr(self, f"fix_{key}_advanced")
    else:
        fix_function = self.fix_generic_advanced

    fixed_code, language_fixes = fix_function(fixed_code)
    fixes.extend(language_fixes)
    return fixed_code, fixes
def apply_general_fixes(self, code):
    """Close unterminated strings and brackets at the end of ``code``.

    The text is scanned once. Brackets inside single- or double-quoted
    strings are ignored, so an apostrophe inside ``"it's"`` or a ``(``
    inside a string is not counted. Backslash escapes are honoured, and a
    string is assumed to end at an unescaped newline.

    Missing closers are appended in nesting order (innermost first), after
    the closing quote of a string left open on the last line.

    Args:
        code: Source text in any language.

    Returns:
        ``(fixed_code, fixes)``; ``fixes`` is empty when nothing was added.
    """
    closer_for = {'(': ')', '[': ']', '{': '}'}
    open_stack = []       # openers still waiting for their closer
    active_quote = None   # quote character of the string being scanned
    escaped = False

    for ch in code:
        if active_quote is not None:
            if escaped:
                escaped = False
            elif ch == '\\':
                escaped = True
            elif ch == active_quote or ch == '\n':
                active_quote = None
        elif ch in ('"', "'"):
            active_quote = ch
        elif ch in closer_for:
            open_stack.append(ch)
        elif open_stack and ch == closer_for[open_stack[-1]]:
            open_stack.pop()
        # A closer that does not match the innermost opener is left alone:
        # there is no safe automatic repair for it.

    fixes = []
    for opener, label in (('(', '右括号'), ('[', '右方括号'), ('{', '右花括号')):
        missing = open_stack.count(opener)
        if missing:
            fixes.append(f"添加了 {missing} 个缺失的{label}")
    if active_quote == "'":
        fixes.append("修复了不匹配的单引号")
    elif active_quote == '"':
        fixes.append("修复了不匹配的双引号")

    # The string must be closed before the brackets that enclose it.
    suffix = (active_quote or '') + ''.join(
        closer_for[opener] for opener in reversed(open_stack)
    )
    return code + suffix, fixes
def fix_html_advanced(self, code):
    """Apply heuristic HTML repairs to ``code``.

    Steps, in order:

    1. Quote unquoted attribute values. Only text inside an opening tag is
       touched, and already-quoted values are skipped whole, so an ``=``
       inside a quoted value (``content="width=device-width"``) is safe.
    2. For a fixed set of container tags, append one closing tag at the end
       of the document for every opener without a closer. Openers with
       attributes are counted too. Placement is deliberately simple.
    3. Wrap text that does not start with ``<`` and has no doctype or
       ``<html`` tag in a minimal HTML document.
    4. Rewrite void elements (``img``, ``br``, ``hr``, ``input``, ``meta``,
       ``link``) in self-closing form unless they already end with ``/``.

    Args:
        code: HTML text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []

    attr_re = re.compile(r'([\w:-]+)\s*=\s*("[^"]*"|\'[^\']*\'|[^\s"\'<>]+)')
    tag_re = re.compile(r'<([A-Za-z][\w:-]*)(\s[^<>]*)?>')

    def quote_value(match):
        value = match.group(2)
        if value[0] in '"\'':
            return match.group(0)
        return f'{match.group(1)}="{value}"'

    def quote_tag(match):
        attrs = match.group(2)
        if not attrs:
            return match.group(0)
        return f'<{match.group(1)}{attr_re.sub(quote_value, attrs)}>'

    fixed_code = tag_re.sub(quote_tag, code)
    if fixed_code != code:
        fixes.append("修复了HTML属性引号")

    container_tags = (
        'div', 'p', 'span', 'h1', 'h2', 'h3',
        'ul', 'ol', 'li', 'table', 'tr', 'td',
    )
    for name in container_tags:
        opened = len(re.findall(rf'<{name}(?:\s[^<>]*)?>', fixed_code, re.IGNORECASE))
        closed = len(re.findall(rf'</{name}\s*>', fixed_code, re.IGNORECASE))
        for _ in range(opened - closed):
            fixed_code += f"\n</{name}>"
            fixes.append(f"添加了缺失的 </{name}>")

    lowered = fixed_code.lower()
    if '<!doctype html' not in lowered and '<html' not in lowered:
        if not fixed_code.strip().startswith('<'):
            fixed_code = f"""<!DOCTYPE html>
<html lang="zh-CN">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>Document</title>
</head>
<body>
    {fixed_code}
</body>
</html>"""
            fixes.append("添加了完整的HTML文档结构")

    void_tags = ('img', 'br', 'hr', 'input', 'meta', 'link')
    void_re = re.compile(r'<(img|br|hr|input|meta|link)\b([^<>]*)>', re.IGNORECASE)
    touched = set()

    def close_void(match):
        attrs = match.group(2).rstrip()
        if attrs.endswith('/'):
            return match.group(0)
        touched.add(match.group(1).lower())
        return f'<{match.group(1)}{attrs} />'

    fixed_code = void_re.sub(close_void, fixed_code)
    for tag in void_tags:
        if tag in touched:
            fixes.append(f"修复了 {tag} 标签的自闭合语法")

    return fixed_code, fixes
def fix_python_advanced(self, code):
    """Apply heuristic Python repairs to ``code``.

    * Block headers (``def``, ``class``, ``if``, ``for``, ``while``,
      ``elif``, ``else``) with no colon outside brackets and strings get one
      appended, placed before any trailing comment. Annotation colons such
      as ``def f(x: int)`` do not count as the block colon. Headers with
      unbalanced brackets or a trailing ``\\`` or ``,`` are treated as
      continued on the next line and left alone.
    * When a header ends with its colon and the next non-blank line is not
      indented deeper than the header, that one line is re-indented to the
      header's indent plus four spaces.
    * Python 2 style ``print x`` statements are rewritten line by line to
      ``print(x)``.

    Args:
        code: Python source text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []
    header_re = re.compile(r'(?:def|class|if|for|while|elif)\s|else\s*(?::|#|$)')
    print_re = re.compile(r'^(\s*)print\s+(?![(>=])(\S.*?)\s*$')

    def scan(text):
        """Split ``text`` into code and comment, and inspect the code part.

        Returns ``(code_part, comment_part, has_top_level_colon, depth)``.
        """
        depth = 0
        quote = None
        escaped = False
        top_colon = False
        cut = len(text)
        for pos, ch in enumerate(text):
            if quote is not None:
                if escaped:
                    escaped = False
                elif ch == '\\':
                    escaped = True
                elif ch == quote:
                    quote = None
            elif ch in '"\'':
                quote = ch
            elif ch == '#':
                cut = pos
                break
            elif ch in '([{':
                depth += 1
            elif ch in ')]}':
                depth = max(depth - 1, 0)
            elif ch == ':' and depth == 0:
                top_colon = True
        return text[:cut], text[cut:], top_colon, depth

    lines = code.split('\n')
    for i, line in enumerate(lines):
        if not header_re.match(line.strip()):
            continue

        body, comment, has_colon, depth = scan(line)
        core = body.rstrip()
        if not has_colon and depth == 0 and not core.endswith(('\\', ',')):
            # Keep whatever spacing separated the code from its comment.
            lines[i] = core + ':' + body[len(core):] + comment
            core += ':'
            fixes.append("在语句末尾添加了冒号")

        # Only a header that ends with its colon expects an indented body.
        if core.endswith(':') and i + 1 < len(lines):
            following = lines[i + 1]
            if following.strip():
                header_indent = len(line) - len(line.lstrip())
                next_indent = len(following) - len(following.lstrip())
                if next_indent <= header_indent:
                    lines[i + 1] = ' ' * (header_indent + 4) + following.lstrip()
                    fixes.append("修复了缩进")

    print_fixed = False
    for i, line in enumerate(lines):
        match = print_re.match(line)
        if match:
            lines[i] = f"{match.group(1)}print({match.group(2)})"
            print_fixed = True
    if print_fixed:
        fixes.append("修复了print语句语法")

    return '\n'.join(lines), fixes
def fix_javascript_advanced(self, code):
    """Apply heuristic JavaScript repairs to ``code``.

    * A missing ``;`` is appended to lines that look like complete simple
      statements (assignment, ``const``/``let``/``var``, ``console.*``,
      ``return``/``throw``, or a line containing ``function``). Comments,
      control-flow and declaration headers (``if``, ``for``, ``function``,
      ``class`` ...) and lines that continue onto the next one (trailing
      operator, comma, opening bracket, or unbalanced brackets) are never
      touched; ``if (a == b);`` would change the program's meaning.
    * Arrow functions with several unparenthesised parameters directly
      after ``=`` or ``return`` (``= a, b => ...``) get the parentheses.
      Single-parameter arrows are valid and left alone.

    Args:
        code: JavaScript source text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []
    header_re = re.compile(
        r'(?:if|for|while|switch|catch|else|do|try|finally|function|class)\b'
    )
    statement_starts = ('const ', 'let ', 'var ', 'console.', 'return ', 'throw ')
    open_endings = (';', '{', '}', '*/', ',', '(', '[', ':', '=', '&&', '||', '?', '.', '=>')

    lines = code.split('\n')
    for i, line in enumerate(lines):
        stripped = line.strip()
        if not stripped or stripped.startswith(('//', '/*', '*')):
            continue
        if header_re.match(stripped) or stripped.endswith(open_endings):
            continue
        # A trailing arithmetic operator means the expression continues,
        # unless it is a postfix ++ / --.
        if stripped.endswith(('+', '-', '*', '/')) and not stripped.endswith(('++', '--')):
            continue
        if stripped.count('(') > stripped.count(')') or stripped.count('[') > stripped.count(']'):
            continue
        if ('=' in stripped
                or stripped.startswith(statement_starts)
                or 'function' in stripped):
            lines[i] = line.rstrip() + ';'
            fixes.append("添加了语句结束分号")
    fixed_code = '\n'.join(lines)

    arrow_re = re.compile(
        r'((?<![=!<>])=(?![=>])\s*|\breturn\s+)'
        r'([\w$]+(?:\s*,\s*[\w$]+)+)\s*=>'
    )
    fixed_code, replaced = arrow_re.subn(r'\1(\2) =>', fixed_code)
    if replaced:
        fixes.append("修复了箭头函数参数括号")

    return fixed_code, fixes
def fix_css_advanced(self, code):
    """Append missing semicolons to CSS declarations.

    A line is treated as a declaration when it contains ``:`` and is either
    inside a ``{ ... }`` rule (tracked line by line via trailing ``{`` and
    ``}``) or the input has no braces at all (a bare declaration list such
    as ``color: red``). Comment lines and lines ending in ``;`` or ``,``
    are skipped.

    Args:
        code: CSS text.

    Returns:
        ``(fixed_code, fixes)`` with one message per semicolon added.
    """
    fixes = []
    lines = code.split('\n')
    # With no braces anywhere, every "prop: value" line is a declaration.
    bare_declarations = '{' not in code and '}' not in code
    in_rule = False

    for i, line in enumerate(lines):
        stripped = line.strip()
        if stripped.endswith('{'):
            in_rule = True
            continue
        if stripped.endswith('}'):
            in_rule = False
            continue
        if not (in_rule or bare_declarations):
            continue
        if stripped.startswith(('/*', '*', '//')) or stripped.endswith((';', ',', '*/')):
            continue
        if ':' in stripped:
            lines[i] = line.rstrip() + ';'
            fixes.append("添加了CSS属性分号")

    return '\n'.join(lines), fixes
def fix_java_advanced(self, code):
    """Apply heuristic Java repairs to ``code``.

    * A missing ``;`` is appended to simple statements: assignments, field
      declarations starting with an access modifier, ``return`` and
      ``System.out`` calls. Comments, annotations, control-flow headers,
      type declarations, method headers (modifier line with ``(`` and no
      ``=``) and lines that continue onto the next one are left alone.
    * A ``public class Name`` declaration in code with no ``{`` at all is
      completed with an opening brace, an empty ``main`` method and the
      closing brace. The declared class name is kept.

    Args:
        code: Java source text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []
    control_re = re.compile(r'(?:if|for|while|switch|catch|else|do|try|finally)\b')
    type_decl_re = re.compile(
        r'(?:(?:public|private|protected|abstract|final|static)\s+)*'
        r'(?:class|interface|enum)\b'
    )
    modifiers = ('public ', 'private ', 'protected ')

    lines = code.split('\n')
    for i, line in enumerate(lines):
        stripped = line.strip()
        if not stripped or stripped.startswith(('//', '/*', '*', '@')):
            continue
        if stripped.endswith((';', '{', '}', '*/', ',', '(')):
            continue
        if control_re.match(stripped) or type_decl_re.match(stripped):
            continue
        has_modifier = stripped.startswith(modifiers)
        if has_modifier and '(' in stripped and '=' not in stripped:
            # Method header whose body (or ';' for abstract) is ambiguous.
            continue
        if ('=' in stripped
                or has_modifier
                or stripped.startswith('return ')
                or 'System.out' in stripped):
            lines[i] = line.rstrip() + ';'
            fixes.append("添加了Java语句分号")
    fixed_code = '\n'.join(lines)

    if 'public class' in fixed_code and '{' not in fixed_code:
        named = re.search(r'public\s+class\s+[A-Za-z_$][\w$]*', fixed_code)
        if named:
            fixed_code = fixed_code[:named.end()] + ' {' + fixed_code[named.end():]
        else:
            # No class name was given; fall back to a default one.
            fixed_code = fixed_code.replace('public class', 'public class Main {', 1)
        fixed_code += '\n    public static void main(String[] args) {\n        // 程序入口\n    }\n}'
        fixes.append("添加了完整的Java类结构")

    return fixed_code, fixes
def fix_cpp_advanced(self, code):
    """Apply heuristic C++ repairs to ``code``.

    * A missing ``;`` is appended to simple statements: assignments,
      ``return`` and ``cout`` output. Preprocessor lines, comments,
      control-flow headers and lines that continue onto the next one are
      left alone.
    * When the code has an ``#include`` but no ``int main``, an empty
      ``main`` function is appended.

    Args:
        code: C++ source text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []
    control_re = re.compile(r'(?:if|for|while|switch|catch|else|do|try)\b')

    lines = code.split('\n')
    for i, line in enumerate(lines):
        stripped = line.strip()
        if not stripped or stripped.startswith(('//', '/*', '*', '#')):
            continue
        if stripped.endswith((';', '{', '}', '*/', ',', '(')):
            continue
        if control_re.match(stripped):
            continue
        if ('=' in stripped
                or stripped.startswith(('return ', 'cout '))
                or 'cout <<' in stripped):
            lines[i] = line.rstrip() + ';'
            fixes.append("添加了C++语句分号")
    fixed_code = '\n'.join(lines)

    if '#include' in fixed_code and 'int main' not in fixed_code:
        fixed_code += '\n\nint main() {\n    return 0;\n}'
        fixes.append("添加了main函数")

    return fixed_code, fixes
def fix_php_advanced(self, code):
    """Apply heuristic PHP repairs to ``code``.

    * ``<?php`` is prepended when the code has no PHP opening tag.
    * A missing ``;`` is appended to simple statements: assignments,
      ``echo``, ``return`` and lines starting with a ``$`` variable.
      Comments, lines starting with ``<`` (PHP tags and embedded HTML),
      ``?>``, control-flow and declaration headers, and lines that continue
      onto the next one are left alone.

    Args:
        code: PHP source text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []
    fixed_code = code

    if '<?php' not in fixed_code and not fixed_code.strip().startswith('<?'):
        fixed_code = '<?php\n' + fixed_code
        fixes.append("添加了PHP开始标签")

    control_re = re.compile(
        r'(?:if|for|foreach|while|switch|catch|else|elseif|do|try|finally|function|class)\b'
    )
    lines = fixed_code.split('\n')
    for i, line in enumerate(lines):
        stripped = line.strip()
        if not stripped or stripped.startswith(('//', '/*', '*', '#', '<', '?>')):
            continue
        if stripped.endswith((';', '{', '}', '*/', ',', '(')):
            continue
        if control_re.match(stripped):
            continue
        if ('=' in stripped
                or stripped.startswith(('echo ', 'return ', '$'))):
            lines[i] = line.rstrip() + ';'
            fixes.append("添加了PHP语句分号")

    return '\n'.join(lines), fixes
def fix_sql_advanced(self, code):
    """Upper-case the core SQL keywords in ``code``.

    Only the whole words SELECT, FROM, WHERE, INSERT, UPDATE and DELETE are
    changed, and only outside single- or double-quoted literals.
    Identifiers and string values keep their case, since upper-casing
    ``'john'`` would change what the query matches.

    Args:
        code: SQL text.

    Returns:
        ``(fixed_code, fixes)`` with one message per keyword whose case
        changed, in the order listed above.
    """
    keywords = ('SELECT', 'FROM', 'WHERE', 'INSERT', 'UPDATE', 'DELETE')
    keyword_re = re.compile(r'\b(?:' + '|'.join(keywords) + r')\b', re.IGNORECASE)
    changed = set()

    def upper_keyword(match):
        word = match.group(0)
        upper = word.upper()
        if word != upper:
            changed.add(upper)
        return upper

    # The capturing group makes re.split keep the quoted literals at the
    # odd indexes; only the even (unquoted) segments are rewritten.
    segments = re.split(r"('(?:[^']|'')*'|\"(?:[^\"]|\"\")*\")", code)
    for idx, segment in enumerate(segments):
        if idx % 2 == 0:
            segments[idx] = keyword_re.sub(upper_keyword, segment)

    fixes = [f"修复了{keyword}关键字格式" for keyword in keywords if keyword in changed]
    return ''.join(segments), fixes
def fix_ruby_advanced(self, code):
    """Append the ``end`` keywords missing from Ruby ``code``.

    Each line is inspected with string literals and ``#`` comments removed.
    A line starting with ``def``, ``class``, ``module``, ``if``,
    ``unless``, ``while``, ``until``, ``case``, ``begin`` or ``for``, or
    containing the ``do`` keyword, opens a construct. Every whole-word
    ``end`` closes the innermost open one. Whole-word matching keeps
    ``send``, ``done`` and ``obj.end`` from being miscounted.

    One ``end`` is appended for every construct still open at the end of
    the text, innermost first.

    Args:
        code: Ruby source text.

    Returns:
        ``(fixed_code, fixes)`` with one message per ``end`` added.
    """
    string_re = re.compile(r'"(?:\\.|[^"\\])*"|\'(?:\\.|[^\'\\])*\'')
    opener_re = re.compile(r'(def|class|module|if|unless|while|until|case|begin|for)\b')
    endless_def_re = re.compile(r'def\s+[\w.?!]+\s*(?:\([^)]*\))?\s*=(?!=)')
    do_re = re.compile(r'(?<![.:\w])do\b')
    end_re = re.compile(r'(?<![.:\w])end\b(?!\s*:)')

    open_constructs = []  # 'def' or 'block', outermost first
    for raw_line in code.split('\n'):
        line = string_re.sub('""', raw_line).split('#', 1)[0].strip()
        if not line:
            continue
        opener = opener_re.match(line)
        if opener:
            # "def name = expr" is an endless method and needs no "end".
            if not (opener.group(1) == 'def' and endless_def_re.match(line)):
                open_constructs.append('def' if opener.group(1) == 'def' else 'block')
        elif do_re.search(line):
            open_constructs.append('block')
        for _ in end_re.findall(line):
            if open_constructs:
                open_constructs.pop()

    fixes = []
    fixed_code = code
    for kind in reversed(open_constructs):
        fixed_code += '\nend'
        if kind == 'def':
            fixes.append("添加了方法结束的end")
        else:
            fixes.append("添加了块结束的end")

    return fixed_code, fixes
def fix_go_advanced(self, code):
    """Add the boilerplate a Go snippet needs to form a complete program.

    * ``package main`` is prepended when no package clause is present.
    * ``import "fmt"`` is inserted after the package clause when the code
      uses ``fmt.`` and ``"fmt"`` appears nowhere in it. The builtin
      ``println`` does not trigger this: an unused import is a compile
      error in Go.
    * For ``package main`` without a ``main`` function: if the code has no
      function declarations at all, everything after the package/import
      preamble is wrapped in ``func main() { ... }``; otherwise an empty
      ``main`` is appended.

    Args:
        code: Go source text.

    Returns:
        ``(fixed_code, fixes)``.
    """
    fixes = []
    fixed_code = code
    empty_main = '\n\nfunc main() {\n    // 程序入口\n}'
    package_re = re.compile(r'^[ \t]*package[ \t]+\w+', re.MULTILINE)

    if not package_re.search(fixed_code):
        fixed_code = 'package main\n\n' + fixed_code
        fixes.append("添加了package声明")

    if re.search(r'\bfmt\.', fixed_code) and '"fmt"' not in fixed_code:
        fixed_code = package_re.sub(
            lambda m: m.group(0) + '\n\nimport "fmt"', fixed_code, count=1
        )
        fixes.append("添加了fmt包导入")

    is_main_package = re.search(r'^[ \t]*package[ \t]+main\b', fixed_code, re.MULTILINE)
    has_main = re.search(r'\bfunc[ \t]+main[ \t]*\(', fixed_code)
    if is_main_package and not has_main:
        if re.search(r'^[ \t]*func\b', fixed_code, re.MULTILINE):
            fixed_code += empty_main
        else:
            # Find where the package/import preamble ends.
            lines = fixed_code.split('\n')
            body_start = len(lines)
            in_import_block = False
            for idx, line in enumerate(lines):
                stripped = line.strip()
                if in_import_block:
                    if stripped.startswith(')'):
                        in_import_block = False
                elif stripped.startswith('import') and stripped.endswith('('):
                    in_import_block = True
                elif stripped and not stripped.startswith(('package ', 'import ', '//')):
                    body_start = idx
                    break

            statements = lines[body_start:]
            while statements and not statements[-1].strip():
                statements.pop()

            if statements:
                preamble = '\n'.join(lines[:body_start]).rstrip()
                indented = '\n'.join(
                    '    ' + stmt if stmt.strip() else stmt for stmt in statements
                )
                fixed_code = f"{preamble}\n\nfunc main() {{\n{indented}\n}}"
            else:
                fixed_code += empty_main
        fixes.append("添加了main函数")

    return fixed_code, fixes
def fix_generic_advanced(self, code):
    """Fallback pass for languages without dedicated rules.

    The code is returned unchanged together with a single report entry.

    Returns:
        ``(code, fixes)``.
    """
    report = ["进行了通用语法检查和修复"]
    return code, report
     def retrain_from_feedback(self):
+        """根据用户反馈重新训练模型"""
+        print(f"🧠 正在从 {len(self.feedback_data)} 条反馈中学习...")
+        # 这里可以添加真正的增量学习逻辑
+        # 目前先记录，后续可以集成真正的模型微调
 # 创建修复器实例
+fixer = AdvancedCodeFixer()
 def process_code(input_code, use_ai=True):
     """处理代码修复"""
+    if not input_code.strip():
+        return "请输入代码", "❌ 输入为空"
+    language = fixer.detect_language(input_code)
+    try:
+        if use_ai and fixer.model is not None:
+            fixed_code, fixes = fixer.ai_fix_code(input_code, language)
+        else:
+            fixed_code, fixes = fixer.advanced_rule_based_fix(input_code, language)
+        # 生成详细的修复报告
+        report = f"""🔧 智能修复报告
+📝 检测语言: {language.upper()}
+✅ 修复内容: {', '.join(fixes) if fixes else '代码看起来基本正确'}
+🎯 修复类型: {'AI智能修复' if use_ai and fixer.model else '规则修复'}
+💡 提示: {'' if fixes else '如需进一步优化，请使用反馈功能'}"""
+        return fixed_code, report
+    except Exception as e:
+        return f"修复过程中出现错误: {str(e)}", f"❌ 错误报告: {str(e)}"
 def handle_feedback(original_code, fixed_code, user_feedback, is_correct):
     """处理用户反馈"""
+    if not original_code.strip():
+        return "❌ 请输入原始代码"
     fixer.save_feedback(original_code, fixed_code, user_feedback, is_correct)
+    if is_correct:
+        return "✅ 感谢您的正面反馈！系统会继续保持"
+    else:
+        return "🔄 感谢您的改进建议！系统正在学习优化..."
 # 创建Gradio界面
+with gr.Blocks(
+    theme=gr.themes.Soft(
+        primary_hue="blue",
+        secondary_hue="green"
+    ),
+    css="""
+    .gradio-container {
+        max-width: 1200px !important;
+    }
+    .feedback-box {
+        border: 2px solid #e0e0e0;
+        border-radius: 10px;
+        padding: 15px;
+        margin: 10px 0;
+    }
+    """
+) as demo:
+    gr.Markdown("""
+    # 🚀 Capricode 智能多语言代码修复助手
+    **支持 HTML, Python, JavaScript, Java, C++, CSS, PHP, SQL, Ruby, Go 等10+种编程语言！**
+    """)
+    with gr.Tab("🛠️ 代码修复"):
         with gr.Row():
+            with gr.Column(scale=1):
+                gr.Markdown("### 📥 输入代码")
                 input_code = gr.Textbox(
+                    label="",
+                    placeholder="粘贴你的代码到这里...支持多种编程语言自动识别！",
+                    lines=12,
+                    show_copy_button=True
                 )
+                with gr.Row():
+                    use_ai = gr.Checkbox(
+                        label="使用AI智能修复（推荐）",
+                        value=True,
+                        info="启用AI模型进行更智能的修复"
+                    )
+                    fix_btn = gr.Button(
+                        "🔧 开始修复",
+                        variant="primary",
+                        size="lg"
+                    )
+            with gr.Column(scale=1):
+                gr.Markdown("### 📤 修复结果")
                 output_code = gr.Textbox(
+                    label="修复后的代码",
+                    lines=12,
                     show_copy_button=True
                 )
                 report = gr.Textbox(
+                    label="📊 修复分析报告",
+                    lines=4,
+                    max_lines=6
                 )
+    with gr.Tab("💡 反馈学习"):
+        gr.Markdown("""
+        ## 🎯 帮助系统变得更好
+        您的反馈会让AI模型越来越聪明！
+        """)
         with gr.Row():
             with gr.Column():
+                with gr.Group():
+                    gr.Markdown("#### 原始输入")
+                    feedback_original = gr.Textbox(
+                        label="",
+                        placeholder="原始有问题的代码...",
+                        lines=4
+                    )
+                with gr.Group():
+                    gr.Markdown("#### 修复结果")
+                    feedback_fixed = gr.Textbox(
+                        label="",
+                        placeholder="系统修复后的代码...",
+                        lines=4
+                    )
+            with gr.Column():
+                with gr.Group():
+                    gr.Markdown("#### 您的评价")
+                    user_feedback = gr.Textbox(
+                        label="改进建议",
+                        placeholder="这里可以如何改进？有什么建议？",
+                        lines=3
+                    )
+                    is_correct = gr.Radio(
+                        choices=[
+                            ("✅ 修复正确", True),
+                            ("🔄 需要改进", False)
+                        ],
+                        label="修复效果评价",
+                        value=True
+                    )
+                    feedback_btn = gr.Button(
+                        "📮 提交反馈",
+                        variant="secondary"
+                    )
+                feedback_result = gr.Textbox(
+                    label="反馈结果",
+                    interactive=False,
+                    lines=2
                 )
+    with gr.Tab("📚 语言支持"):
+        gr.Markdown("""
+        ## 🌍 支持的编程语言
+        | 语言 | 支持特性 | 示例 |
+        |------|----------|------|
+        | **HTML** | 标签闭合、属性引号、文档结构 | `<div class=test>` → `<div class="test">` |
+        | **Python** | 括号匹配、缩进、冒号、引号 | `print('hello'` → `print('hello')` |
+        | **JavaScript** | 分号、括号、箭头函数 | `function test(` → `function test()` |
+        | **Java** | 分号、类结构、main方法 | `public class Test` → 完整类结构 |
+        | **C++** | 分号、头文件、main函数 | `cout << "hello"` → 添加分号 |
+        | **CSS** | 分号、选择器、属性 | `color: red` → `color: red;` |
+        | **PHP** | 开始标签、分号、语法 | `echo "hello"` → `echo "hello";` |
+        | **SQL** | 关键字格式、语法 | `select name` → `SELECT NAME` |
+        | **Ruby** | end关键字、块结构 | `def test` → 添加end |
+        | **Go** | package、import、main函数 | 自动添加基本结构 |
+        💡 **提示**: 系统会自动检测代码语言并应用相应的修复规则！
+        """)
     # 事件处理
     fix_btn.click(
         outputs=[feedback_result]
     )
+    # 更丰富的示例
+    gr.Markdown("## 🎯 试试这些例子（点击自动填充）:")
+    examples_data = [
+        ["<div class=test>\n    <p>Hello World\n    <img src=image.jpg alt=test>\n</div>", True],  # HTML
+        ["def greet(name\n    print(f'Hello, {name}!')\n    return 'Done'", True],  # Python
+        ["function calculate(a, b {\n    const result = a + b\n    console.log('结果:', result\n    return result", True],  # JavaScript
+        ["public class Calculator {\n    public int add(int a, int b) {\n        return a + b\n    }", True],  # Java
+        [".container {\n    width: 100%\n    height: 200px\n    background: blue\n}", True],  # CSS
+        ["<?php\n$name = 'John'\necho 'Hello, ' . $name", True],  # PHP
+        ["select name, age from users where age > 18", True],  # SQL
+        ["def greet(name)\n    puts 'Hello, ' + name", True],  # Ruby
+        ["fmt.Println('Hello, World!')", True],  # Go
+    ]
     gr.Examples(
+        examples=examples_data,
+        inputs=[input_code, use_ai],
+        label="点击示例代码自动测试"
     )
 if __name__ == "__main__":