Update app.py

app.py
CHANGED
@@ -28,40 +28,40 @@ genai.configure(api_key=gemini_api_key)

 def process_single_pdf(pdf_file):
     pdf_path = pdf_file.name if hasattr(pdf_file, 'name') else pdf_file
+    logger.info(f"Starting to process file: {pdf_path}")
     if not os.path.isfile(pdf_path):
+        logger.error(f"File {pdf_path} does not exist.")
         return None, None
     text_splitter = RecursiveCharacterTextSplitter(chunk_size=800, chunk_overlap=150)
     loader = PyPDFLoader(pdf_path)
     try:
         pages = loader.load_and_split()
         docs = text_splitter.split_documents(pages)
+        sections = {"Introduction": [], "Methodology": [], "Results": [], "Discussion": [], "References": []}
         for doc in docs:
             text = doc.page_content
+            if re.search(r"Introduction|مقدمه", text, re.I):
+                sections["Introduction"].append(doc)
+            elif re.search(r"Methodology|روش", text, re.I):
+                sections["Methodology"].append(doc)
+            elif re.search(r"Results|نتایج", text, re.I):
+                sections["Results"].append(doc)
+            elif re.search(r"Discussion|بحث", text, re.I):
+                sections["Discussion"].append(doc)
+            elif re.search(r"References|Bibliography|منابع", text, re.I):
+                sections["References"].append(doc)
+        logger.info(f"Processed file: {pdf_path} - Number of chunks: {len(docs)}")
         return docs, sections
     except Exception as e:
+        logger.error(f"Error processing {pdf_path}: {str(e)}")
         return None, None

 def upload_and_process_pdf(pdf_files):
     if not pdf_files:
+        return None, None, None, "Please upload at least one PDF file."
+    logger.info(f"Number of input files: {len(pdf_files)}")
     all_docs = []
+    all_sections = {"Introduction": [], "Methodology": [], "Results": [], "Discussion": [], "References": []}
     with concurrent.futures.ThreadPoolExecutor() as executor:
         future_to_file = {executor.submit(process_single_pdf, pdf_file): pdf_file for pdf_file in pdf_files}
         for future in concurrent.futures.as_completed(future_to_file):
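A note on this hunk: the routing regexes match anywhere in a chunk, so a chunk that merely mentions "Introduction" in passing lands in the first matching bucket. A minimal standalone sketch for testing the patterns (the sample text is hypothetical; the patterns are copied from the hunk):

import re

# First matching pattern wins, mirroring the if/elif chain in process_single_pdf.
SECTION_PATTERNS = {
    "Introduction": r"Introduction|مقدمه",
    "Methodology": r"Methodology|روش",
    "Results": r"Results|نتایج",
    "Discussion": r"Discussion|بحث",
    "References": r"References|Bibliography|منابع",
}

def classify_chunk(text):
    for name, pattern in SECTION_PATTERNS.items():
        if re.search(pattern, text, re.I):
            return name
    return None

print(classify_chunk("1. Introduction\nThis thesis examines ..."))  # Introduction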
@@ -72,47 +72,47 @@ def upload_and_process_pdf(pdf_files):
                 all_sections[key].extend(sections[key])
             else:
                 pdf_file = future_to_file[future]
+                return None, None, None, f"Error processing file: {pdf_file.name if hasattr(pdf_file, 'name') else pdf_file}"
+    logger.info(f"Total number of processed documents: {len(all_docs)}")
     return None, all_docs, all_sections, None

 def create_vector_db(docs):
     if not docs:
+        return None, "No content was processed."
     embeddings = GoogleGenerativeAIEmbeddings(model="models/embedding-001", google_api_key=gemini_api_key)
     try:
+        logger.info("Starting to build FAISS...")
         vector_store = FAISS.from_documents(docs, embedding=embeddings)
+        logger.info(f"Vector database built with {len(docs)} documents.")
         return vector_store, None
     except Exception as e:
+        logger.error(f"Error creating vector database: {str(e)}")
+        return None, f"Error in vector processing: {str(e)}"

 def extract_keywords(text):
     try:
+        prompt = f"Extract 5 main keywords from the following text that represent the main topic:\n**Text:**\n{text[:2000]}\n**Keywords:**"
         model = genai.GenerativeModel('gemini-pro')
         response = model.generate_content(prompt)
+        keywords = response.text.split("**Keywords:**")[-1].strip().split(", ")
+        logger.info(f"Extracted keywords: {keywords}")
         time.sleep(1)
         return keywords[:5]
     except Exception as e:
+        logger.error(f"Error extracting keywords: {str(e)}")
+        return ["research", "results", "method", "analysis", "topic"]

 def translate_to_english(text):
     try:
+        prompt = f"Translate the following text to English:\n**Text:**\n{text[:1000]}\n**Translation:**"
         model = genai.GenerativeModel('gemini-pro')
         response = model.generate_content(prompt)
+        translated_text = response.text.split("**Translation:**")[-1].strip()
+        logger.info(f"Translated text: {translated_text[:50]}...")
         time.sleep(1)
         return translated_text
     except Exception as e:
+        logger.error(f"Error in translation: {str(e)}")
         return text

 def check_plagiarism(text):
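The new extract_keywords parses the model reply by splitting on the **Keywords:** marker; that parsing can be exercised offline with a canned reply (the reply string below is hypothetical, no API call involved):

# A canned Gemini-style reply to test the parsing logic in extract_keywords.
fake_reply = "**Keywords:** neural networks, optimization, regression, datasets, evaluation"
keywords = fake_reply.split("**Keywords:**")[-1].strip().split(", ")
print(keywords[:5])  # ['neural networks', 'optimization', 'regression', 'datasets', 'evaluation']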
@@ -121,72 +121,72 @@ def check_plagiarism(text):
         translated_keywords = translate_to_english(" ".join(keywords))
         query = translated_keywords

+        # Search in Google Scholar
         url_scholar = f"https://scholar.google.com/scholar?q={query}"
         response_scholar = requests.get(url_scholar, headers={"User-Agent": "Mozilla/5.0"})
         soup_scholar = BeautifulSoup(response_scholar.text, 'html.parser')
         results_scholar = []
         for item in soup_scholar.find_all('h3', class_='gs_rt', limit=5):
             title = item.get_text().strip()
+            link = item.find('a')['href'] if item.find('a') else "No link available"
             author_info = item.find_next('div', class_='gs_a')
             if author_info:
                 author_year = author_info.get_text().strip()
                 author_match = re.search(r"(.+?)(?: - (\d{4}))?", author_year)
+                author = author_match.group(1) if author_match.group(1) else "Unknown Author"
+                year = author_match.group(2) if author_match.group(2) else "Unknown"
             else:
+                author, year = "Unknown Author", "Unknown"
             results_scholar.append((title, link, author, year))
+        logger.info(f"Google Scholar results: {results_scholar}")

+        # Search in arXiv
         url_arxiv = f"https://arxiv.org/search/?query={query}&searchtype=all&source=header"
         response_arxiv = requests.get(url_arxiv, headers={"User-Agent": "Mozilla/5.0"})
         soup_arxiv = BeautifulSoup(response_arxiv.text, 'html.parser')
         results_arxiv = []
         for item in soup_arxiv.find_all('p', class_='title', limit=5):
             title = item.get_text().strip()
+            link = item.find_previous('a', class_='arxiv-url')['href'] if item.find_previous('a', class_='arxiv-url') else "No link available"
             author_info = item.find_next('p', class_='authors')
             year_info = item.find_next('p', class_='is-size-7')
+            author = author_info.get_text().replace("Authors:", "").strip() if author_info else "Unknown Author"
+            year = re.search(r"\d{4}", year_info.get_text() if year_info else "").group(0) if re.search(r"\d{4}", year_info.get_text() if year_info else "") else "Unknown"
             results_arxiv.append((title, link, author, year))
+        logger.info(f"arXiv results: {results_arxiv}")

         all_results = results_scholar + results_arxiv
         if not all_results:
+            return "No significant similarity found.\n**Explanation:** Your text was compared with scientific resources in Google Scholar and arXiv, and no meaningful matches were found.\n**Status:** Plagiarism likelihood is very low."

         max_similarity = 0
         matched_texts = []
         for title, link, author, year in all_results:
             similarity = SequenceMatcher(None, text[:1000], title).ratio()
+            if similarity > 0.1:  # Minimum 10% similarity for display
+                matched_texts.append(f"**Title:** {title}\n**Author:** {author}\n**Year:** {year}\n**Link:** {link}\n**Note:** This resource may have some similarity with your text.")
                 if similarity > max_similarity:
                     max_similarity = similarity

         time.sleep(1)
         similarity_percent = max_similarity * 100
         if not matched_texts:
+            return "No significant similarity found.\n**Explanation:** Your text was compared with scientific resources and no matches were found.\n**Status:** Plagiarism likelihood is very low."

         if similarity_percent > 20:
+            status = "Plagiarism is likely. Please review similar resources and add appropriate citations."
         elif similarity_percent > 10:
+            status = "Low similarity. Possibly coincidental, but reviewing resources is recommended."
         else:
+            status = "Very low similarity. Plagiarism likelihood is negligible."

+        output = (f"**Similarity Percentage:** {similarity_percent:.2f}%\n"
+                  f"**Status:** {status}\n"
+                  f"**Similar Resources Found:**\n" + "\n--------------------\n".join(matched_texts[:3]))
         return output
     except Exception as e:
+        logger.error(f"Error in plagiarism check: {str(e)}")
+        return f"Error in plagiarism check: {str(e)}\nPlease try again or contact support."

 def suggest_resources(text):
     try:
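One caveat worth flagging on the thresholds in this hunk: the score compares the first 1000 characters of the document against a short result title, and SequenceMatcher ratios are bounded by the shorter string's share of the combined length, so even an exact title match stays far below the 20% tier. A standalone check (strings hypothetical):

from difflib import SequenceMatcher

# An exact title embedded in a ~1000-character prefix still scores only a few
# percent, because ratio() divides matched characters by the combined length.
text = "Deep Learning for Thesis Analysis. " * 30
title = "Deep Learning for Thesis Analysis"
print(SequenceMatcher(None, text[:1000], title).ratio())  # roughly 0.06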
@@ -196,20 +196,20 @@ def suggest_resources(text):
         url_scholar = f"https://scholar.google.com/scholar?q={query}"
         response_scholar = requests.get(url_scholar, headers={"User-Agent": "Mozilla/5.0"})
         soup_scholar = BeautifulSoup(response_scholar.text, 'html.parser')
+        papers_scholar = [f"{h.get_text().strip()} (Link: {h.find('a')['href']})" for h in soup_scholar.find_all('h3')[:3] if h.find('a')]

         url_arxiv = f"https://arxiv.org/search/?query={query}&searchtype=all&source=header"
         response_arxiv = requests.get(url_arxiv, headers={"User-Agent": "Mozilla/5.0"})
         soup_arxiv = BeautifulSoup(response_arxiv.text, 'html.parser')
+        papers_arxiv = [f"{paper.get_text().strip()} (Link: {paper.find_previous('a', class_='arxiv-url')['href']})"
                         for paper in soup_arxiv.find_all('p', class_='title')[:2] if paper.find_previous('a', class_='arxiv-url')]

         resources = papers_scholar + papers_arxiv if papers_scholar else papers_arxiv
         time.sleep(1)
+        return resources if resources else ["No resources found."]
     except Exception as e:
+        logger.error(f"Error in suggesting resources: {str(e)}")
+        return ["Error in resource search"]

 def evaluate_quality(docs, sections):
     text = " ".join([doc.page_content for doc in docs])
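The Scholar scraping in suggest_resources assumes each result is an h3 element wrapping a link; the comprehension can be verified against canned HTML without touching the live site (the markup below is hypothetical):

from bs4 import BeautifulSoup

# Canned HTML imitating one Scholar result, to test the list comprehension
# from this hunk offline.
html = '<h3 class="gs_rt"><a href="https://example.org/paper">A Sample Paper</a></h3>'
soup = BeautifulSoup(html, "html.parser")
papers = [f"{h.get_text().strip()} (Link: {h.find('a')['href']})"
          for h in soup.find_all('h3')[:3] if h.find('a')]
print(papers)  # ['A Sample Paper (Link: https://example.org/paper)']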
@@ -218,67 +218,67 @@ def evaluate_quality(docs, sections):
     suggestions = []
     auto_fix = ""

+    # Criterion 1: References (Quality and Quantity)
     ref_count = len(re.findall(r"\[\d+\]|[A-Za-z]+\s+\d{4}", text))
     if ref_count > 15:
         score += 30
+        explanation.append("Very strong and credible references (more than 15 citations from reputable journals).")
     elif ref_count > 10:
         score += 25
+        explanation.append("Sufficient and credible references (10-15 citations).")
     elif ref_count > 0:
         score += 15
+        explanation.append("Existing but limited references (fewer than 10 citations).")
+        suggestions.append("Add at least 5 sources from reputable journals (like IEEE, Springer, or Elsevier) with precise author and year citations.")
     else:
+        explanation.append("No sufficient references found.")
+        suggestions.append("Complete the references section with at least 10 citations from peer-reviewed articles.")
+        auto_fix += "\n**Auto-fix - Sample Citation:**\n[1] Smith, J. (2020). 'Advanced Research Methods', Journal of Science, 15(3), 123-145."

+    # Criterion 2: Coherence, Writing, and Scientific Weight
     words = text.split()
     word_freq = Counter(words).most_common(10)
+    keywords = [word[0] for word in word_freq[:3]] if word_freq else ["research", "results", "method"]
     scientific_terms = sum(1 for word in words if word.lower() in ["analysis", "data", "method", "result", "hypothesis", "theory"])
     if word_freq and word_freq[0][1] > len(words) * 0.02 and scientific_terms > len(words) * 0.05:
         score += 25
+        explanation.append("Excellent textual coherence and high scientific weight (focus on topic and use of scientific terms).")
     else:
+        explanation.append("Poor textual coherence or low scientific weight (topic dispersion or lack of scientific terms).")
+        suggestions.append(f"Use keywords like {', '.join(keywords)} and scientific terms (like 'statistical analysis' or 'hypothesis') more frequently and make sentences smoother.")
         try:
+            prompt = f"Rewrite the following paragraph to be more scientific, smoother, and with higher scientific weight:\n**Text:**\n{text[:500]}\n**Rewritten:**"
             model = genai.GenerativeModel('gemini-pro')
             response = model.generate_content(prompt)
+            auto_fix += f"\n**Auto-fix - Rewritten Paragraph:**\n{response.text.split('**Rewritten:**')[-1].strip()}"
             time.sleep(1)
         except Exception as e:
+            logger.error(f"Error in rewriting: {str(e)}")
+            auto_fix += "\n**Auto-fix - Rewritten:**\nError in rewriting, please manually revise the text."

+    # Criterion 3: Tables/Figures
+    if re.search(r"Table|Figure|جدول|شکل", text, re.I):
         score += 20
+        explanation.append("Effective use of tables or figures to support findings.")
     else:
+        explanation.append("No use of tables or figures.")
+        suggestions.append("Add a table for data and a figure (like a bar chart or line graph) for trends to make findings more comprehensible.")

+    # Criterion 4: Depth of Analysis and Scientific Weight
+    analysis_text = " ".join([doc.page_content for doc in sections.get("Results", []) + sections.get("Discussion", [])])
+    stats_found = bool(re.search(r"Statistic|Regression|ANOVA|T-test|Correlation|آمار", analysis_text, re.I))
     if len(analysis_text.split()) > 1500 and stats_found:
         score += 25
+        explanation.append("Very high depth of analysis (long and statistical with strong scientific weight).")
     elif len(analysis_text.split()) > 1000:
         score += 15
+        explanation.append("Acceptable depth of analysis (long but lacking sufficient statistical analysis).")
+        suggestions.append("Add advanced statistical analysis (like regression, ANOVA, or T-test) to strengthen findings.")
     else:
+        explanation.append("Poor depth of analysis (short and without statistical analysis).")
+        suggestions.append("Expand the Results/Discussion section to at least 1500 words with comprehensive statistical analysis.")

+    # Measure scientific weight by global comparison
     try:
         keywords = extract_keywords(text)
         translated_text = translate_to_english(" ".join(keywords))
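A quick check on Criterion 1: the citation regex counts both bracketed numbers and any word followed by a four-digit year, so ordinary prose like "around 2020" inflates ref_count. Sample run (the snippet is hypothetical):

import re

# The citation-counting pattern from this hunk; note the second alternative
# also matches non-citation phrases such as "around 2020".
sample = "As shown in [1] and [2], Smith 2019 reported gains; growth slowed around 2020."
print(len(re.findall(r"\[\d+\]|[A-Za-z]+\s+\d{4}", sample)))  # 4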
@@ -288,11 +288,11 @@ def evaluate_quality(docs, sections):
         soup_arxiv = BeautifulSoup(response_arxiv.text, 'html.parser')
         arxiv_titles = [paper.get_text().strip() for paper in soup_arxiv.find_all('p', class_='title')[:3]]
         if arxiv_titles:
+            suggestions.append(f"To increase scientific weight, refer to similar arXiv papers like '{arxiv_titles[0]}' and compare your findings with them.")
         time.sleep(1)
     except Exception as e:
+        logger.error(f"Error in scientific weight assessment: {str(e)}")
+        suggestions.append("Global comparison with scientific resources failed due to an error.")

     score = max(min(score, 100), 0)
     return score, "; ".join(explanation), "; ".join(suggestions), auto_fix
@@ -300,69 +300,69 @@ def evaluate_quality(docs, sections):
 llm_gemini = ChatGoogleGenerativeAI(model="gemini-pro", google_api_key=gemini_api_key, convert_system_message_to_human=True, temperature=0.5)

 academic_analysis_prompt = PromptTemplate(
+    template="""You are a professional academic analyst. Provide a deep and structured analysis of {section}:
+    1. Based solely on the provided text.
+    2. Including a review of the topic, methods, findings, and critique (if applicable).
+    3. In {language} with {detail_level} detail.
+    **Related Text:**
     {context}
+    **User Question:** {question}
+    **Academic Analysis:**""",
     input_variables=["section", "context", "question", "language", "detail_level"]
 )

 summary_prompt = PromptTemplate(
+    template="""You are an expert in academic writing. Produce a structured scientific summary (200-300 words) of the following text in {language} that includes:
+    1. Research objective
+    2. Methodology
+    3. Main findings
+    4. Conclusion
+    **Text:**
     {context}
+    **Summary:**""",
     input_variables=["context", "language"]
 )

 general_qa_prompt = PromptTemplate(
+    template="""You are an intelligent assistant. Answer the user's question in {language}:
+    **User Question:** {question}
+    Answer:""",
     input_variables=["question", "language"]
 )

 plagiarism_prompt = PromptTemplate(
+    template="""Report the percentage of similarity of the following text with English resources:
+    **Text:**
     {context}
+    **Result:** {similarity}""",
     input_variables=["context", "similarity"]
 )

 quality_prompt = PromptTemplate(
+    template="""You are a professional academic evaluator. Evaluate the scientific quality of the following text:
+    **Text:**
     {context}
+    **Score:** {score}/100
+    **Explanations:** {explanation}
+    **Improvement Suggestions:** {suggestions}""",
     input_variables=["context", "score", "explanation", "suggestions"]
 )

 def create_conversation_chain(vector_store, docs, mode, language, detail_level, section=None):
+    if mode == "Academic Analysis (RAG)":
         retriever = vector_store.as_retriever(search_kwargs={"k": 3})
         chain = ConversationalRetrievalChain.from_llm(
             llm=llm_gemini,
             retriever=retriever,
             return_source_documents=True,
+            combine_docs_chain_kwargs={"prompt": academic_analysis_prompt.partial(language=language, detail_level=detail_level, section=section or "Entire Document")},
             verbose=True
         )
+    elif mode == "Auto Summary":
         chain = LLMChain(llm=llm_gemini, prompt=summary_prompt.partial(language=language))
+    elif mode == "Plagiarism Check":
         chain = LLMChain(llm=llm_gemini, prompt=plagiarism_prompt.partial(language=language))
+    elif mode == "Quality Evaluation":
         chain = LLMChain(llm=llm_gemini, prompt=quality_prompt.partial(language=language))
     else:
         chain = LLMChain(llm=llm_gemini, prompt=general_qa_prompt.partial(language=language))
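The prompt wiring above relies on partial variables: static fields such as language are bound once, leaving only the runtime fields for invoke. (One thing a reviewer may want to double-check: plagiarism_prompt and quality_prompt declare no {language} variable, so the .partial(language=...) calls on them only work if the installed LangChain version tolerates extra partial variables.) A minimal sketch of the pattern, assuming a LangChain version where PromptTemplate.partial is available:

from langchain.prompts import PromptTemplate

# Pre-binding "language" leaves only "question" to supply at call time,
# mirroring general_qa_prompt.partial(language=language) above.
qa = PromptTemplate(
    template="Answer the user's question in {language}:\n{question}",
    input_variables=["question", "language"],
)
qa_en = qa.partial(language="English")
print(qa_en.format(question="What is RAG?"))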
@@ -370,141 +370,92 @@ def create_conversation_chain(vector_store, docs, mode, language, detail_level,

 def academic_chatbot(pdf_file, mode, query, language, detail_level, section_dropdown):
     start_time = time.time()
+    logger.info(f"Starting processing - Mode: {mode}, Question: {query}, Language: {language}, Detail: {detail_level}, Section: {section_dropdown}")

+    if mode != "Standard Response" and not pdf_file:
+        return "Please upload at least one PDF file."

+    if mode == "Standard Response":
         chain = create_conversation_chain(None, None, mode, language, detail_level)
         try:
             result = chain.invoke({"question": query})["text"]
+            return f"{result}\n\n⏱ Processing time: {time.time() - start_time:.2f} seconds"
         except Exception as e:
+            logger.error(f"Error in standard processing: {str(e)}")
+            return f"Error: {str(e)}"

     pdf_files = pdf_file if isinstance(pdf_file, list) else [pdf_file]
     _, docs, sections, error = upload_and_process_pdf(pdf_files)
     if error:
         return error

+    target_docs = docs if section_dropdown == "Entire Document" else sections.get(section_dropdown, docs)
     context = " ".join([doc.page_content for doc in target_docs])

     vector_store = None
+    if mode in ["Academic Analysis (RAG)", "Plagiarism Check", "Quality Evaluation"]:
         vector_store, vectordb_error = create_vector_db(target_docs)
         if vectordb_error:
             return vectordb_error

     chain = create_conversation_chain(vector_store, target_docs, mode, language, detail_level, section_dropdown)
     try:
+        if mode == "Auto Summary":
             time.sleep(2)
             result = chain.invoke({"context": context[:5000]})["text"]
+        elif mode == "Plagiarism Check":
             plagiarism_result = check_plagiarism(context)
             result = plagiarism_result
+        elif mode == "Quality Evaluation":
             score, explanation, suggestions, auto_fix = evaluate_quality(target_docs, sections)
             time.sleep(2)
             result = chain.invoke({"context": context[:5000], "score": score, "explanation": explanation, "suggestions": suggestions})["text"] + auto_fix
         else:
             result = chain.invoke({"question": query, "chat_history": []})["answer"]

+        if mode not in ["Plagiarism Check", "Quality Evaluation"]:
             resources = suggest_resources(context)
+            result += "\n\n**Suggested Resources:**\n" + "\n".join(resources)

+        return f"{result}\n\n⏱ Processing time: {time.time() - start_time:.2f} seconds"
     except Exception as e:
+        logger.error(f"Error in processing: {str(e)}")
         if "429" in str(e):
+            return "Error: Rate limit exceeded for Gemini API. Please wait a few minutes and try again."
+        return f"Error: {str(e)}"

+# CSS for a left-to-right (LTR) layout and a simple Light Mode design
 css = """
+body {background-color: #f0f4f8; font-family: 'Arial', sans-serif; color: #2c3e50; transition: all 0.3s ease;}
+.gr-button {background-color: #4CAF50; color: white; border: none; padding: 12px 25px; border-radius: 5px; margin-right: 15px; width: auto; display: inline-block; transition: all 0.3s ease;}
+.gr-button:hover {background-color: #45a049;}
+.gr-textbox, .gr-dropdown, .gr-radio, .gr-file {background-color: #ffffff; border: 1px solid #ddd; border-radius: 5px; padding: 12px; margin-right: 15px; width: 95%; box-sizing: border-box; font-size: 16px; color: #2c3e50; transition: all 0.3s ease;}
+.gr-row {display: flex; justify-content: space-between; margin-bottom: 15px;}
+.gr-column {padding: 15px;}
+h1, h2, h3 {color: #2c3e50; text-align: left; margin-bottom: 20px; font-size: 24px; transition: all 0.3s ease;}
+.markdown {color: #2c3e50; margin-bottom: 15px; font-size: 16px; transition: all 0.3s ease;}
+/* Better display of English words (no right-to-left alignment needed) */
+.english {display: inline; font-family: 'Arial', sans-serif; background: #e0e0e0; padding: 2px 4px; border-radius: 3px; box-shadow: 0 1px 2px rgba(0,0,0,0.1);}
-[data-theme="dark"] {
-    --bg-light: #1a202c;
-    --bg-dark: #f0f4f8;
-    --text-light: #ffffff;
-    --text-dark: #2c3e50;
-    --input-bg: #2d3748;
-    --input-border: #4a5568;
-}
-body {background-color: var(--bg-light); font-family: 'Vazir', 'Arial', sans-serif; direction: rtl; text-align: right; color: var(--text-light); transition: all 0.3s ease;}
-.gr-button {background-color: var(--button-bg); color: white; border: none; padding: 12px 25px; border-radius: 5px; margin-right: 25px; width: auto; display: inline-block; transition: all 0.3s ease;}
-.gr-button:hover {background-color: var(--button-hover);}
-.gr-textbox, .gr-dropdown, .gr-radio, .gr-file {direction: rtl; text-align: right; background-color: var(--input-bg); border: 1px solid var(--input-border); border-radius: 5px; padding: 12px; margin-right: 20px; width: 95%; box-sizing: border-box; font-size: 16px; color: var(--text-light); transition: all 0.3s ease;}
-.gr-row {display: flex; justify-content: space-between; margin-bottom: 20px;}
-.gr-column {padding: 20px;}
-h1, h2, h3 {color: var(--text-light); text-align: center; margin-bottom: 25px; font-size: 24px; transition: all 0.3s ease;}
-.markdown {direction: rtl; text-align: right; color: var(--text-light); margin-bottom: 20px; font-size: 16px; transition: all 0.3s ease;}
-/* Better display of English words within Persian text */
-body {unicode-bidi: embed;}
-body * {unicode-bidi: embed;}
-.english {direction: ltr; display: inline-block; margin-left: 10px; padding: 3px 5px; font-family: 'Arial', sans-serif; background: var(--input-bg); border-radius: 3px; box-shadow: 0 1px 2px rgba(0,0,0,0.1); color: var(--text-light);}
-/* Style the dropdown-menu arrows */
-.gr-dropdown {position: relative;}
-.gr-dropdown select {direction: rtl; text-align: right; padding: 12px 40px 12px 15px; appearance: none; background: url('data:image/svg+xml;utf8,<svg fill="%23ffffff" height="24" viewBox="0 0 24 24" width="24" xmlns="http://www.w3.org/2000/svg"><path d="M7 10l5 5 5-5z"/></svg>') no-repeat right 15px center; background-size: 20px; border: 1px solid var(--input-border); border-radius: 5px; font-size: 16px; color: var(--text-light); background-color: var(--input-bg);}
-.gr-dropdown select option {direction: rtl; text-align: right; padding: 10px; background-color: var(--input-bg); color: var(--text-light);}
-
-/* Dark/Light Mode toggle */
-#theme-toggle {position: fixed; top: 10px; left: 10px; padding: 8px 15px; background-color: var(--button-bg); color: white; border-radius: 5px; cursor: pointer; z-index: 1000; transition: all 0.3s ease;}
-#theme-toggle:hover {background-color: var(--button-hover);}
-"""
-
-# JavaScript for switching the theme
-js = """
-function toggleTheme() {
-    const body = document.body;
-    const currentTheme = body.getAttribute('data-theme') || 'light';
-    const newTheme = currentTheme === 'light' ? 'dark' : 'light';
-    body.setAttribute('data-theme', newTheme);
-    const button = document.getElementById('theme-toggle');
-    button.textContent = newTheme === 'dark' ? 'تغییر به Light Mode' : 'تغییر به Dark Mode';
-    return newTheme;
-}
-
-document.getElementById('theme-toggle').addEventListener('click', function() {
-    toggleTheme();
-});
 """

+with gr.Blocks(css=css, title="Professional Thesis Analyzer with Gemini") as iface:
+    gr.Markdown("# Professional Thesis Analyzer with Gemini")
+    gr.Markdown("Upload your <span class='english'>PDF</span> file and use the analysis, summary, plagiarism check, or quality evaluation features.")
     with gr.Row():
         with gr.Column():
+            pdf_input = gr.File(file_types=['.pdf'], label="Upload <span class='english'>PDF</span> File", file_count="multiple")
             mode = gr.Radio(
+                ["Academic Analysis (RAG)", "Auto Summary", "Plagiarism Check", "Quality Evaluation", "Standard Response"],
+                label="Processing Mode",
+                value="Academic Analysis (RAG)"
             )
+            query = gr.Textbox(lines=3, placeholder="Enter your question or request here...", label="Question or Request")
+            section = gr.Dropdown(["Entire Document", "Introduction", "Methodology", "Results", "Discussion", "References"], label="Target Section", value="Entire Document")
+            language = gr.Dropdown(["English", "Farsi"], label="Response Language", value="English")
+            detail = gr.Dropdown(["Brief", "Detailed"], label="Detail Level", value="Detailed")
+            submit = gr.Button("Submit")
         with gr.Column():
+            output = gr.Textbox(label="Processing Result", lines=10, placeholder="Results will be displayed here...")

     submit.click(
         fn=academic_chatbot,
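The diff is truncated inside the submit.click(...) call, so its full argument list is not shown here. For orientation, a minimal Blocks sketch of the same wiring pattern (component names and handler are hypothetical, not the app's actual call): the fn receives the listed input components' values in order, and its return value fills the output component.

import gradio as gr

# Minimal sketch of Blocks event wiring, not the app's actual call.
def echo(message):
    return f"You said: {message}"

with gr.Blocks() as demo:
    box = gr.Textbox(label="Message")
    btn = gr.Button("Submit")
    out = gr.Textbox(label="Result")
    btn.click(fn=echo, inputs=[box], outputs=[out])

demo.launch()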