Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -2,15 +2,14 @@
|
|
| 2 |
import sys
|
| 3 |
import subprocess
|
| 4 |
import importlib
|
|
|
|
| 5 |
|
| 6 |
-
# List of required packages
|
| 7 |
required_packages = {
|
| 8 |
'gradio': 'gradio>=3.0',
|
| 9 |
'pandas': 'pandas',
|
| 10 |
'PyPDF2': 'PyPDF2',
|
| 11 |
'transformers': 'transformers',
|
| 12 |
-
'pdfplumber': 'pdfplumber'
|
| 13 |
-
'typing_extensions': 'typing_extensions'
|
| 14 |
}
|
| 15 |
|
| 16 |
def check_and_install_packages():
|
|
@@ -23,12 +22,7 @@ def check_and_install_packages():
|
|
| 23 |
|
| 24 |
if missing_packages:
|
| 25 |
print(f"Missing packages: {', '.join(missing_packages)}")
|
| 26 |
-
|
| 27 |
-
try:
|
| 28 |
-
subprocess.check_call([sys.executable, "-m", "pip", "install", *missing_packages])
|
| 29 |
-
print("Installation successful.")
|
| 30 |
-
except subprocess.CalledProcessError as e:
|
| 31 |
-
print(f"Failed to install packages. Error: {e}")
|
| 32 |
|
| 33 |
check_and_install_packages()
|
| 34 |
|
|
@@ -59,6 +53,7 @@ class UniversalTranscriptParser:
|
|
| 59 |
}
|
| 60 |
|
| 61 |
def parse_transcript(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
|
|
|
| 62 |
transcript_type = self._identify_transcript_type(text)
|
| 63 |
|
| 64 |
if transcript_type == 'homeschool':
|
|
@@ -69,6 +64,7 @@ class UniversalTranscriptParser:
|
|
| 69 |
return self._parse_miami_dade(text)
|
| 70 |
|
| 71 |
def _identify_transcript_type(self, text: str) -> str:
|
|
|
|
| 72 |
if re.search(r'Sample OFFICIAL HIGH SCHOOL TRANSCRIPT', text):
|
| 73 |
return 'homeschool'
|
| 74 |
elif re.search(r'DORAL ACADEMY HIGH SCHOOL', text):
|
|
@@ -76,22 +72,27 @@ class UniversalTranscriptParser:
|
|
| 76 |
return 'miami_dade'
|
| 77 |
|
| 78 |
def _parse_homeschool(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
|
|
|
| 79 |
courses = []
|
| 80 |
current_grade = None
|
| 81 |
current_year = None
|
| 82 |
|
|
|
|
| 83 |
student_info = {}
|
| 84 |
name_match = re.search(r'Student Name:\s*(.+)\s*SSN:', text)
|
| 85 |
if name_match:
|
| 86 |
student_info['name'] = name_match.group(1).strip()
|
| 87 |
|
|
|
|
| 88 |
for line in text.split('\n'):
|
|
|
|
| 89 |
grade_match = re.match(r'^\|?\s*(\d+th Grade)\s*\|.*(\d{4}-\d{4})', line)
|
| 90 |
if grade_match:
|
| 91 |
current_grade = grade_match.group(1)
|
| 92 |
current_year = grade_match.group(2)
|
| 93 |
continue
|
| 94 |
|
|
|
|
| 95 |
course_match = re.match(
|
| 96 |
r'^\|?\s*([^\|]+?)\s*\|\s*([A-Z][+*]?)\s*\|\s*([^\|]+)\s*\|\s*(\d+\.?\d*)\s*\|\s*(\d+)',
|
| 97 |
line
|
|
@@ -99,6 +100,7 @@ class UniversalTranscriptParser:
|
|
| 99 |
|
| 100 |
if course_match and current_grade:
|
| 101 |
course_name = course_match.group(1).strip()
|
|
|
|
| 102 |
course_name = re.sub(r'^\|?\s*', '', course_name)
|
| 103 |
|
| 104 |
courses.append({
|
|
@@ -112,33 +114,40 @@ class UniversalTranscriptParser:
|
|
| 112 |
'transcript_type': 'homeschool'
|
| 113 |
})
|
| 114 |
|
|
|
|
| 115 |
gpa_data = {}
|
| 116 |
gpa_match = re.search(r'Cum\. GPA\s*\|\s*([\d\.]+)', text)
|
| 117 |
if gpa_match:
|
| 118 |
gpa_data['unweighted'] = gpa_match.group(1)
|
| 119 |
-
gpa_data['weighted'] = gpa_match.group(1)
|
| 120 |
|
| 121 |
return {
|
| 122 |
'student_info': student_info,
|
| 123 |
-
'courses': {'All': courses},
|
| 124 |
'gpa': gpa_data,
|
| 125 |
'grade_level': current_grade.replace('th Grade', '') if current_grade else "Unknown"
|
| 126 |
}
|
| 127 |
|
| 128 |
def _parse_doral_academy(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
|
|
|
| 129 |
courses = []
|
|
|
|
|
|
|
| 130 |
student_info = {}
|
| 131 |
name_match = re.search(r'LEGAL NAME:\s*([^\n]+)', text)
|
| 132 |
if name_match:
|
| 133 |
student_info['name'] = name_match.group(1).strip()
|
| 134 |
|
|
|
|
| 135 |
year_pattern = re.compile(r'YEAR:\s*(\d{4}-\d{4})\s*GRADE LEVEL:\s*(\d{2})', re.MULTILINE)
|
| 136 |
year_matches = year_pattern.finditer(text)
|
| 137 |
|
|
|
|
| 138 |
grade_year_map = {}
|
| 139 |
for match in year_matches:
|
| 140 |
grade_year_map[match.group(2)] = match.group(1)
|
| 141 |
|
|
|
|
| 142 |
course_pattern = re.compile(
|
| 143 |
r'(\d)\s+(\d{7})\s+([^\n]+?)\s+([A-Z]{2})\s+([A-Z])\s+([A-Z])\s+([A-Z])\s+(\d\.\d{2})\s+(\d\.\d{2})',
|
| 144 |
re.MULTILINE
|
|
@@ -166,6 +175,7 @@ class UniversalTranscriptParser:
|
|
| 166 |
|
| 167 |
courses_by_grade[grade_level_num].append(course_info)
|
| 168 |
|
|
|
|
| 169 |
gpa_data = {}
|
| 170 |
unweighted_match = re.search(r'Un-weighted GPA\s*([\d\.]+)', text)
|
| 171 |
weighted_match = re.search(r'Weighted GPA\s*([\d\.]+)', text)
|
|
@@ -175,6 +185,7 @@ class UniversalTranscriptParser:
|
|
| 175 |
if weighted_match:
|
| 176 |
gpa_data['weighted'] = weighted_match.group(1)
|
| 177 |
|
|
|
|
| 178 |
grade_level = "12" if re.search(r'GRADE LEVEL:\s*12', text) else "Unknown"
|
| 179 |
|
| 180 |
return {
|
|
@@ -185,14 +196,17 @@ class UniversalTranscriptParser:
|
|
| 185 |
}
|
| 186 |
|
| 187 |
def _parse_miami_dade(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
|
|
|
| 188 |
courses = []
|
| 189 |
courses_by_grade = defaultdict(list)
|
| 190 |
|
|
|
|
| 191 |
student_info = {}
|
| 192 |
name_match = re.search(r'0783977 - ([^,]+),\s*([^\n]+)', text)
|
| 193 |
if name_match:
|
| 194 |
student_info['name'] = f"{name_match.group(2)} {name_match.group(1)}"
|
| 195 |
|
|
|
|
| 196 |
course_pattern = re.compile(
|
| 197 |
r'([A-Z]-[A-Za-z\s&]+)\s*\|\s*(\d{4}-\d{4})\s*\|\s*(\d{2})\s*\|\s*([A-Z0-9]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([A-Z]?)\s*\|\s*([A-Z]?)\s*\|\s*([^\|]+)',
|
| 198 |
re.MULTILINE
|
|
@@ -218,11 +232,13 @@ class UniversalTranscriptParser:
|
|
| 218 |
|
| 219 |
courses_by_grade[match.group(3)].append(course_info)
|
| 220 |
|
|
|
|
| 221 |
gpa_data = {
|
| 222 |
'weighted': extract_gpa(text, 'Weighted GPA'),
|
| 223 |
'unweighted': extract_gpa(text, 'Un-weighted GPA')
|
| 224 |
}
|
| 225 |
|
|
|
|
| 226 |
grade_level = re.search(r'Current Grade:\s*(\d+)', text).group(1) if re.search(r'Current Grade:\s*(\d+)', text) else "Unknown"
|
| 227 |
|
| 228 |
return {
|
|
@@ -274,85 +290,16 @@ def parse_transcript(file):
|
|
| 274 |
|
| 275 |
parsed_data = parser.parse_transcript(text)
|
| 276 |
|
| 277 |
-
|
| 278 |
-
|
| 279 |
-
|
| 280 |
-
|
| 281 |
-
|
| 282 |
-
output_text += f"Current Grade Level: {parsed_data.get('grade_level', 'Unknown')}\n"
|
| 283 |
-
|
| 284 |
-
if 'gpa' in parsed_data:
|
| 285 |
-
gpa = parsed_data['gpa']
|
| 286 |
-
output_text += f"Weighted GPA: {gpa.get('weighted', 'N/A')}\n"
|
| 287 |
-
output_text += f"Unweighted GPA: {gpa.get('unweighted', 'N/A')}\n\n"
|
| 288 |
-
|
| 289 |
-
output_text += "Course History:\n{'='*40}\n"
|
| 290 |
-
|
| 291 |
-
if 'courses' in parsed_data:
|
| 292 |
-
courses_by_grade = parsed_data['courses']
|
| 293 |
-
|
| 294 |
-
def grade_sort_key(grade):
|
| 295 |
-
try:
|
| 296 |
-
num = int(re.search(r'\d+', grade).group())
|
| 297 |
-
return num
|
| 298 |
-
except (AttributeError, ValueError):
|
| 299 |
-
return float('inf')
|
| 300 |
-
|
| 301 |
-
grades_sorted = sorted(courses_by_grade.keys(), key=grade_sort_key)
|
| 302 |
-
|
| 303 |
-
for grade in grades_sorted:
|
| 304 |
-
output_text += f"\nGrade {grade}:\n{'-'*30}\n"
|
| 305 |
-
for course in courses_by_grade[grade]:
|
| 306 |
-
output_text += f"- {course.get('name', 'Unnamed Course')}"
|
| 307 |
-
if 'grade' in course and course['grade']:
|
| 308 |
-
output_text += f" (Grade: {course['grade']})"
|
| 309 |
-
if 'credits' in course:
|
| 310 |
-
output_text += f" | Credits: {course['credits']}"
|
| 311 |
-
if 'school_year' in course:
|
| 312 |
-
output_text += f" | Year: {course['school_year']}"
|
| 313 |
-
output_text += "\n"
|
| 314 |
|
| 315 |
return output_text, parsed_data
|
| 316 |
else:
|
| 317 |
return "Unsupported file format (PDF only for transcript parsing)", None
|
| 318 |
|
| 319 |
-
def transcript_display(transcript_dict):
|
| 320 |
-
if not transcript_dict or "courses" not in transcript_dict:
|
| 321 |
-
return "No course information available"
|
| 322 |
-
|
| 323 |
-
display = "### Detailed Course History\n"
|
| 324 |
-
courses_by_grade = transcript_dict["courses"]
|
| 325 |
-
|
| 326 |
-
if isinstance(courses_by_grade, dict):
|
| 327 |
-
def grade_sort_key(grade):
|
| 328 |
-
try:
|
| 329 |
-
num = int(re.search(r'\d+', grade).group())
|
| 330 |
-
return num
|
| 331 |
-
except (AttributeError, ValueError):
|
| 332 |
-
return float('inf')
|
| 333 |
-
|
| 334 |
-
grades_sorted = sorted(courses_by_grade.keys(), key=grade_sort_key)
|
| 335 |
-
|
| 336 |
-
for grade in grades_sorted:
|
| 337 |
-
display += f"\n**Grade {grade}**\n"
|
| 338 |
-
for course in courses_by_grade[grade]:
|
| 339 |
-
display += f"- {course.get('name', 'Unnamed Course')}"
|
| 340 |
-
if 'grade' in course and course['grade']:
|
| 341 |
-
display += f" (Grade: {course['grade']})"
|
| 342 |
-
if 'credits' in course:
|
| 343 |
-
display += f" | Credits: {course['credits']}"
|
| 344 |
-
if 'school_year' in course:
|
| 345 |
-
display += f" | Year: {course['school_year']}"
|
| 346 |
-
display += "\n"
|
| 347 |
-
|
| 348 |
-
if 'gpa' in transcript_dict:
|
| 349 |
-
gpa = transcript_dict['gpa']
|
| 350 |
-
display += "\n**GPA Information**\n"
|
| 351 |
-
display += f"- Unweighted: {gpa.get('unweighted', 'N/A')}\n"
|
| 352 |
-
display += f"- Weighted: {gpa.get('weighted', 'N/A')}\n"
|
| 353 |
-
|
| 354 |
-
return display
|
| 355 |
-
|
| 356 |
# ========== LEARNING STYLE QUIZ ==========
|
| 357 |
learning_style_questions = [
|
| 358 |
"When you study for a test, you prefer to:",
|
|
@@ -421,16 +368,20 @@ def learning_style_quiz(*answers):
|
|
| 421 |
max_score = max(scores.values())
|
| 422 |
total_questions = len(learning_style_questions)
|
| 423 |
|
|
|
|
| 424 |
percentages = {style: (score/total_questions)*100 for style, score in scores.items()}
|
| 425 |
|
|
|
|
| 426 |
sorted_styles = sorted(scores.items(), key=lambda x: x[1], reverse=True)
|
| 427 |
|
|
|
|
| 428 |
result = "Your Learning Style Results:\n\n"
|
| 429 |
for style, score in sorted_styles:
|
| 430 |
result += f"{style}: {score}/{total_questions} ({percentages[style]:.1f}%)\n"
|
| 431 |
|
| 432 |
result += "\n"
|
| 433 |
|
|
|
|
| 434 |
primary_styles = [style for style, score in scores.items() if score == max_score]
|
| 435 |
|
| 436 |
if len(primary_styles) == 1:
|
|
@@ -453,7 +404,7 @@ def learning_style_quiz(*answers):
|
|
| 453 |
result += "- Create summaries in your own words\n"
|
| 454 |
result += "- Read textbooks and articles\n"
|
| 455 |
result += "- Make lists to organize information\n"
|
| 456 |
-
else:
|
| 457 |
result += "Tips for Kinesthetic Learners:\n"
|
| 458 |
result += "- Use hands-on activities\n"
|
| 459 |
result += "- Take frequent movement breaks\n"
|
|
@@ -469,6 +420,7 @@ def learning_style_quiz(*answers):
|
|
| 469 |
def save_profile(name, age, interests, transcript, learning_style,
|
| 470 |
movie, movie_reason, show, show_reason,
|
| 471 |
book, book_reason, character, character_reason, blog):
|
|
|
|
| 472 |
age = int(age) if age else 0
|
| 473 |
|
| 474 |
favorites = {
|
|
@@ -501,8 +453,9 @@ def save_profile(name, age, interests, transcript, learning_style,
|
|
| 501 |
**Age:** {age}
|
| 502 |
**Interests:** {interests}
|
| 503 |
**Learning Style:** {learning_style}
|
| 504 |
-
####
|
| 505 |
-
{
|
|
|
|
| 506 |
#### Favorites:
|
| 507 |
- Movie: {favorites['movie']} ({favorites['movie_reason']})
|
| 508 |
- Show: {favorites['show']} ({favorites['show_reason']})
|
|
@@ -528,107 +481,96 @@ def generate_response(message, history):
|
|
| 528 |
if not profile:
|
| 529 |
return "Please complete and save your profile first using the previous tabs."
|
| 530 |
|
|
|
|
| 531 |
learning_style = profile.get("learning_style", "")
|
| 532 |
-
|
| 533 |
-
gpa =
|
| 534 |
-
|
| 535 |
-
courses = profile.get("transcript", {}).get("courses", {})
|
| 536 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 537 |
greetings = ["hi", "hello", "hey"]
|
| 538 |
study_help = ["study", "learn", "prepare", "exam"]
|
| 539 |
-
grade_help = ["
|
| 540 |
-
|
| 541 |
-
course_help = ["courses", "classes", "transcript", "schedule"]
|
| 542 |
|
| 543 |
if any(greet in message.lower() for greet in greetings):
|
| 544 |
return f"Hello {profile.get('name', 'there')}! How can I help you today?"
|
| 545 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 546 |
elif any(word in message.lower() for word in study_help):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 547 |
if "Visual" in learning_style:
|
| 548 |
-
response
|
| 549 |
-
"- Creating mind maps or diagrams\n"
|
| 550 |
-
"- Using color-coded notes\n"
|
| 551 |
-
"- Watching educational videos")
|
| 552 |
elif "Auditory" in learning_style:
|
| 553 |
-
response
|
| 554 |
-
"- Recording lectures and listening to them\n"
|
| 555 |
-
"- Participating in study groups\n"
|
| 556 |
-
"- Explaining concepts out loud")
|
| 557 |
elif "Reading/Writing" in learning_style:
|
| 558 |
-
response
|
| 559 |
-
"- Writing detailed notes\n"
|
| 560 |
-
"- Creating summaries in your own words\n"
|
| 561 |
-
"- Reading textbooks and articles")
|
| 562 |
elif "Kinesthetic" in learning_style:
|
| 563 |
-
response
|
| 564 |
-
"- Hands-on practice\n"
|
| 565 |
-
"- Creating physical models\n"
|
| 566 |
-
"- Taking frequent movement breaks")
|
| 567 |
-
else:
|
| 568 |
-
response = ("Here are some general study tips:\n"
|
| 569 |
-
"- Break study sessions into 25-minute chunks\n"
|
| 570 |
-
"- Review material regularly\n"
|
| 571 |
-
"- Teach concepts to someone else")
|
| 572 |
|
| 573 |
return response
|
| 574 |
|
| 575 |
-
elif any(word in message.lower() for word in grade_help):
|
| 576 |
-
return (f"Your GPA information:\n"
|
| 577 |
-
f"- Unweighted: {gpa.get('unweighted', 'N/A')}\n"
|
| 578 |
-
f"- Weighted: {gpa.get('weighted', 'N/A')}\n\n"
|
| 579 |
-
"To improve your grades, try:\n"
|
| 580 |
-
"- Setting specific goals\n"
|
| 581 |
-
"- Meeting with teachers\n"
|
| 582 |
-
"- Developing a study schedule")
|
| 583 |
-
|
| 584 |
-
elif any(word in message.lower() for word in interest_help):
|
| 585 |
-
return (f"I see you're interested in: {interests}\n\n"
|
| 586 |
-
"You might want to:\n"
|
| 587 |
-
"- Find clubs or activities related to these interests\n"
|
| 588 |
-
"- Explore career paths that align with them")
|
| 589 |
-
|
| 590 |
elif any(word in message.lower() for word in course_help):
|
| 591 |
-
|
| 592 |
-
|
| 593 |
-
|
| 594 |
-
|
| 595 |
-
|
| 596 |
-
|
| 597 |
-
|
| 598 |
-
|
| 599 |
-
|
| 600 |
-
|
| 601 |
-
|
| 602 |
-
|
| 603 |
-
|
| 604 |
-
|
| 605 |
-
|
| 606 |
-
if 'grade' in course:
|
| 607 |
-
response += f" (Grade: {course['grade']})"
|
| 608 |
-
response += "\n"
|
| 609 |
-
else:
|
| 610 |
-
response += "No detailed course information available."
|
| 611 |
return response
|
| 612 |
|
| 613 |
elif "help" in message.lower():
|
| 614 |
return ("I can help with:\n"
|
| 615 |
-
"-
|
| 616 |
-
"-
|
| 617 |
-
"- Course
|
| 618 |
-
"-
|
| 619 |
-
"Try asking about study strategies or your grades!")
|
| 620 |
|
| 621 |
else:
|
| 622 |
return ("I'm your personalized teaching assistant. "
|
| 623 |
-
"
|
| 624 |
-
"Try asking about how to study for your classes!")
|
| 625 |
|
| 626 |
# ========== GRADIO INTERFACE ==========
|
| 627 |
with gr.Blocks() as app:
|
| 628 |
with gr.Tab("Step 1: Upload Transcript"):
|
| 629 |
gr.Markdown("### Upload your transcript (PDF recommended)")
|
| 630 |
transcript_file = gr.File(label="Transcript file", file_types=[".pdf"])
|
| 631 |
-
transcript_output = gr.Textbox(label="Transcript Results", lines=
|
| 632 |
transcript_data = gr.State()
|
| 633 |
transcript_file.change(
|
| 634 |
fn=parse_transcript,
|
|
@@ -681,13 +623,12 @@ with gr.Blocks() as app:
|
|
| 681 |
chatbot = gr.ChatInterface(
|
| 682 |
fn=generate_response,
|
| 683 |
examples=[
|
| 684 |
-
"
|
| 685 |
-
"
|
| 686 |
-
"
|
| 687 |
-
"How can I improve my grades?"
|
| 688 |
]
|
| 689 |
)
|
| 690 |
|
| 691 |
-
# ========== RUN APPLICATION ==========
|
| 692 |
if __name__ == "__main__":
|
| 693 |
-
app.launch()
|
|
|
|
|
|
| 2 |
import sys
|
| 3 |
import subprocess
|
| 4 |
import importlib
|
| 5 |
+
from datetime import datetime
|
| 6 |
|
|
|
|
| 7 |
required_packages = {
|
| 8 |
'gradio': 'gradio>=3.0',
|
| 9 |
'pandas': 'pandas',
|
| 10 |
'PyPDF2': 'PyPDF2',
|
| 11 |
'transformers': 'transformers',
|
| 12 |
+
'pdfplumber': 'pdfplumber'
|
|
|
|
| 13 |
}
|
| 14 |
|
| 15 |
def check_and_install_packages():
|
|
|
|
| 22 |
|
| 23 |
if missing_packages:
|
| 24 |
print(f"Missing packages: {', '.join(missing_packages)}")
|
| 25 |
+
subprocess.check_call([sys.executable, "-m", "pip", "install", *missing_packages])
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 26 |
|
| 27 |
check_and_install_packages()
|
| 28 |
|
|
|
|
| 53 |
}
|
| 54 |
|
| 55 |
def parse_transcript(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
| 56 |
+
"""Determine transcript type and parse accordingly"""
|
| 57 |
transcript_type = self._identify_transcript_type(text)
|
| 58 |
|
| 59 |
if transcript_type == 'homeschool':
|
|
|
|
| 64 |
return self._parse_miami_dade(text)
|
| 65 |
|
| 66 |
def _identify_transcript_type(self, text: str) -> str:
|
| 67 |
+
"""Identify which type of transcript we're processing"""
|
| 68 |
if re.search(r'Sample OFFICIAL HIGH SCHOOL TRANSCRIPT', text):
|
| 69 |
return 'homeschool'
|
| 70 |
elif re.search(r'DORAL ACADEMY HIGH SCHOOL', text):
|
|
|
|
| 72 |
return 'miami_dade'
|
| 73 |
|
| 74 |
def _parse_homeschool(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
| 75 |
+
"""Parse homeschool transcript format"""
|
| 76 |
courses = []
|
| 77 |
current_grade = None
|
| 78 |
current_year = None
|
| 79 |
|
| 80 |
+
# Extract student info
|
| 81 |
student_info = {}
|
| 82 |
name_match = re.search(r'Student Name:\s*(.+)\s*SSN:', text)
|
| 83 |
if name_match:
|
| 84 |
student_info['name'] = name_match.group(1).strip()
|
| 85 |
|
| 86 |
+
# Process each line
|
| 87 |
for line in text.split('\n'):
|
| 88 |
+
# Check for grade level header
|
| 89 |
grade_match = re.match(r'^\|?\s*(\d+th Grade)\s*\|.*(\d{4}-\d{4})', line)
|
| 90 |
if grade_match:
|
| 91 |
current_grade = grade_match.group(1)
|
| 92 |
current_year = grade_match.group(2)
|
| 93 |
continue
|
| 94 |
|
| 95 |
+
# Course line pattern
|
| 96 |
course_match = re.match(
|
| 97 |
r'^\|?\s*([^\|]+?)\s*\|\s*([A-Z][+*]?)\s*\|\s*([^\|]+)\s*\|\s*(\d+\.?\d*)\s*\|\s*(\d+)',
|
| 98 |
line
|
|
|
|
| 100 |
|
| 101 |
if course_match and current_grade:
|
| 102 |
course_name = course_match.group(1).strip()
|
| 103 |
+
# Clean course names that start with | or have extra spaces
|
| 104 |
course_name = re.sub(r'^\|?\s*', '', course_name)
|
| 105 |
|
| 106 |
courses.append({
|
|
|
|
| 114 |
'transcript_type': 'homeschool'
|
| 115 |
})
|
| 116 |
|
| 117 |
+
# Extract GPA information from homeschool transcript
|
| 118 |
gpa_data = {}
|
| 119 |
gpa_match = re.search(r'Cum\. GPA\s*\|\s*([\d\.]+)', text)
|
| 120 |
if gpa_match:
|
| 121 |
gpa_data['unweighted'] = gpa_match.group(1)
|
| 122 |
+
gpa_data['weighted'] = gpa_match.group(1) # Homeschool often has same weighted/unweighted
|
| 123 |
|
| 124 |
return {
|
| 125 |
'student_info': student_info,
|
| 126 |
+
'courses': {'All': courses}, # Homeschool doesn't separate by grade in same way
|
| 127 |
'gpa': gpa_data,
|
| 128 |
'grade_level': current_grade.replace('th Grade', '') if current_grade else "Unknown"
|
| 129 |
}
|
| 130 |
|
| 131 |
def _parse_doral_academy(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
| 132 |
+
"""Parse Doral Academy specific format"""
|
| 133 |
courses = []
|
| 134 |
+
|
| 135 |
+
# Extract student info
|
| 136 |
student_info = {}
|
| 137 |
name_match = re.search(r'LEGAL NAME:\s*([^\n]+)', text)
|
| 138 |
if name_match:
|
| 139 |
student_info['name'] = name_match.group(1).strip()
|
| 140 |
|
| 141 |
+
# Extract school year information
|
| 142 |
year_pattern = re.compile(r'YEAR:\s*(\d{4}-\d{4})\s*GRADE LEVEL:\s*(\d{2})', re.MULTILINE)
|
| 143 |
year_matches = year_pattern.finditer(text)
|
| 144 |
|
| 145 |
+
# Create mapping of grade levels to years
|
| 146 |
grade_year_map = {}
|
| 147 |
for match in year_matches:
|
| 148 |
grade_year_map[match.group(2)] = match.group(1)
|
| 149 |
|
| 150 |
+
# Course pattern for Doral Academy
|
| 151 |
course_pattern = re.compile(
|
| 152 |
r'(\d)\s+(\d{7})\s+([^\n]+?)\s+([A-Z]{2})\s+([A-Z])\s+([A-Z])\s+([A-Z])\s+(\d\.\d{2})\s+(\d\.\d{2})',
|
| 153 |
re.MULTILINE
|
|
|
|
| 175 |
|
| 176 |
courses_by_grade[grade_level_num].append(course_info)
|
| 177 |
|
| 178 |
+
# Extract GPA information from Doral Academy transcript
|
| 179 |
gpa_data = {}
|
| 180 |
unweighted_match = re.search(r'Un-weighted GPA\s*([\d\.]+)', text)
|
| 181 |
weighted_match = re.search(r'Weighted GPA\s*([\d\.]+)', text)
|
|
|
|
| 185 |
if weighted_match:
|
| 186 |
gpa_data['weighted'] = weighted_match.group(1)
|
| 187 |
|
| 188 |
+
# Extract current grade level
|
| 189 |
grade_level = "12" if re.search(r'GRADE LEVEL:\s*12', text) else "Unknown"
|
| 190 |
|
| 191 |
return {
|
|
|
|
| 196 |
}
|
| 197 |
|
| 198 |
def _parse_miami_dade(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
|
| 199 |
+
"""Parse standard Miami-Dade format"""
|
| 200 |
courses = []
|
| 201 |
courses_by_grade = defaultdict(list)
|
| 202 |
|
| 203 |
+
# Extract student info
|
| 204 |
student_info = {}
|
| 205 |
name_match = re.search(r'0783977 - ([^,]+),\s*([^\n]+)', text)
|
| 206 |
if name_match:
|
| 207 |
student_info['name'] = f"{name_match.group(2)} {name_match.group(1)}"
|
| 208 |
|
| 209 |
+
# Course pattern for Miami-Dade
|
| 210 |
course_pattern = re.compile(
|
| 211 |
r'([A-Z]-[A-Za-z\s&]+)\s*\|\s*(\d{4}-\d{4})\s*\|\s*(\d{2})\s*\|\s*([A-Z0-9]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([A-Z]?)\s*\|\s*([A-Z]?)\s*\|\s*([^\|]+)',
|
| 212 |
re.MULTILINE
|
|
|
|
| 232 |
|
| 233 |
courses_by_grade[match.group(3)].append(course_info)
|
| 234 |
|
| 235 |
+
# Extract GPA information
|
| 236 |
gpa_data = {
|
| 237 |
'weighted': extract_gpa(text, 'Weighted GPA'),
|
| 238 |
'unweighted': extract_gpa(text, 'Un-weighted GPA')
|
| 239 |
}
|
| 240 |
|
| 241 |
+
# Extract current grade level
|
| 242 |
grade_level = re.search(r'Current Grade:\s*(\d+)', text).group(1) if re.search(r'Current Grade:\s*(\d+)', text) else "Unknown"
|
| 243 |
|
| 244 |
return {
|
|
|
|
| 290 |
|
| 291 |
parsed_data = parser.parse_transcript(text)
|
| 292 |
|
| 293 |
+
# Only show GPA in the output
|
| 294 |
+
output_text = f"Transcript Processed Successfully!\n\n"
|
| 295 |
+
output_text += f"GPA Information:\n"
|
| 296 |
+
output_text += f"- Weighted: {parsed_data['gpa'].get('weighted', 'N/A')}\n"
|
| 297 |
+
output_text += f"- Unweighted: {parsed_data['gpa'].get('unweighted', 'N/A')}"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 298 |
|
| 299 |
return output_text, parsed_data
|
| 300 |
else:
|
| 301 |
return "Unsupported file format (PDF only for transcript parsing)", None
|
| 302 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 303 |
# ========== LEARNING STYLE QUIZ ==========
|
| 304 |
learning_style_questions = [
|
| 305 |
"When you study for a test, you prefer to:",
|
|
|
|
| 368 |
max_score = max(scores.values())
|
| 369 |
total_questions = len(learning_style_questions)
|
| 370 |
|
| 371 |
+
# Calculate percentages
|
| 372 |
percentages = {style: (score/total_questions)*100 for style, score in scores.items()}
|
| 373 |
|
| 374 |
+
# Sort styles by score (descending)
|
| 375 |
sorted_styles = sorted(scores.items(), key=lambda x: x[1], reverse=True)
|
| 376 |
|
| 377 |
+
# Prepare detailed results
|
| 378 |
result = "Your Learning Style Results:\n\n"
|
| 379 |
for style, score in sorted_styles:
|
| 380 |
result += f"{style}: {score}/{total_questions} ({percentages[style]:.1f}%)\n"
|
| 381 |
|
| 382 |
result += "\n"
|
| 383 |
|
| 384 |
+
# Determine primary and secondary styles
|
| 385 |
primary_styles = [style for style, score in scores.items() if score == max_score]
|
| 386 |
|
| 387 |
if len(primary_styles) == 1:
|
|
|
|
| 404 |
result += "- Create summaries in your own words\n"
|
| 405 |
result += "- Read textbooks and articles\n"
|
| 406 |
result += "- Make lists to organize information\n"
|
| 407 |
+
else: # Kinesthetic
|
| 408 |
result += "Tips for Kinesthetic Learners:\n"
|
| 409 |
result += "- Use hands-on activities\n"
|
| 410 |
result += "- Take frequent movement breaks\n"
|
|
|
|
| 420 |
def save_profile(name, age, interests, transcript, learning_style,
|
| 421 |
movie, movie_reason, show, show_reason,
|
| 422 |
book, book_reason, character, character_reason, blog):
|
| 423 |
+
# Convert age to int if it's a numpy number (from gradio Number input)
|
| 424 |
age = int(age) if age else 0
|
| 425 |
|
| 426 |
favorites = {
|
|
|
|
| 453 |
**Age:** {age}
|
| 454 |
**Interests:** {interests}
|
| 455 |
**Learning Style:** {learning_style}
|
| 456 |
+
#### GPA Information:
|
| 457 |
+
- Weighted: {transcript['gpa'].get('weighted', 'N/A')}
|
| 458 |
+
- Unweighted: {transcript['gpa'].get('unweighted', 'N/A')}
|
| 459 |
#### Favorites:
|
| 460 |
- Movie: {favorites['movie']} ({favorites['movie_reason']})
|
| 461 |
- Show: {favorites['show']} ({favorites['show_reason']})
|
|
|
|
| 481 |
if not profile:
|
| 482 |
return "Please complete and save your profile first using the previous tabs."
|
| 483 |
|
| 484 |
+
# Get profile data
|
| 485 |
learning_style = profile.get("learning_style", "")
|
| 486 |
+
transcript = profile.get("transcript", {})
|
| 487 |
+
gpa = transcript.get("gpa", {})
|
| 488 |
+
courses = []
|
|
|
|
| 489 |
|
| 490 |
+
# Flatten all courses from all grades
|
| 491 |
+
if 'courses' in transcript:
|
| 492 |
+
if isinstance(transcript['courses'], dict):
|
| 493 |
+
for grade_courses in transcript['courses'].values():
|
| 494 |
+
courses.extend(grade_courses)
|
| 495 |
+
elif isinstance(transcript['courses'], list):
|
| 496 |
+
courses = transcript['courses']
|
| 497 |
+
|
| 498 |
+
# Common responses
|
| 499 |
greetings = ["hi", "hello", "hey"]
|
| 500 |
study_help = ["study", "learn", "prepare", "exam"]
|
| 501 |
+
grade_help = ["gpa", "grade point average", "grades"]
|
| 502 |
+
course_help = ["courses", "classes", "subjects"]
|
|
|
|
| 503 |
|
| 504 |
if any(greet in message.lower() for greet in greetings):
|
| 505 |
return f"Hello {profile.get('name', 'there')}! How can I help you today?"
|
| 506 |
|
| 507 |
+
elif any(word in message.lower() for word in grade_help):
|
| 508 |
+
return (f"Your GPA information:\n"
|
| 509 |
+
f"- Weighted: {gpa.get('weighted', 'N/A')}\n"
|
| 510 |
+
f"- Unweighted: {gpa.get('unweighted', 'N/A')}")
|
| 511 |
+
|
| 512 |
elif any(word in message.lower() for word in study_help):
|
| 513 |
+
# Analyze course performance to give personalized advice
|
| 514 |
+
strong_subjects = [c['name'] for c in courses if 'grade' in c and c['grade'] in ['A', 'A+', 'B+']]
|
| 515 |
+
weak_subjects = [c['name'] for c in courses if 'grade' in c and c['grade'] in ['D', 'F']]
|
| 516 |
+
|
| 517 |
+
response = "Here are some personalized study tips:\n"
|
| 518 |
+
|
| 519 |
+
if strong_subjects:
|
| 520 |
+
response += f"\nYou're doing well in: {', '.join(strong_subjects[:3])}\n"
|
| 521 |
+
response += "→ Keep up the good work in these areas!\n"
|
| 522 |
+
|
| 523 |
+
if weak_subjects:
|
| 524 |
+
response += f"\nYou might want to focus more on: {', '.join(weak_subjects[:3])}\n"
|
| 525 |
+
response += "→ Consider getting extra help or tutoring\n"
|
| 526 |
+
|
| 527 |
+
# Add learning style specific tips
|
| 528 |
if "Visual" in learning_style:
|
| 529 |
+
response += "\nVisual Learner Tip: Try creating diagrams or mind maps\n"
|
|
|
|
|
|
|
|
|
|
| 530 |
elif "Auditory" in learning_style:
|
| 531 |
+
response += "\nAuditory Learner Tip: Record yourself explaining concepts\n"
|
|
|
|
|
|
|
|
|
|
| 532 |
elif "Reading/Writing" in learning_style:
|
| 533 |
+
response += "\nReading/Writing Tip: Write summaries in your own words\n"
|
|
|
|
|
|
|
|
|
|
| 534 |
elif "Kinesthetic" in learning_style:
|
| 535 |
+
response += "\nKinesthetic Tip: Use physical objects to demonstrate concepts\n"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 536 |
|
| 537 |
return response
|
| 538 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 539 |
elif any(word in message.lower() for word in course_help):
|
| 540 |
+
if not courses:
|
| 541 |
+
return "No course information available."
|
| 542 |
+
|
| 543 |
+
# Group by subject area
|
| 544 |
+
subjects = defaultdict(list)
|
| 545 |
+
for course in courses:
|
| 546 |
+
if 'name' in course:
|
| 547 |
+
# Extract first word as subject area
|
| 548 |
+
subject = course['name'].split()[0]
|
| 549 |
+
subjects[subject].append(course)
|
| 550 |
+
|
| 551 |
+
response = "Your course subjects:\n"
|
| 552 |
+
for subject, subject_courses in subjects.items():
|
| 553 |
+
response += f"\n{subject} ({len(subject_courses)} courses)"
|
| 554 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 555 |
return response
|
| 556 |
|
| 557 |
elif "help" in message.lower():
|
| 558 |
return ("I can help with:\n"
|
| 559 |
+
"- Your GPA information\n"
|
| 560 |
+
"- Personalized study tips\n"
|
| 561 |
+
"- Course information\n"
|
| 562 |
+
"- Learning style recommendations")
|
|
|
|
| 563 |
|
| 564 |
else:
|
| 565 |
return ("I'm your personalized teaching assistant. "
|
| 566 |
+
"Ask me about your GPA, courses, or study tips!")
|
|
|
|
| 567 |
|
| 568 |
# ========== GRADIO INTERFACE ==========
|
| 569 |
with gr.Blocks() as app:
|
| 570 |
with gr.Tab("Step 1: Upload Transcript"):
|
| 571 |
gr.Markdown("### Upload your transcript (PDF recommended)")
|
| 572 |
transcript_file = gr.File(label="Transcript file", file_types=[".pdf"])
|
| 573 |
+
transcript_output = gr.Textbox(label="Transcript Results", lines=5)
|
| 574 |
transcript_data = gr.State()
|
| 575 |
transcript_file.change(
|
| 576 |
fn=parse_transcript,
|
|
|
|
| 623 |
chatbot = gr.ChatInterface(
|
| 624 |
fn=generate_response,
|
| 625 |
examples=[
|
| 626 |
+
"What's my GPA?",
|
| 627 |
+
"How should I study for my classes?",
|
| 628 |
+
"What subjects am I taking?"
|
|
|
|
| 629 |
]
|
| 630 |
)
|
| 631 |
|
|
|
|
| 632 |
if __name__ == "__main__":
|
| 633 |
+
app.launch()
|
| 634 |
+
|