Spaces:

Dannyar608
/

Final_project

Running

App Files Files Community

Dannyar608 committed 9 days ago

Commit

b57ed91

verified ·

1 Parent(s): 0ecc813

Update app.py

Browse files

Files changed (1) hide show

app.py +72 -239

app.py CHANGED Viewed

@@ -3,6 +3,15 @@ import sys
 import subprocess
 import importlib
 from datetime import datetime
 required_packages = {
     'gradio': 'gradio>=3.0',
@@ -26,18 +35,6 @@ def check_and_install_packages():
 check_and_install_packages()
-# ========== MAIN IMPORTS ==========
-import gradio as gr
-import pandas as pd
-import json
-import os
-import re
-from PyPDF2 import PdfReader
-from collections import defaultdict
-from transformers import pipeline
-from typing import List, Dict, Union
-import pdfplumber
 # ========== TRANSCRIPT PARSING ==========
 class UniversalTranscriptParser:
     def __init__(self):
@@ -53,7 +50,6 @@ class UniversalTranscriptParser:
         }
     def parse_transcript(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
-        """Determine transcript type and parse accordingly"""
         transcript_type = self._identify_transcript_type(text)
         if transcript_type == 'homeschool':
@@ -64,7 +60,6 @@ class UniversalTranscriptParser:
             return self._parse_miami_dade(text)
     def _identify_transcript_type(self, text: str) -> str:
-        """Identify which type of transcript we're processing"""
         if re.search(r'Sample OFFICIAL HIGH SCHOOL TRANSCRIPT', text):
             return 'homeschool'
         elif re.search(r'DORAL ACADEMY HIGH SCHOOL', text):
@@ -72,27 +67,22 @@ class UniversalTranscriptParser:
         return 'miami_dade'
     def _parse_homeschool(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
-        """Parse homeschool transcript format"""
         courses = []
         current_grade = None
         current_year = None
-        # Extract student info
         student_info = {}
         name_match = re.search(r'Student Name:\s*(.+)\s*SSN:', text)
         if name_match:
             student_info['name'] = name_match.group(1).strip()
-        # Process each line
         for line in text.split('\n'):
-            # Check for grade level header
             grade_match = re.match(r'^\|?\s*(\d+th Grade)\s*\|.*(\d{4}-\d{4})', line)
             if grade_match:
                 current_grade = grade_match.group(1)
                 current_year = grade_match.group(2)
                 continue
-            # Course line pattern
             course_match = re.match(
                 r'^\|?\s*([^\|]+?)\s*\|\s*([A-Z][+*]?)\s*\|\s*([^\|]+)\s*\|\s*(\d+\.?\d*)\s*\|\s*(\d+)',
                 line
@@ -100,7 +90,6 @@ class UniversalTranscriptParser:
             if course_match and current_grade:
                 course_name = course_match.group(1).strip()
-                # Clean course names that start with | or have extra spaces
                 course_name = re.sub(r'^\|?\s*', '', course_name)
                 courses.append({
@@ -114,14 +103,7 @@ class UniversalTranscriptParser:
                     'transcript_type': 'homeschool'
                 })
-        # Extract GPA information from homeschool transcript
-        gpa_data = {}
-        gpa_match = re.search(r'Cum\. GPA\s*\|\s*([\d\.]+)', text)
-        if gpa_match:
-            gpa_value = gpa_match.group(1)
-            gpa_data['unweighted'] = gpa_value
-            gpa_data['weighted'] = gpa_value  # Homeschool often has same weighted/unweighted
         return {
             'student_info': student_info,
             'courses': {'All': courses},
@@ -130,25 +112,19 @@ class UniversalTranscriptParser:
         }
     def _parse_doral_academy(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
-        """Parse Doral Academy specific format"""
         courses = []
-        # Extract student info
         student_info = {}
         name_match = re.search(r'LEGAL NAME:\s*([^\n]+)', text)
         if name_match:
             student_info['name'] = name_match.group(1).strip()
-        # Extract school year information
         year_pattern = re.compile(r'YEAR:\s*(\d{4}-\d{4})\s*GRADE LEVEL:\s*(\d{2})', re.MULTILINE)
         year_matches = year_pattern.finditer(text)
-        # Create mapping of grade levels to years
         grade_year_map = {}
         for match in year_matches:
             grade_year_map[match.group(2)] = match.group(1)
-        # Course pattern for Doral Academy
         course_pattern = re.compile(
             r'(\d)\s+(\d{7})\s+([^\n]+?)\s+([A-Z]{2})\s+([A-Z])\s+([A-Z])\s+([A-Z])\s+(\d\.\d{2})\s+(\d\.\d{2})',
             re.MULTILINE
@@ -176,17 +152,7 @@ class UniversalTranscriptParser:
             courses_by_grade[grade_level_num].append(course_info)
-        # Extract GPA information from Doral Academy transcript
-        gpa_data = {}
-        unweighted_match = re.search(r'Un-weighted GPA\s*([\d\.]+)', text)
-        weighted_match = re.search(r'Weighted GPA\s*([\d\.]+)', text)
-        if unweighted_match:
-            gpa_data['unweighted'] = unweighted_match.group(1)
-        if weighted_match:
-            gpa_data['weighted'] = weighted_match.group(1)
-        # Extract current grade level
         grade_level = "12" if re.search(r'GRADE LEVEL:\s*12', text) else "Unknown"
         return {
@@ -197,17 +163,14 @@ class UniversalTranscriptParser:
         }
     def _parse_miami_dade(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
-        """Parse standard Miami-Dade format"""
         courses = []
         courses_by_grade = defaultdict(list)
-        # Extract student info
         student_info = {}
         name_match = re.search(r'0783977 - ([^,]+),\s*([^\n]+)', text)
         if name_match:
             student_info['name'] = f"{name_match.group(2)} {name_match.group(1)}"
-        # Course pattern for Miami-Dade
         course_pattern = re.compile(
             r'([A-Z]-[A-Za-z\s&]+)\s*\|\s*(\d{4}-\d{4})\s*\|\s*(\d{2})\s*\|\s*([A-Z0-9]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([A-Z]?)\s*\|\s*([A-Z]?)\s*\|\s*([^\|]+)',
             re.MULTILINE
@@ -233,13 +196,7 @@ class UniversalTranscriptParser:
             courses_by_grade[match.group(3)].append(course_info)
-        # Extract GPA information
-        gpa_data = {
-            'weighted': self._extract_gpa(text, 'Weighted GPA'),
-            'unweighted': self._extract_gpa(text, 'Un-weighted GPA')
-        }
-        # Extract current grade level
         grade_level = re.search(r'Current Grade:\s*(\d+)', text).group(1) if re.search(r'Current Grade:\s*(\d+)', text) else "Unknown"
         return {
@@ -249,38 +206,50 @@ class UniversalTranscriptParser:
             'grade_level': grade_level
         }
-    def _extract_gpa(self, text: str, gpa_type: str) -> str:
-        """Helper method to extract GPA values"""
-        pattern = rf'{gpa_type}\s*([\d\.]+)'
-        match = re.search(pattern, text)
-        return match.group(1) if match else "Not Available"
-    def _compile_miami_dade_patterns(self):
-        return {
-            'student': re.compile(r'Current Grade:\s*(\d+).*YOG\s*(\d{4})'),
-            'course': re.compile(
-                r'([A-Z]-[A-Za-z\s&]+)\s*\|\s*(\d{4}-\d{4})\s*\|\s*(\d{2})\s*\|\s*([A-Z0-9]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([A-Z]?)\s*\|\s*([A-Z]?)\s*\|\s*([^\|]+)',
-                re.MULTILINE
-            )
-        }
-    def _compile_homeschool_patterns(self):
-        return {
-            'student': re.compile(r'Student Name:\s*(.+)\s*SSN:'),
-            'course': re.compile(
-                r'^\|?\s*([^\|]+?)\s*\|\s*([A-Z][+*]?)\s*\|\s*([^\|]+)\s*\|\s*(\d+\.?\d*)\s*\|\s*(\d+)'
-            )
-        }
-    def _compile_doral_academy_patterns(self):
-        return {
-            'student': re.compile(r'LEGAL NAME:\s*([^\n]+)'),
-            'course': re.compile(
-                r'(\d)\s+(\d{7})\s+([^\n]+?)\s+([A-Z]{2})\s+([A-Z])\s+([A-Z])\s+([A-Z])\s+(\d\.\d{2})\s+(\d\.\d{2})',
-                re.MULTILINE
-            )
-        }
 def parse_transcript(file):
     parser = UniversalTranscriptParser()
@@ -292,15 +261,19 @@ def parse_transcript(file):
         parsed_data = parser.parse_transcript(text)
-        # Create clear GPA output
         gpa_data = parsed_data.get('gpa', {})
-        weighted_gpa = gpa_data.get('weighted', 'Not Available')
-        unweighted_gpa = gpa_data.get('unweighted', 'Not Available')
-        output_text = "Transcript Processed Successfully!\n\n"
-        output_text += "GPA Information:\n"
-        output_text += f"- Weighted GPA: {weighted_gpa}\n"
-        output_text += f"- Unweighted GPA: {unweighted_gpa}\n"
         return output_text, parsed_data
     else:
@@ -309,48 +282,12 @@ def parse_transcript(file):
 # ========== LEARNING STYLE QUIZ ==========
 learning_style_questions = [
     "When you study for a test, you prefer to:",
-    "When you need directions to a new place, you prefer:",
-    "When you learn a new skill, you prefer to:",
-    "When you're trying to concentrate, you:",
-    "When you meet new people, you remember them by:",
-    "When you're assembling furniture or a gadget, you:",
-    "When choosing a restaurant, you rely most on:",
-    "When you're in a waiting room, you typically:",
-    "When giving someone instructions, you tend to:",
-    "When you're trying to recall information, you:",
-    "When you're at a museum or exhibit, you:",
-    "When you're learning a new language, you prefer:",
-    "When you're taking notes in class, you:",
-    "When you're explaining something complex, you:",
-    "When you're at a party, you enjoy:",
-    "When you're trying to remember a phone number, you:",
-    "When you're relaxing, you prefer to:",
-    "When you're learning to use new software, you:",
-    "When you're giving a presentation, you rely on:",
-    "When you're solving a difficult problem, you:"
 ]
 learning_style_options = [
     ["Read the textbook (Reading/Writing)", "Listen to lectures (Auditory)", "Use diagrams/charts (Visual)", "Practice problems (Kinesthetic)"],
-    ["Look at a map (Visual)", "Have someone tell you (Auditory)", "Write down directions (Reading/Writing)", "Try walking/driving there (Kinesthetic)"],
-    ["Read instructions (Reading/Writing)", "Have someone show you (Visual)", "Listen to explanations (Auditory)", "Try it yourself (Kinesthetic)"],
-    ["Need quiet (Reading/Writing)", "Need background noise (Auditory)", "Need to move around (Kinesthetic)", "Need visual stimulation (Visual)"],
-    ["Their face (Visual)", "Their name (Auditory)", "What you talked about (Reading/Writing)", "What you did together (Kinesthetic)"],
-    ["Read the instructions carefully (Reading/Writing)", "Look at the diagrams (Visual)", "Ask someone to explain (Auditory)", "Start putting pieces together (Kinesthetic)"],
-    ["Online photos of the food (Visual)", "Recommendations from friends (Auditory)", "Reading the menu online (Reading/Writing)", "Remembering how it felt to eat there (Kinesthetic)"],
-    ["Read magazines (Reading/Writing)", "Listen to music (Auditory)", "Watch TV (Visual)", "Fidget or move around (Kinesthetic)"],
-    ["Write them down (Reading/Writing)", "Explain verbally (Auditory)", "Demonstrate (Visual)", "Guide them physically (Kinesthetic)"],
-    ["See written words in your mind (Visual)", "Hear the information in your head (Auditory)", "Write it down to remember (Reading/Writing)", "Associate it with physical actions (Kinesthetic)"],
-    ["Read all the descriptions (Reading/Writing)", "Listen to audio guides (Auditory)", "Look at the displays (Visual)", "Touch interactive exhibits (Kinesthetic)"],
-    ["Study grammar rules (Reading/Writing)", "Listen to native speakers (Auditory)", "Use flashcards with images (Visual)", "Practice conversations (Kinesthetic)"],
-    ["Write detailed paragraphs (Reading/Writing)", "Record the lecture (Auditory)", "Draw diagrams and charts (Visual)", "Doodle while listening (Kinesthetic)"],
-    ["Write detailed steps (Reading/Writing)", "Explain verbally with examples (Auditory)", "Draw diagrams (Visual)", "Use physical objects to demonstrate (Kinesthetic)"],
-    ["Conversations with people (Auditory)", "Watching others or the environment (Visual)", "Writing notes or texting (Reading/Writing)", "Dancing or physical activities (Kinesthetic)"],
-    ["See the numbers in your mind (Visual)", "Say them aloud (Auditory)", "Write them down (Reading/Writing)", "Dial them on a keypad (Kinesthetic)"],
-    ["Read a book (Reading/Writing)", "Listen to music (Auditory)", "Watch TV/movies (Visual)", "Do something physical (Kinesthetic)"],
-    ["Read the manual (Reading/Writing)", "Ask someone to show you (Visual)", "Call tech support (Auditory)", "Experiment with the software (Kinesthetic)"],
-    ["Detailed notes (Reading/Writing)", "Verbal explanations (Auditory)", "Visual slides (Visual)", "Physical demonstrations (Kinesthetic)"],
-    ["Write out possible solutions (Reading/Writing)", "Talk through it with someone (Auditory)", "Draw diagrams (Visual)", "Build a model or prototype (Kinesthetic)"]
 ]
 def learning_style_quiz(*answers):
@@ -374,48 +311,19 @@ def learning_style_quiz(*answers):
     max_score = max(scores.values())
     total_questions = len(learning_style_questions)
-    # Calculate percentages
     percentages = {style: (score/total_questions)*100 for style, score in scores.items()}
-    # Sort styles by score (descending)
     sorted_styles = sorted(scores.items(), key=lambda x: x[1], reverse=True)
-    # Prepare detailed results
     result = "Your Learning Style Results:\n\n"
     for style, score in sorted_styles:
         result += f"{style}: {score}/{total_questions} ({percentages[style]:.1f}%)\n"
     result += "\n"
-    # Determine primary and secondary styles
     primary_styles = [style for style, score in scores.items() if score == max_score]
     if len(primary_styles) == 1:
         result += f"Your primary learning style is: {primary_styles[0]}\n\n"
-        if primary_styles[0] == "Visual":
-            result += "Tips for Visual Learners:\n"
-            result += "- Use color coding in your notes\n"
-            result += "- Create mind maps and diagrams\n"
-            result += "- Watch educational videos\n"
-            result += "- Use flashcards with images\n"
-        elif primary_styles[0] == "Auditory":
-            result += "Tips for Auditory Learners:\n"
-            result += "- Record lectures and listen to them\n"
-            result += "- Participate in study groups\n"
-            result += "- Explain concepts out loud to yourself\n"
-            result += "- Use rhymes or songs to remember information\n"
-        elif primary_styles[0] == "Reading/Writing":
-            result += "Tips for Reading/Writing Learners:\n"
-            result += "- Write detailed notes\n"
-            result += "- Create summaries in your own words\n"
-            result += "- Read textbooks and articles\n"
-            result += "- Make lists to organize information\n"
-        else:  # Kinesthetic
-            result += "Tips for Kinesthetic Learners:\n"
-            result += "- Use hands-on activities\n"
-            result += "- Take frequent movement breaks\n"
-            result += "- Create physical models\n"
-            result += "- Associate information with physical actions\n"
     else:
         result += f"You have multiple strong learning styles: {', '.join(primary_styles)}\n\n"
         result += "You may benefit from combining different learning approaches.\n"
@@ -426,7 +334,6 @@ def learning_style_quiz(*answers):
 def save_profile(name, age, interests, transcript, learning_style,
                 movie, movie_reason, show, show_reason,
                 book, book_reason, character, character_reason, blog):
-    # Convert age to int if it's a numpy number (from gradio Number input)
     age = int(age) if age else 0
     favorites = {
@@ -455,7 +362,6 @@ def save_profile(name, age, interests, transcript, learning_style,
     with open(json_path, "w") as f:
         json.dump(data, f, indent=2)
-    # Create profile summary with clear GPA display
     gpa = transcript.get('gpa', {})
     markdown_summary = f"""### Student Profile: {name}
 **Age:** {age}
@@ -492,30 +398,11 @@ def generate_response(message, history):
     if not profile:
         return "Please complete and save your profile first using the previous tabs."
-    # Get profile data
-    learning_style = profile.get("learning_style", "")
     transcript = profile.get("transcript", {})
     gpa = transcript.get("gpa", {})
-    courses = []
-    # Flatten all courses from all grades
-    if 'courses' in transcript:
-        if isinstance(transcript['courses'], dict):
-            for grade_courses in transcript['courses'].values():
-                courses.extend(grade_courses)
-        elif isinstance(transcript['courses'], list):
-            courses = transcript['courses']
-    # Common responses
-    greetings = ["hi", "hello", "hey"]
-    study_help = ["study", "learn", "prepare", "exam"]
-    grade_help = ["gpa", "grade", "weighted", "unweighted", "grades"]
-    course_help = ["courses", "classes", "subjects"]
-    if any(greet in message.lower() for greet in greetings):
-        return f"Hello {profile.get('name', 'there')}! How can I help you today?"
-    elif any(word in message.lower() for word in grade_help):
         response = "Your GPA Information:\n"
         response += f"- Weighted GPA: {gpa.get('weighted', 'Not Available')}\n"
         response += f"- Unweighted GPA: {gpa.get('unweighted', 'Not Available')}\n"
@@ -533,61 +420,7 @@ def generate_response(message, history):
         return response
-    elif any(word in message.lower() for word in study_help):
-        # Analyze course performance to give personalized advice
-        strong_subjects = [c['name'] for c in courses if 'grade' in c and c['grade'] in ['A', 'A+', 'B+']]
-        weak_subjects = [c['name'] for c in courses if 'grade' in c and c['grade'] in ['D', 'F']]
-        response = "Here are some personalized study tips:\n"
-        if strong_subjects:
-            response += f"\nYou're doing well in: {', '.join(strong_subjects[:3])}\n"
-            response += "→ Keep up the good work in these areas!\n"
-        if weak_subjects:
-            response += f"\nYou might want to focus more on: {', '.join(weak_subjects[:3])}\n"
-            response += "→ Consider getting extra help or tutoring\n"
-        # Add learning style specific tips
-        if "Visual" in learning_style:
-            response += "\nVisual Learner Tip: Try creating diagrams or mind maps\n"
-        elif "Auditory" in learning_style:
-            response += "\nAuditory Learner Tip: Record yourself explaining concepts\n"
-        elif "Reading/Writing" in learning_style:
-            response += "\nReading/Writing Tip: Write summaries in your own words\n"
-        elif "Kinesthetic" in learning_style:
-            response += "\nKinesthetic Tip: Use physical objects to demonstrate concepts\n"
-        return response
-    elif any(word in message.lower() for word in course_help):
-        if not courses:
-            return "No course information available."
-        # Group by subject area
-        subjects = defaultdict(list)
-        for course in courses:
-            if 'name' in course:
-                # Extract first word as subject area
-                subject = course['name'].split()[0]
-                subjects[subject].append(course)
-        response = "Your course subjects:\n"
-        for subject, subject_courses in subjects.items():
-            response += f"\n{subject} ({len(subject_courses)} courses)"
-        return response
-    elif "help" in message.lower():
-        return ("I can help with:\n"
-               "- Your GPA information\n"
-               "- Personalized study tips\n"
-               "- Course information\n"
-               "- Learning style recommendations")
-    else:
-        return ("I'm your personalized teaching assistant. "
-               "Ask me about your GPA, courses, or study tips!")
 # ========== GRADIO INTERFACE ==========
 with gr.Blocks() as app:

 import subprocess
 import importlib
 from datetime import datetime
+import re
+import os
+import json
+import pdfplumber
+from collections import defaultdict
+from typing import List, Dict, Union
+import gradio as gr
+from PyPDF2 import PdfReader
+from transformers import pipeline
 required_packages = {
     'gradio': 'gradio>=3.0',
 check_and_install_packages()
 # ========== TRANSCRIPT PARSING ==========
 class UniversalTranscriptParser:
     def __init__(self):
         }
     def parse_transcript(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
         transcript_type = self._identify_transcript_type(text)
         if transcript_type == 'homeschool':
             return self._parse_miami_dade(text)
     def _identify_transcript_type(self, text: str) -> str:
         if re.search(r'Sample OFFICIAL HIGH SCHOOL TRANSCRIPT', text):
             return 'homeschool'
         elif re.search(r'DORAL ACADEMY HIGH SCHOOL', text):
         return 'miami_dade'
     def _parse_homeschool(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
         courses = []
         current_grade = None
         current_year = None
         student_info = {}
         name_match = re.search(r'Student Name:\s*(.+)\s*SSN:', text)
         if name_match:
             student_info['name'] = name_match.group(1).strip()
         for line in text.split('\n'):
             grade_match = re.match(r'^\|?\s*(\d+th Grade)\s*\|.*(\d{4}-\d{4})', line)
             if grade_match:
                 current_grade = grade_match.group(1)
                 current_year = grade_match.group(2)
                 continue
             course_match = re.match(
                 r'^\|?\s*([^\|]+?)\s*\|\s*([A-Z][+*]?)\s*\|\s*([^\|]+)\s*\|\s*(\d+\.?\d*)\s*\|\s*(\d+)',
                 line
             if course_match and current_grade:
                 course_name = course_match.group(1).strip()
                 course_name = re.sub(r'^\|?\s*', '', course_name)
                 courses.append({
                     'transcript_type': 'homeschool'
                 })
+        gpa_data = self._extract_gpa_data(text)
         return {
             'student_info': student_info,
             'courses': {'All': courses},
         }
     def _parse_doral_academy(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
         courses = []
         student_info = {}
         name_match = re.search(r'LEGAL NAME:\s*([^\n]+)', text)
         if name_match:
             student_info['name'] = name_match.group(1).strip()
         year_pattern = re.compile(r'YEAR:\s*(\d{4}-\d{4})\s*GRADE LEVEL:\s*(\d{2})', re.MULTILINE)
         year_matches = year_pattern.finditer(text)
         grade_year_map = {}
         for match in year_matches:
             grade_year_map[match.group(2)] = match.group(1)
         course_pattern = re.compile(
             r'(\d)\s+(\d{7})\s+([^\n]+?)\s+([A-Z]{2})\s+([A-Z])\s+([A-Z])\s+([A-Z])\s+(\d\.\d{2})\s+(\d\.\d{2})',
             re.MULTILINE
             courses_by_grade[grade_level_num].append(course_info)
+        gpa_data = self._extract_gpa_data(text)
         grade_level = "12" if re.search(r'GRADE LEVEL:\s*12', text) else "Unknown"
         return {
         }
     def _parse_miami_dade(self, text: str) -> Dict[str, Union[Dict, List[Dict]]]:
         courses = []
         courses_by_grade = defaultdict(list)
         student_info = {}
         name_match = re.search(r'0783977 - ([^,]+),\s*([^\n]+)', text)
         if name_match:
             student_info['name'] = f"{name_match.group(2)} {name_match.group(1)}"
         course_pattern = re.compile(
             r'([A-Z]-[A-Za-z\s&]+)\s*\|\s*(\d{4}-\d{4})\s*\|\s*(\d{2})\s*\|\s*([A-Z0-9]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([^\|]+)\s*\|\s*([A-Z]?)\s*\|\s*([A-Z]?)\s*\|\s*([^\|]+)',
             re.MULTILINE
             courses_by_grade[match.group(3)].append(course_info)
+        gpa_data = self._extract_gpa_data(text)
         grade_level = re.search(r'Current Grade:\s*(\d+)', text).group(1) if re.search(r'Current Grade:\s*(\d+)', text) else "Unknown"
         return {
             'grade_level': grade_level
         }
+    def _extract_gpa_data(self, text: str) -> Dict[str, str]:
+        """Improved GPA extraction with multiple pattern matching"""
+        gpa_data = {}
+        # Weighted GPA patterns
+        weighted_patterns = [
+            r'Weighted GPA\s*:\s*([\d\.]+)',
+            r'Weighted GPA\s*([\d\.]+)',
+            r'GPA WTD\s*:\s*([\d\.]+)',
+            r'Weighted\s*:\s*([\d\.]+)'
+        ]
+        # Unweighted GPA patterns
+        unweighted_patterns = [
+            r'Un-weighted GPA\s*:\s*([\d\.]+)',
+            r'Unweighted GPA\s*([\d\.]+)',
+            r'GPA UNWTD\s*:\s*([\d\.]+)',
+            r'Unweighted\s*:\s*([\d\.]+)'
+        ]
+        # Try all weighted patterns
+        for pattern in weighted_patterns:
+            match = re.search(pattern, text, re.IGNORECASE)
+            if match:
+                gpa_data['weighted'] = match.group(1)
+                break
+        # Try all unweighted patterns
+        for pattern in unweighted_patterns:
+            match = re.search(pattern, text, re.IGNORECASE)
+            if match:
+                gpa_data['unweighted'] = match.group(1)
+                break
+        # Fallback to cumulative GPA if not found
+        if not gpa_data:
+            cumulative_match = re.search(r'Cumulative GPA\s*:\s*([\d\.]+)', text, re.IGNORECASE)
+            if cumulative_match:
+                gpa_data['weighted'] = cumulative_match.group(1)
+                gpa_data['unweighted'] = cumulative_match.group(1)
+        return gpa_data
+# ========== TRANSCRIPT PROCESSING ==========
 def parse_transcript(file):
     parser = UniversalTranscriptParser()
         parsed_data = parser.parse_transcript(text)
+        # Enhanced GPA display
         gpa_data = parsed_data.get('gpa', {})
+        weighted_gpa = gpa_data.get('weighted', 'Not Found (Please check transcript)')
+        unweighted_gpa = gpa_data.get('unweighted', 'Not Found (Please check transcript)')
+        output_text = "=== TRANSCRIPT ANALYSIS RESULTS ===\n\n"
+        output_text += "GPA INFORMATION:\n"
+        output_text += f"🔹 Weighted GPA: {weighted_gpa}\n"
+        output_text += f"🔹 Unweighted GPA: {unweighted_gpa}\n\n"
+        if 'Not Found' in weighted_gpa or 'Not Found' in unweighted_gpa:
+            output_text += "NOTE: Could not automatically locate GPA information.\n"
+            output_text += "Please check your transcript for GPA details and enter them manually if needed.\n"
         return output_text, parsed_data
     else:
 # ========== LEARNING STYLE QUIZ ==========
 learning_style_questions = [
     "When you study for a test, you prefer to:",
+    # ... [rest of your questions] ...
 ]
 learning_style_options = [
     ["Read the textbook (Reading/Writing)", "Listen to lectures (Auditory)", "Use diagrams/charts (Visual)", "Practice problems (Kinesthetic)"],
+    # ... [rest of your options] ...
 ]
 def learning_style_quiz(*answers):
     max_score = max(scores.values())
     total_questions = len(learning_style_questions)
     percentages = {style: (score/total_questions)*100 for style, score in scores.items()}
     sorted_styles = sorted(scores.items(), key=lambda x: x[1], reverse=True)
     result = "Your Learning Style Results:\n\n"
     for style, score in sorted_styles:
         result += f"{style}: {score}/{total_questions} ({percentages[style]:.1f}%)\n"
     result += "\n"
     primary_styles = [style for style, score in scores.items() if score == max_score]
     if len(primary_styles) == 1:
         result += f"Your primary learning style is: {primary_styles[0]}\n\n"
+        # ... [rest of your learning style tips] ...
     else:
         result += f"You have multiple strong learning styles: {', '.join(primary_styles)}\n\n"
         result += "You may benefit from combining different learning approaches.\n"
 def save_profile(name, age, interests, transcript, learning_style,
                 movie, movie_reason, show, show_reason,
                 book, book_reason, character, character_reason, blog):
     age = int(age) if age else 0
     favorites = {
     with open(json_path, "w") as f:
         json.dump(data, f, indent=2)
     gpa = transcript.get('gpa', {})
     markdown_summary = f"""### Student Profile: {name}
 **Age:** {age}
     if not profile:
         return "Please complete and save your profile first using the previous tabs."
     transcript = profile.get("transcript", {})
     gpa = transcript.get("gpa", {})
+    # When user asks about GPA
+    if any(word in message.lower() for word in ["gpa", "grade", "weighted", "unweighted"]):
         response = "Your GPA Information:\n"
         response += f"- Weighted GPA: {gpa.get('weighted', 'Not Available')}\n"
         response += f"- Unweighted GPA: {gpa.get('unweighted', 'Not Available')}\n"
         return response
+    # ... [rest of your AI assistant logic] ...
 # ========== GRADIO INTERFACE ==========
 with gr.Blocks() as app: