Spaces:
Runtime error
Runtime error
import gradio as gr | |
import pandas as pd | |
import json | |
import os | |
import re | |
from PyPDF2 import PdfReader | |
from collections import defaultdict | |
# ========== TRANSCRIPT PARSING FUNCTIONS ========== | |
def extract_courses_with_grade_levels(text):
    """Group the course entries found in transcript text by grade level.

    A course is either a code such as ``ENG 101`` or a run of capitalised
    words such as ``World History``, found at the start of a line and
    optionally followed by a letter grade (``A``, ``B+``) or a percentage
    (``95%``).  A ``Grade 10`` / ``Year: Junior`` marker directly in front of
    a course switches the grade level used for that course and for the
    courses after it.

    Args:
        text: Plain text of the transcript.

    Returns:
        A dict mapping grade level (str) to a list of
        ``{"course": name}`` dicts, each with an extra ``"grade"`` key when a
        grade was found.  Courses seen before any marker are filed under the
        first grade level mentioned anywhere in the text, or ``"Unknown"``.
        Empty or missing text yields ``{}``.
    """
    if not text:
        return {}

    # The first marker anywhere in the text is the default bucket.
    first_marker = re.search(
        r"(Grade|Year)\s*[:]?\s*(\d+|Freshman|Sophomore|Junior|Senior)",
        text,
        re.IGNORECASE,
    )
    current_grade = first_marker.group(2) if first_marker else "Unknown"

    # Inside the course name and between the name and its grade only spaces
    # and tabs are allowed (not \s), so an entry can never swallow the next
    # line.  The letter grade must not be followed by another letter, so the
    # first letter of a following word is not mistaken for a grade.
    course_pattern = r"""
        (?:^|\n)
        (?: (Grade|Year)\s*[:]?\s*(\d+|Freshman|Sophomore|Junior|Senior)\s*[\n-]* )?
        (
            (?:[A-Z]{2,}[ \t]?\d{3})
            |
            [A-Z][a-z]+(?:[ \t][A-Z][a-z]+)*
        )
        [ \t]*
        (?: [:\-]?[ \t]* ([A-F][+-]?(?![A-Za-z])|\d{2,3}%)? )?
    """

    courses_by_grade = defaultdict(list)
    for match in re.finditer(course_pattern, text, re.VERBOSE | re.MULTILINE):
        grade_context, grade_level, course, grade = match.groups()
        if grade_context:
            current_grade = grade_level
        if course:
            course_info = {"course": course.strip()}
            if grade:
                course_info["grade"] = grade.strip()
            courses_by_grade[current_grade].append(course_info)
    return dict(courses_by_grade)
def _extract_gpa(text):
    """Return ``{"weighted": ..., "unweighted": ...}`` parsed from transcript text."""
    gpa_data = {"weighted": "N/A", "unweighted": "N/A"}
    value = r"[\s:]*(\d\.\d{1,2})"
    # Each label is tagged with the GPA kind it reports.  The leading \b keeps
    # "Weighted GPA" from matching inside "Unweighted GPA".
    labelled_patterns = (
        ("weighted", r"\bWeighted GPA"),
        ("weighted", r"\bGPA \(Weighted\)"),
        ("weighted", r"\bCumulative GPA \(Weighted\)"),
        ("unweighted", r"\bUnweighted GPA"),
        ("unweighted", r"\bGPA \(Unweighted\)"),
        ("unweighted", r"\bCumulative GPA \(Unweighted\)"),
    )
    for kind, label in labelled_patterns:
        for match in re.finditer(label + value, text, re.IGNORECASE):
            gpa_data[kind] = match.group(1)

    # A bare "GPA: 3.5" fills whichever kind is still missing.  The lookbehind
    # skips values that already carry a weighted/unweighted label.
    generic = re.search(r"(?<!weighted\s)\bGPA" + value, text, re.IGNORECASE)
    if generic:
        for kind in ("unweighted", "weighted"):
            if gpa_data[kind] == "N/A":
                gpa_data[kind] = generic.group(1)
    return gpa_data


def _summarize_pdf_text(text):
    """Build the (summary text, data dict) pair for text extracted from a PDF."""
    grade_match = re.search(
        r'(Grade|Year)[\s:]*(\d+|Freshman|Sophomore|Junior|Senior)',
        text,
        re.IGNORECASE,
    )
    grade_level = grade_match.group(2) if grade_match else "Unknown"
    gpa_data = _extract_gpa(text)
    courses_by_grade = extract_courses_with_grade_levels(text)

    parts = [f"Grade Level: {grade_level}\n\n"]
    if gpa_data['weighted'] != "N/A" or gpa_data['unweighted'] != "N/A":
        parts.append("GPA Information:\n")
        if gpa_data['unweighted'] != "N/A":
            parts.append(f"- Unweighted GPA: {gpa_data['unweighted']}\n")
        if gpa_data['weighted'] != "N/A":
            parts.append(f"- Weighted GPA: {gpa_data['weighted']}\n")
    else:
        parts.append("No GPA information found\n")
    parts.append("\n(Courses not shown here)")

    return "".join(parts), {
        "gpa": gpa_data,
        "grade_level": grade_level,
        "courses": courses_by_grade,
    }


def _first_cell_value(df, candidates):
    """Return row 0 of the first candidate column present, as a plain Python value.

    Returns None when no candidate column exists, the table has no rows, or
    the cell is NaN.
    """
    for col in candidates:
        if col in df.columns:
            if df.empty:
                return None
            value = df[col].iloc[0]
            # numpy scalars (e.g. int64) are not JSON serialisable and are not
            # instances of int; .item() converts them to native Python values.
            if hasattr(value, "item"):
                value = value.item()
            if isinstance(value, float) and value != value:  # NaN
                return None
            return value
    return None


def _summarize_table(df):
    """Build the (summary text, data dict) pair for a CSV/XLSX transcript."""
    gpa = _first_cell_value(df, ('GPA', 'Grade Point Average', 'Cumulative GPA'))
    if isinstance(gpa, bool) or not isinstance(gpa, (float, int)):
        gpa = "N/A"

    grade_level = _first_cell_value(df, ('Grade Level', 'Grade', 'Class', 'Year'))
    if grade_level is None:
        grade_level = "N/A"

    courses = []
    for col in ('Course', 'Subject', 'Course Name', 'Class'):
        if col in df.columns:
            # Blank cells would otherwise show up as "nan" courses.
            courses = df[col].dropna().tolist()
            break

    output_text = f"Grade Level: {grade_level}\nGPA: {gpa}\n\nCourses:\n"
    output_text += "\n".join(f"- {course}" for course in courses)
    return output_text, {
        "gpa": {"unweighted": gpa, "weighted": "N/A"},
        "grade_level": grade_level,
        "courses": courses,
    }


def parse_transcript(file):
    """Parse an uploaded transcript and summarise grade level, GPA and courses.

    Args:
        file: The uploaded file; either an object with a ``name`` attribute
            or a path string.  ``None`` (no file) is accepted.  The value is
            handed unchanged to ``pd.read_csv`` / ``pd.read_excel`` /
            ``PdfReader``; only its name is used to pick the parser.

    Returns:
        ``(summary_text, data)``.  ``data`` is a dict with keys ``"gpa"``
        (``{"weighted", "unweighted"}``), ``"grade_level"`` and ``"courses"``:
        a list for CSV/XLSX input, a grade-level -> course-list dict for
        PDFs.  ``data`` is ``None`` when there is no file or the extension is
        not .csv, .xlsx or .pdf (matched case-insensitively).
    """
    if file is None:
        return "No transcript uploaded.", None

    filename = getattr(file, "name", None) or str(file)
    extension = os.path.splitext(filename)[1].lower()

    if extension == '.csv':
        return _summarize_table(pd.read_csv(file))
    if extension == '.xlsx':
        return _summarize_table(pd.read_excel(file))
    if extension == '.pdf':
        reader = PdfReader(file)
        page_texts = (page.extract_text() for page in reader.pages)
        # Pages without extractable text yield an empty value; skip them.
        text = "".join(f"{page_text}\n" for page_text in page_texts if page_text)
        return _summarize_pdf_text(text)
    return "Unsupported file format", None
# ========== LEARNING STYLE QUIZ ========== | |
# Quiz content: each entry pairs a prompt with its four answer choices.
# Every choice ends with the learning style it stands for in parentheses;
# the position of a given style varies from question to question.
_learning_style_quiz_items = [
    (
        "When you study for a test, you prefer to:",
        ["Read the textbook (Reading/Writing)", "Listen to lectures (Auditory)", "Use diagrams/charts (Visual)", "Practice problems (Kinesthetic)"],
    ),
    (
        "When you need directions to a new place, you prefer:",
        ["Look at a map (Visual)", "Have someone tell you (Auditory)", "Write down directions (Reading/Writing)", "Try walking/driving there (Kinesthetic)"],
    ),
    (
        "When you learn a new skill, you prefer to:",
        ["Read instructions (Reading/Writing)", "Have someone show you (Visual)", "Listen to explanations (Auditory)", "Try it yourself (Kinesthetic)"],
    ),
    (
        "When you're trying to concentrate, you:",
        ["Need quiet (Reading/Writing)", "Need background noise (Auditory)", "Need to move around (Kinesthetic)", "Need visual stimulation (Visual)"],
    ),
    (
        "When you meet new people, you remember them by:",
        ["Their face (Visual)", "Their name (Auditory)", "What you talked about (Reading/Writing)", "What you did together (Kinesthetic)"],
    ),
    (
        "When you're relaxing, you prefer to:",
        ["Read (Reading/Writing)", "Listen to music (Auditory)", "Watch TV (Visual)", "Do something active (Kinesthetic)"],
    ),
    (
        "When you're explaining something to someone, you:",
        ["Write it down (Reading/Writing)", "Tell them verbally (Auditory)", "Show them (Visual)", "Demonstrate physically (Kinesthetic)"],
    ),
    (
        "When you're trying to remember something, you:",
        ["See it written down (Visual)", "Say it out loud (Auditory)", "Write it down (Reading/Writing)", "Do it physically (Kinesthetic)"],
    ),
    (
        "When you're in a classroom, you learn best when:",
        ["Reading materials (Reading/Writing)", "Listening to lectures (Auditory)", "Seeing diagrams (Visual)", "Doing hands-on activities (Kinesthetic)"],
    ),
    (
        "When you're trying to solve a problem, you:",
        ["Write down steps (Reading/Writing)", "Talk through it (Auditory)", "Draw diagrams (Visual)", "Try different approaches (Kinesthetic)"],
    ),
    (
        "When you're taking notes, you:",
        ["Write detailed notes (Reading/Writing)", "Record lectures (Auditory)", "Draw mind maps (Visual)", "Take minimal notes (Kinesthetic)"],
    ),
    (
        "When you're learning new software, you prefer to:",
        ["Read the manual (Reading/Writing)", "Have someone explain it (Auditory)", "Watch tutorial videos (Visual)", "Just start using it (Kinesthetic)"],
    ),
    (
        "When you're at a museum, you spend the most time:",
        ["Reading descriptions (Reading/Writing)", "Listening to audio guides (Auditory)", "Looking at exhibits (Visual)", "Interactive displays (Kinesthetic)"],
    ),
    (
        "When you're assembling furniture, you:",
        ["Read instructions first (Reading/Writing)", "Ask someone to help (Auditory)", "Look at diagrams (Visual)", "Start assembling (Kinesthetic)"],
    ),
    (
        "When you're learning new vocabulary, you:",
        ["Write them repeatedly (Reading/Writing)", "Say them repeatedly (Auditory)", "Use flashcards (Visual)", "Use them in conversation (Kinesthetic)"],
    ),
    (
        "When you're giving a presentation, you prefer:",
        ["Having detailed notes (Reading/Writing)", "Speaking freely (Auditory)", "Using visual aids (Visual)", "Demonstrating something (Kinesthetic)"],
    ),
    (
        "When you're at a party, you enjoy:",
        ["Conversations (Auditory)", "People-watching (Visual)", "Dancing/games (Kinesthetic)", "Reading about people (Reading/Writing)"],
    ),
    (
        "When you're taking a break from studying, you:",
        ["Read for fun (Reading/Writing)", "Listen to music (Auditory)", "Watch videos (Visual)", "Exercise (Kinesthetic)"],
    ),
    (
        "When you're learning dance moves, you:",
        ["Watch demonstrations (Visual)", "Listen to instructions (Auditory)", "Read choreography (Reading/Writing)", "Try the moves (Kinesthetic)"],
    ),
    (
        "When you're choosing a book, you prefer:",
        ["Text-heavy books (Reading/Writing)", "Audiobooks (Auditory)", "Books with pictures (Visual)", "Interactive books (Kinesthetic)"],
    ),
]

# Parallel lists: learning_style_options[i] holds the choices for
# learning_style_questions[i].
learning_style_questions = [prompt for prompt, _ in _learning_style_quiz_items]
learning_style_options = [choices for _, choices in _learning_style_quiz_items]
def learning_style_quiz(*answers):
    """Score the quiz answers and describe the dominant learning style(s).

    Each answer is credited to the style named in the parentheses at the end
    of its text, e.g. ``"Look at a map (Visual)"`` counts towards Visual.
    Scoring by label rather than by the option's position matters because the
    options are not listed in the same style order for every question.

    Args:
        *answers: One selected option string per question.  ``None`` or empty
            values (unanswered questions) and strings without a known style
            label are ignored.

    Returns:
        A text report: a headline naming the top style (or the tied styles),
        followed by one ``Style: score/total`` line per style, highest first,
        where ``total`` is the number of answers passed in.  If nothing could
        be scored, a short prompt to answer at least one question is returned
        instead.
    """
    scores = {
        "Visual": 0,
        "Auditory": 0,
        "Reading/Writing": 0,
        "Kinesthetic": 0,
    }

    scored_any = False
    for answer in answers:
        if not answer:
            continue  # unanswered question
        label = re.search(r"\(([^()]*)\)\s*$", answer)
        if label and label.group(1) in scores:
            scores[label.group(1)] += 1
            scored_any = True

    if not scored_any:
        # With every score at zero all four styles would "tie" for first place.
        return "Please answer at least one question to see your learning style."

    max_score = max(scores.values())
    dominant_styles = [style for style, score in scores.items() if score == max_score]
    if len(dominant_styles) == 1:
        result = f"Your primary learning style is: {dominant_styles[0]}"
    else:
        result = f"You have multiple strong learning styles: {', '.join(dominant_styles)}"

    total = len(answers)
    ranked = sorted(scores.items(), key=lambda item: item[1], reverse=True)
    result += "\n\nDetailed Scores:\n"
    result += "".join(f"{style}: {score}/{total}\n" for style, score in ranked)
    return result
# ========== SAVE STUDENT PROFILE FUNCTION ========== | |
def save_profile(name, age, interests, transcript, learning_style, favorites, blog):
    """Write the student's profile to a JSON file and return a Markdown summary.

    The profile is saved as ``student_profiles/<name>_profile.json`` (the
    directory is created if needed).

    Args:
        name: Student name; also used, in sanitised form, for the file name.
        age: Student age.
        interests: Free-text interests.
        transcript: Parsed transcript data (or ``None``); rendered with
            ``transcript_display``.
        learning_style: Learning-style result text.
        favorites: Dict with the keys ``movie``, ``show``, ``book``,
            ``character`` and the matching ``*_reason`` keys.
        blog: Optional blog text.

    Returns:
        A Markdown string summarising the profile.
    """
    def _to_jsonable(value):
        # numpy/pandas scalars (e.g. int64 read from a spreadsheet) are not
        # handled by json; they expose .item() to get the native value.
        if hasattr(value, "item"):
            return value.item()
        raise TypeError(
            f"Object of type {type(value).__name__} is not JSON serializable"
        )

    data = {
        "name": name,
        "age": age,
        "interests": interests,
        "transcript": transcript,
        "learning_style": learning_style,
        "favorites": favorites,
        "blog": blog,
    }

    # The name comes from a web form: keep only word characters and dashes so
    # it cannot contain path separators or "..", and never ends up empty.
    safe_stem = re.sub(r"[^\w\-]+", "_", (name or "").strip()).strip("_") or "unnamed"
    os.makedirs("student_profiles", exist_ok=True)
    json_path = os.path.join("student_profiles", f"{safe_stem}_profile.json")
    with open(json_path, "w", encoding="utf-8") as f:
        json.dump(data, f, indent=2, default=_to_jsonable)

    favorites = favorites or {}
    favorite_lines = [
        f"- {label}: {favorites.get(key, '')} ({favorites.get(key + '_reason', '')})"
        for label, key in (
            ("Movie", "movie"),
            ("Show", "show"),
            ("Book", "book"),
            ("Character", "character"),
        )
    ]
    summary_lines = [
        f"### Student Profile: {name}",
        f"**Age:** {age}",
        f"**Interests:** {interests}",
        f"**Learning Style:** {learning_style}",
        "#### Transcript:",
        f"{transcript_display(transcript)}",
        "#### Favorites:",
        *favorite_lines,
        "#### Blog:",
        f"{blog if blog else '_No blog provided_'}",
    ]
    return "\n".join(summary_lines) + "\n"
def _format_gpa_summary(gpa):
    """Render a GPA value, or a {kind: value} GPA dict, as short readable text."""
    if isinstance(gpa, dict):
        known = [f"{value} ({kind})" for kind, value in gpa.items() if value != "N/A"]
        return ", ".join(known) if known else "N/A"
    return str(gpa)


def _grouped_course_lines(courses_by_grade):
    """Return Markdown lines for a grade-level -> course-list mapping.

    Each group is a blank line, a bold ``**Grade X**`` heading, then one
    bullet per course (with its grade when the course entry has one).
    """
    lines = []
    for grade_level, courses in courses_by_grade.items():
        lines.append("")
        lines.append(f"**Grade {grade_level}**")
        for course in courses:
            if isinstance(course, dict):
                line = f"- {course.get('course', '')}"
                if 'grade' in course:
                    line += f" (Grade: {course['grade']})"
            else:
                line = f"- {course}"
            lines.append(line)
    return lines


def transcript_display(transcript_dict):
    """Render transcript data as Markdown text.

    Accepted inputs:
      * a falsy value -> ``"No transcript uploaded."``;
      * a grade-level -> course-list dict (every value a list) -> one bold
        heading per grade level with its courses as bullets;
      * a dict with ``"courses"``, ``"grade_level"`` and ``"gpa"`` keys ->
        the courses (a flat list, or grouped by grade level when
        ``"courses"`` is itself a dict), a blank line, then the grade level
        and GPA.  Missing keys are shown as ``N/A``.

    Args:
        transcript_dict: Transcript data in one of the shapes above.

    Returns:
        The Markdown text.
    """
    if not transcript_dict:
        return "No transcript uploaded."

    if (
        isinstance(transcript_dict, dict)
        and "courses" not in transcript_dict
        and all(isinstance(v, list) for v in transcript_dict.values())
    ):
        return "\n".join(_grouped_course_lines(transcript_dict)) + "\n"

    courses = transcript_dict.get("courses") or []
    if isinstance(courses, dict):
        # Drop the blank line that precedes the first heading.
        lines = _grouped_course_lines(courses)[1:]
    else:
        lines = [f"- {course}" for course in courses]
    if lines:
        # A blank line ends the bullet list so the summary lines below are
        # not absorbed into the last bullet when rendered as Markdown.
        lines.append("")
    lines.append(f"Grade Level: {transcript_dict.get('grade_level', 'N/A')}")
    lines.append(f"GPA: {_format_gpa_summary(transcript_dict.get('gpa', 'N/A'))}")
    return "\n".join(lines)
# ========== GRADIO INTERFACE ========== | |
with gr.Blocks() as app:
    # Step 1: upload a transcript; the parsed summary goes to the textbox and
    # the structured data is kept in session state for the final step.
    with gr.Tab("Step 1: Upload Transcript"):
        transcript_file = gr.File(label="Upload your transcript (CSV, Excel, or PDF)")
        transcript_output = gr.Textbox(label="Transcript Output")
        transcript_data = gr.State()
        transcript_file.change(
            fn=parse_transcript,
            inputs=transcript_file,
            outputs=[transcript_output, transcript_data],
        )

    # Step 2: one radio group per quiz question, numbered from 1.
    with gr.Tab("Step 2: Learning Style Quiz"):
        gr.Markdown("### Complete this 20-question quiz to determine your learning style")
        quiz_components = [
            gr.Radio(choices=choices, label=f"{number}. {prompt}")
            for number, (prompt, choices) in enumerate(
                zip(learning_style_questions, learning_style_options), start=1
            )
        ]
        learning_output = gr.Textbox(label="Learning Style Result", lines=5)
        submit_quiz = gr.Button("Submit Quiz")
        submit_quiz.click(
            learning_style_quiz,
            inputs=quiz_components,
            outputs=learning_output,
        )

    # Step 3: free-text personal questions.
    with gr.Tab("Step 3: Personal Questions"):
        name = gr.Textbox(label="What's your name?")
        age = gr.Number(label="How old are you?")
        interests = gr.Textbox(label="What are your interests?")
        movie = gr.Textbox(label="Favorite movie?")
        movie_reason = gr.Textbox(label="Why do you like that movie?")
        show = gr.Textbox(label="Favorite TV show?")
        show_reason = gr.Textbox(label="Why do you like that show?")
        book = gr.Textbox(label="Favorite book?")
        book_reason = gr.Textbox(label="Why do you like that book?")
        character = gr.Textbox(label="Favorite character?")
        character_reason = gr.Textbox(label="Why do you like that character?")
        blog_checkbox = gr.Checkbox(label="Do you want to write a blog?", value=False)
        blog_text = gr.Textbox(label="Write your blog here", visible=False, lines=5)

        def toggle_blog_box(wants_blog):
            """Show the blog textbox only while the checkbox is ticked."""
            return gr.update(visible=wants_blog)

        blog_checkbox.change(fn=toggle_blog_box, inputs=blog_checkbox, outputs=blog_text)

    # Step 4: collect everything entered so far, save it and show the summary.
    with gr.Tab("Step 4: Save & Review"):
        output_summary = gr.Markdown()
        save_btn = gr.Button("Save Profile")

        def gather_and_save(name, age, interests, movie, movie_reason, show, show_reason,
                            book, book_reason, character, character_reason, blog, transcript, learning_style):
            """Bundle the favourite answers into one dict and delegate to save_profile."""
            favorites = dict(
                movie=movie,
                movie_reason=movie_reason,
                show=show,
                show_reason=show_reason,
                book=book,
                book_reason=book_reason,
                character=character,
                character_reason=character_reason,
            )
            return save_profile(name, age, interests, transcript, learning_style, favorites, blog)

        profile_inputs = [
            name, age, interests,
            movie, movie_reason,
            show, show_reason,
            book, book_reason,
            character, character_reason,
            blog_text,
            transcript_data, learning_output,
        ]
        save_btn.click(fn=gather_and_save, inputs=profile_inputs, outputs=output_summary)

app.launch()