Final_project / app.py
Dannyar608's picture
Update app.py
8912b3c verified
raw
history blame
20.9 kB
import gradio as gr
import pandas as pd
import json
import os
import re
from PyPDF2 import PdfReader
from collections import defaultdict
# ========== TRANSCRIPT PARSING FUNCTIONS ==========
def extract_courses_with_grade_levels(text):
grade_level_pattern = r"(Grade|Year)\s*[:]?\s*(\d+|Freshman|Sophomore|Junior|Senior)"
grade_match = re.search(grade_level_pattern, text, re.IGNORECASE)
current_grade_level = grade_match.group(2) if grade_match else "Unknown"
course_pattern = r"""
(?:^|\n)
(?: (Grade|Year)\s*[:]?\s*(\d+|Freshman|Sophomore|Junior|Senior)\s*[\n-]* )?
(
(?:[A-Z]{2,}\s?\d{3})
|
[A-Z][a-z]+(?:\s[A-Z][a-z]+)*
)
\s*
(?: [:\-]?\s* ([A-F][+-]?|\d{2,3}%)? )?
"""
courses_by_grade = defaultdict(list)
current_grade = current_grade_level
for match in re.finditer(course_pattern, text, re.VERBOSE | re.MULTILINE):
grade_context, grade_level, course, grade = match.groups()
if grade_context:
current_grade = grade_level
if course:
course_info = {"course": course.strip()}
if grade:
course_info["grade"] = grade.strip()
courses_by_grade[current_grade].append(course_info)
return dict(courses_by_grade)
def parse_transcript(file):
if file.name.endswith('.csv'):
df = pd.read_csv(file)
elif file.name.endswith('.xlsx'):
df = pd.read_excel(file)
elif file.name.endswith('.pdf'):
text = ''
reader = PdfReader(file)
for page in reader.pages:
page_text = page.extract_text()
if page_text:
text += page_text + '\n'
# Grade level extraction
grade_match = re.search(r'(Grade|Year)[\s:]*(\d+|Freshman|Sophomore|Junior|Senior)', text, re.IGNORECASE)
grade_level = grade_match.group(2) if grade_match else "Unknown"
# Enhanced GPA extraction
gpa_data = {'weighted': "N/A", 'unweighted': "N/A"}
gpa_patterns = [
r'Weighted GPA[\s:]*(\d\.\d{1,2})',
r'GPA \(Weighted\)[\s:]*(\d\.\d{1,2})',
r'Cumulative GPA \(Weighted\)[\s:]*(\d\.\d{1,2})',
r'Unweighted GPA[\s:]*(\d\.\d{1,2})',
r'GPA \(Unweighted\)[\s:]*(\d\.\d{1,2})',
r'Cumulative GPA \(Unweighted\)[\s:]*(\d\.\d{1,2})',
r'GPA[\s:]*(\d\.\d{1,2})'
]
for pattern in gpa_patterns:
for match in re.finditer(pattern, text, re.IGNORECASE):
gpa_value = match.group(1)
if 'weighted' in pattern.lower():
gpa_data['weighted'] = gpa_value
elif 'unweighted' in pattern.lower():
gpa_data['unweighted'] = gpa_value
else:
if gpa_data['unweighted'] == "N/A":
gpa_data['unweighted'] = gpa_value
if gpa_data['weighted'] == "N/A":
gpa_data['weighted'] = gpa_value
courses_by_grade = extract_courses_with_grade_levels(text)
output_text = f"Grade Level: {grade_level}\n\n"
if gpa_data['weighted'] != "N/A" or gpa_data['unweighted'] != "N/A":
output_text += "GPA Information:\n"
if gpa_data['unweighted'] != "N/A":
output_text += f"- Unweighted GPA: {gpa_data['unweighted']}\n"
if gpa_data['weighted'] != "N/A":
output_text += f"- Weighted GPA: {gpa_data['weighted']}\n"
else:
output_text += "No GPA information found\n"
output_text += "\n(Courses not shown here)"
return output_text, {
"gpa": gpa_data,
"grade_level": grade_level,
"courses": courses_by_grade
}
else:
return "Unsupported file format", None
# For CSV/XLSX fallback
gpa = "N/A"
for col in ['GPA', 'Grade Point Average', 'Cumulative GPA']:
if col in df.columns:
gpa = df[col].iloc[0] if isinstance(df[col].iloc[0], (float, int)) else "N/A"
break
grade_level = "N/A"
for col in ['Grade Level', 'Grade', 'Class', 'Year']:
if col in df.columns:
grade_level = df[col].iloc[0]
break
courses = []
for col in ['Course', 'Subject', 'Course Name', 'Class']:
if col in df.columns:
courses = df[col].tolist()
break
output_text = f"Grade Level: {grade_level}\nGPA: {gpa}\n\nCourses:\n"
output_text += "\n".join(f"- {course}" for course in courses)
return output_text, {
"gpa": {"unweighted": gpa, "weighted": "N/A"},
"grade_level": grade_level,
"courses": courses
}
# ========== LEARNING STYLE QUIZ ==========
learning_style_questions = [
"When you study for a test, you prefer to:",
"When you need directions to a new place, you prefer:",
"When you learn a new skill, you prefer to:",
"When you're trying to concentrate, you:",
"When you meet new people, you remember them by:",
"When you're relaxing, you prefer to:",
"When you're explaining something to someone, you:",
"When you're trying to remember something, you:",
"When you're in a classroom, you learn best when:",
"When you're trying to solve a problem, you:",
"When you're taking notes, you:",
"When you're learning new software, you prefer to:",
"When you're at a museum, you spend the most time:",
"When you're assembling furniture, you:",
"When you're learning new vocabulary, you:",
"When you're giving a presentation, you prefer:",
"When you're at a party, you enjoy:",
"When you're taking a break from studying, you:",
"When you're learning dance moves, you:",
"When you're choosing a book, you prefer:"
]
learning_style_options = [
["Read the textbook (Reading/Writing)", "Listen to lectures (Auditory)", "Use diagrams/charts (Visual)", "Practice problems (Kinesthetic)"],
["Look at a map (Visual)", "Have someone tell you (Auditory)", "Write down directions (Reading/Writing)", "Try walking/driving there (Kinesthetic)"],
["Read instructions (Reading/Writing)", "Have someone show you (Visual)", "Listen to explanations (Auditory)", "Try it yourself (Kinesthetic)"],
["Need quiet (Reading/Writing)", "Need background noise (Auditory)", "Need to move around (Kinesthetic)", "Need visual stimulation (Visual)"],
["Their face (Visual)", "Their name (Auditory)", "What you talked about (Reading/Writing)", "What you did together (Kinesthetic)"],
["Read (Reading/Writing)", "Listen to music (Auditory)", "Watch TV (Visual)", "Do something active (Kinesthetic)"],
["Write it down (Reading/Writing)", "Tell them verbally (Auditory)", "Show them (Visual)", "Demonstrate physically (Kinesthetic)"],
["See it written down (Visual)", "Say it out loud (Auditory)", "Write it down (Reading/Writing)", "Do it physically (Kinesthetic)"],
["Reading materials (Reading/Writing)", "Listening to lectures (Auditory)", "Seeing diagrams (Visual)", "Doing hands-on activities (Kinesthetic)"],
["Write down steps (Reading/Writing)", "Talk through it (Auditory)", "Draw diagrams (Visual)", "Try different approaches (Kinesthetic)"],
["Write detailed notes (Reading/Writing)", "Record lectures (Auditory)", "Draw mind maps (Visual)", "Take minimal notes (Kinesthetic)"],
["Read the manual (Reading/Writing)", "Have someone explain it (Auditory)", "Watch tutorial videos (Visual)", "Just start using it (Kinesthetic)"],
["Reading descriptions (Reading/Writing)", "Listening to audio guides (Auditory)", "Looking at exhibits (Visual)", "Interactive displays (Kinesthetic)"],
["Read instructions first (Reading/Writing)", "Ask someone to help (Auditory)", "Look at diagrams (Visual)", "Start assembling (Kinesthetic)"],
["Write them repeatedly (Reading/Writing)", "Say them repeatedly (Auditory)", "Use flashcards (Visual)", "Use them in conversation (Kinesthetic)"],
["Having detailed notes (Reading/Writing)", "Speaking freely (Auditory)", "Using visual aids (Visual)", "Demonstrating something (Kinesthetic)"],
["Conversations (Auditory)", "People-watching (Visual)", "Dancing/games (Kinesthetic)", "Reading about people (Reading/Writing)"],
["Read for fun (Reading/Writing)", "Listen to music (Auditory)", "Watch videos (Visual)", "Exercise (Kinesthetic)"],
["Watch demonstrations (Visual)", "Listen to instructions (Auditory)", "Read choreography (Reading/Writing)", "Try the moves (Kinesthetic)"],
["Text-heavy books (Reading/Writing)", "Audiobooks (Auditory)", "Books with pictures (Visual)", "Interactive books (Kinesthetic)"]
]
def learning_style_quiz(*answers):
scores = {
"Visual": 0,
"Auditory": 0,
"Reading/Writing": 0,
"Kinesthetic": 0
}
# Map each answer to a learning style
for i, answer in enumerate(answers):
if answer in learning_style_options[i][0]:
scores["Reading/Writing"] += 1
elif answer in learning_style_options[i][1]:
scores["Auditory"] += 1
elif answer in learning_style_options[i][2]:
scores["Visual"] += 1
elif answer in learning_style_options[i][3]:
scores["Kinesthetic"] += 1
# Get the highest score(s)
max_score = max(scores.values())
dominant_styles = [style for style, score in scores.items() if score == max_score]
# Generate result
if len(dominant_styles) == 1:
result = f"Your primary learning style is: {dominant_styles[0]}"
else:
result = f"You have multiple strong learning styles: {', '.join(dominant_styles)}"
# Add detailed breakdown
result += "\n\nDetailed Scores:\n"
for style, score in sorted(scores.items(), key=lambda x: x[1], reverse=True):
result += f"{style}: {score}/20\n"
return result
# ========== SAVE STUDENT PROFILE FUNCTION ==========
def save_profile(name, age, interests, transcript, learning_style, favorites, blog):
data = {
"name": name,
"age": age,
"interests": interests,
"transcript": transcript,
"learning_style": learning_style,
"favorites": favorites,
"blog": blog
}
os.makedirs("student_profiles", exist_ok=True)
json_path = os.path.join("student_profiles", f"{name.replace(' ', '_')}_profile.json")
with open(json_path, "w") as f:
json.dump(data, f, indent=2)
markdown_summary = f"""### Student Profile: {name}
**Age:** {age}
**Interests:** {interests}
**Learning Style:** {learning_style}
#### Transcript:
{transcript_display(transcript)}
#### Favorites:
- Movie: {favorites['movie']} ({favorites['movie_reason']})
- Show: {favorites['show']} ({favorites['show_reason']})
- Book: {favorites['book']} ({favorites['book_reason']})
- Character: {favorites['character']} ({favorites['character_reason']})
#### Blog:
{blog if blog else "_No blog provided_"}
"""
return markdown_summary
def transcript_display(transcript_dict):
if not transcript_dict:
return "No transcript uploaded."
if isinstance(transcript_dict, dict) and all(isinstance(v, list) for v in transcript_dict.values()):
display = ""
for grade_level, courses in transcript_dict.items():
display += f"\n**Grade {grade_level}**\n"
for course in courses:
display += f"- {course['course']}"
if 'grade' in course:
display += f" (Grade: {course['grade']})"
display += "\n"
return display
return "\n".join([f"- {course}" for course in transcript_dict["courses"]] +
[f"Grade Level: {transcript_dict['grade_level']}", f"GPA: {transcript_dict['gpa']}"])
# ========== AI TEACHING ASSISTANT ==========
def load_profile():
files = [f for f in os.listdir("student_profiles") if f.endswith('.json')]
if files:
with open(os.path.join("student_profiles", files[0]), "r") as f:
return json.load(f)
return {}
def generate_response(message, history):
profile = load_profile()
if not profile:
return "Please complete and save your profile first using the previous tabs."
# Get profile data
learning_style = profile.get("learning_style", "")
grade_level = profile.get("transcript", {}).get("grade_level", "unknown")
gpa = profile.get("transcript", {}).get("gpa", {})
interests = profile.get("interests", "")
# Common responses
greetings = ["hi", "hello", "hey"]
study_help = ["study", "learn", "prepare", "exam"]
grade_help = ["grade", "gpa", "score"]
interest_help = ["interest", "hobby", "passion"]
if any(greet in message.lower() for greet in greetings):
return f"Hello {profile.get('name', 'there')}! How can I help you today?"
elif any(word in message.lower() for word in study_help):
if "Visual" in learning_style:
response = ("Based on your visual learning style, I recommend:\n"
"- Creating mind maps or diagrams\n"
"- Using color-coded notes\n"
"- Watching educational videos\n"
"- Drawing concepts to understand them better")
elif "Auditory" in learning_style:
response = ("Based on your auditory learning style, I recommend:\n"
"- Recording lectures and listening to them\n"
"- Participating in study groups\n"
"- Explaining concepts out loud\n"
"- Using mnemonic devices with rhymes")
elif "Reading/Writing" in learning_style:
response = ("Based on your reading/writing learning style, I recommend:\n"
"- Writing detailed notes\n"
"- Creating summaries in your own words\n"
"- Reading textbooks and articles\n"
"- Making flashcards with written explanations")
elif "Kinesthetic" in learning_style:
response = ("Based on your kinesthetic learning style, I recommend:\n"
"- Hands-on practice\n"
"- Creating physical models\n"
"- Taking frequent movement breaks\n"
"- Using real-world applications of concepts")
else:
response = ("Here are some general study tips:\n"
"- Break study sessions into 25-minute chunks\n"
"- Review material regularly\n"
"- Teach concepts to someone else\n"
"- Practice with past exams or problems")
# Add grade-specific advice
if "9" in grade_level or "Freshman" in grade_level:
response += "\n\nAs a freshman, focus on building good study habits early."
elif "10" in grade_level or "Sophomore" in grade_level:
response += "\n\nAs a sophomore, start exploring subjects that interest you."
elif "11" in grade_level or "Junior" in grade_level:
response += "\n\nAs a junior, focus on preparing for college entrance exams."
elif "12" in grade_level or "Senior" in grade_level:
response += "\n\nAs a senior, balance college applications with maintaining your grades."
return response
elif any(word in message.lower() for word in grade_help):
return (f"Your GPA information:\n"
f"- Unweighted: {gpa.get('unweighted', 'N/A')}\n"
f"- Weighted: {gpa.get('weighted', 'N/A')}\n\n"
"To improve your grades:\n"
"- Set specific, measurable goals\n"
"- Meet with teachers to understand expectations\n"
"- Develop a consistent study schedule\n"
"- Focus on your weakest areas first")
elif any(word in message.lower() for word in interest_help):
return (f"I see you're interested in: {interests}\n\n"
"You might want to:\n"
"- Find clubs or activities related to these interests\n"
"- Explore career paths that align with them\n"
"- Connect these interests to your school subjects")
elif "help" in message.lower():
return ("I can help with:\n"
"- Study tips based on your learning style\n"
"- GPA and grade information\n"
"- Academic advice tailored to your grade level\n"
"- Connecting your interests to learning\n\n"
"Try asking about:\n"
"- How to study for your classes\n"
"- Ways to improve your grades\n"
"- How to connect your interests to school")
else:
return ("I'm your personalized teaching assistant. I can help with:\n"
"- Study strategies based on your learning style\n"
"- Understanding your academic performance\n"
"- Finding ways to connect school with your interests\n\n"
"Try asking me about study tips or your academic progress!")
# ========== GRADIO INTERFACE ==========
with gr.Blocks() as app:
with gr.Tab("Step 1: Upload Transcript"):
transcript_file = gr.File(label="Upload your transcript (CSV, Excel, or PDF)")
transcript_output = gr.Textbox(label="Transcript Output")
transcript_data = gr.State()
transcript_file.change(fn=parse_transcript, inputs=transcript_file, outputs=[transcript_output, transcript_data])
with gr.Tab("Step 2: Learning Style Quiz"):
gr.Markdown("### Complete this 20-question quiz to determine your learning style")
quiz_components = []
for i, (question, options) in enumerate(zip(learning_style_questions, learning_style_options)):
quiz_components.append(
gr.Radio(choices=options, label=f"{i+1}. {question}")
)
learning_output = gr.Textbox(label="Learning Style Result", lines=5)
gr.Button("Submit Quiz").click(
learning_style_quiz,
inputs=quiz_components,
outputs=learning_output
)
with gr.Tab("Step 3: Personal Questions"):
name = gr.Textbox(label="What's your name?")
age = gr.Number(label="How old are you?")
interests = gr.Textbox(label="What are your interests?")
movie = gr.Textbox(label="Favorite movie?")
movie_reason = gr.Textbox(label="Why do you like that movie?")
show = gr.Textbox(label="Favorite TV show?")
show_reason = gr.Textbox(label="Why do you like that show?")
book = gr.Textbox(label="Favorite book?")
book_reason = gr.Textbox(label="Why do you like that book?")
character = gr.Textbox(label="Favorite character?")
character_reason = gr.Textbox(label="Why do you like that character?")
blog_checkbox = gr.Checkbox(label="Do you want to write a blog?", value=False)
blog_text = gr.Textbox(label="Write your blog here", visible=False, lines=5)
blog_checkbox.change(fn=lambda x: gr.update(visible=x), inputs=blog_checkbox, outputs=blog_text)
with gr.Tab("Step 4: Save & Review"):
output_summary = gr.Markdown()
save_btn = gr.Button("Save Profile")
def gather_and_save(name, age, interests, movie, movie_reason, show, show_reason,
book, book_reason, character, character_reason, blog, transcript, learning_style):
favorites = {
"movie": movie,
"movie_reason": movie_reason,
"show": show,
"show_reason": show_reason,
"book": book,
"book_reason": book_reason,
"character": character,
"character_reason": character_reason,
}
return save_profile(name, age, interests, transcript, learning_style, favorites, blog)
save_btn.click(fn=gather_and_save,
inputs=[name, age, interests, movie, movie_reason, show, show_reason,
book, book_reason, character, character_reason, blog_text,
transcript_data, learning_output],
outputs=output_summary)
# AI Teaching Assistant Tab
with gr.Tab("🤖 AI Teaching Assistant"):
gr.Markdown("## Your Personalized Learning Assistant")
chatbot = gr.ChatInterface(
fn=generate_response,
examples=[
"How should I study for my next test?",
"What's my GPA information?",
"How can I improve my grades?",
"How can I connect my interests to school?"
]
)
app.launch()