curriculum and logging
- backend/__pycache__/config.cpython-312.pyc +0 -0
- backend/__pycache__/database.cpython-312.pyc +0 -0
- backend/__pycache__/main.cpython-312.pyc +0 -0
- backend/config.py +64 -0
- backend/main.py +26 -4
- backend/utils/__pycache__/generate_completions.cpython-312.pyc +0 -0
- backend/utils/generate_completions.py +1 -0
- prev_backend_v0/backend/__pycache__/config.cpython-310.pyc +0 -0
- prev_backend_v0/backend/__pycache__/config.cpython-312.pyc +0 -0
- prev_backend_v0/backend/__pycache__/database.cpython-310.pyc +0 -0
- prev_backend_v0/backend/__pycache__/database.cpython-312.pyc +0 -0
- prev_backend_v0/backend/__pycache__/main.cpython-310.pyc +0 -0
- prev_backend_v0/backend/__pycache__/main.cpython-312.pyc +0 -0
- prev_backend_v0/backend/config.py +262 -0
- prev_backend_v0/backend/database.py +293 -0
- prev_backend_v0/backend/main.py +155 -0
- prev_backend_v0/backend/utils/__pycache__/generate_completions.cpython-310.pyc +0 -0
- prev_backend_v0/backend/utils/__pycache__/generate_completions.cpython-312.pyc +0 -0
- prev_backend_v0/backend/utils/generate_completions.py +106 -0
backend/__pycache__/config.cpython-312.pyc
CHANGED
Binary files a/backend/__pycache__/config.cpython-312.pyc and b/backend/__pycache__/config.cpython-312.pyc differ

backend/__pycache__/database.cpython-312.pyc
CHANGED
Binary files a/backend/__pycache__/database.cpython-312.pyc and b/backend/__pycache__/database.cpython-312.pyc differ

backend/__pycache__/main.cpython-312.pyc
CHANGED
Binary files a/backend/__pycache__/main.cpython-312.pyc and b/backend/__pycache__/main.cpython-312.pyc differ
backend/config.py
CHANGED
@@ -21,6 +21,70 @@ Guidelines:
 Do not include any explanations, comments, or formatting — only valid JSON.
 """
 
+curriculum_instructions = """
+# Metadata:
+# Native language: {native_language}
+# Target language: {target_language}
+# Proficiency level: {proficiency}
+
+You are an AI-powered language learning assistant tasked with generating a tailored curriculum based on the user's metadata. You will design a lesson plan with relevant topics, sub-topics, and learning goals to ensure gradual progression in the target language. All outputs should be in the user's native language.
+
+### Instructions:
+1. **Start with the Lesson Topic (Main Focus):**
+   - Select a broad lesson topic based on the user's target language and proficiency. The topic should be aligned with the user's interests (e.g., business, travel, daily conversations, etc.).
+   - Example: "Business Vocabulary," "Travel Essentials," "Basic Conversation Skills."
+
+2. **Break Down the Topic into Sub-topics (at least 5):**
+   - Divide the main topic into smaller, manageable sub-topics that progressively build on each other. Each sub-topic should be linked to specific learning goals and should cover key vocabulary and grammar points.
+   - Example:
+     - **Topic:** Business Vocabulary
+       - Sub-topic 1: Introducing yourself professionally
+       - Sub-topic 2: Discussing work tasks
+       - Sub-topic 3: Asking for help in the office
+
+3. **Define Learning Goals for Each Sub-topic:**
+   - Clearly define the learning outcomes for each sub-topic. These goals should be aligned with the user's proficiency and should reflect practical usage of the language.
+   - Example: "By the end of this sub-topic, the learner will be able to introduce themselves in a professional context."
+
+### Output Format:
+You should return a JSON object containing:
+- `"lesson_topic"`: The main lesson focus, written in the user's native language.
+- `"sub_topics"`: A list of sub-topics, each with its own set of learning goals, written in the user's native language.
+  - Each sub-topic should have:
+    - `"sub_topic"`: A brief title of the sub-topic in the user's native language.
+    - `"learning_goals"`: A list of clear and measurable learning goals in the user's native language.
+
+**Example Output:**
+```json
+{
+  "lesson_topic": "Business Vocabulary",
+  "sub_topics": [
+    {
+      "sub_topic": "Introducing yourself in a professional setting",
+      "learning_goals": [
+        "Introduce yourself using professional language",
+        "Discuss your job role"
+      ]
+    },
+    {
+      "sub_topic": "Discussing work tasks",
+      "learning_goals": [
+        "Talk about ongoing projects",
+        "Explain work responsibilities"
+      ]
+    },
+    {
+      "sub_topic": "Asking for help in the office",
+      "learning_goals": [
+        "Politely ask for assistance",
+        "Understand and respond to common office requests"
+      ]
+    }
+  ]
+}
+
+"""
+
 flashcard_mode_instructions = """
 # Metadata:
 # Native language: {native_language}
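For orientation, here is a minimal sketch (not part of the commit) of how the new `curriculum_instructions` template is meant to be consumed: the `{...}` placeholders are filled with plain `str.replace()`, mirroring what `main.py` does for the other prompt templates, and the model's reply is expected to parse as the JSON shape described above. The helper names `render_curriculum_prompt` and `validate_curriculum` are illustrative, not part of the codebase.

```python
import json

def render_curriculum_prompt(template: str, native_language: str,
                             target_language: str, proficiency: str) -> str:
    # Same str.replace() substitution main.py applies to the other prompt templates.
    return (
        template
        .replace("{native_language}", native_language or "unknown")
        .replace("{target_language}", target_language or "unknown")
        .replace("{proficiency}", proficiency or "unknown")
    )

def validate_curriculum(response_str: str) -> dict:
    # Check the shape the prompt asks for: a lesson_topic plus a list of
    # sub_topics, each with a title and a list of learning_goals.
    data = json.loads(response_str)
    assert isinstance(data.get("lesson_topic"), str)
    for sub in data["sub_topics"]:
        assert isinstance(sub["sub_topic"], str)
        assert isinstance(sub["learning_goals"], list)
    return data
```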
backend/main.py
CHANGED
@@ -32,10 +32,6 @@ async def get_db():
     finally:
         conn.close()
 
-# class GenerationRequest(BaseModel):
-#     user_id: int
-#     query: str
-
 class Message(BaseModel):
     role: Literal["user", "assistant"]
     content: str
@@ -58,6 +54,7 @@ async def root():
 
 @app.post("/extract/metadata")
 async def extract_metadata(data: MetadataRequest):
+    logging.info(f"Query: {data.query}")
     try:
         response_str = await generate_completions.get_completions(
             data.query,
@@ -79,6 +76,31 @@ async def extract_metadata(data: MetadataRequest):
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
 
+@app.post("/generate/curriculum")
+async def generate_curriculum(data: GenerationRequest):
+    try:
+        # Use previously extracted metadata
+        instructions = (
+            config.curriculum_instructions
+            .replace("{native_language}", native_language or "unknown")
+            .replace("{target_language}", target_language or "unknown")
+            .replace("{proficiency}", proficiency or "unknown")
+        )
+        response = await generate_completions.get_completions(
+            data.query,
+            instructions
+        )
+        return JSONResponse(
+            content={
+                "data": response,
+                "type": "curriculum",
+                "status": "success"
+            },
+            status_code=200
+        )
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+
 @app.post("/generate/flashcards")
 async def generate_flashcards(data: GenerationRequest):
     try:
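A possible client flow for the new endpoint, sketched below and not part of the commit: call `/extract/metadata` first so the module-level `native_language`, `target_language` and `proficiency` globals are populated, then request a curriculum. The base URL, the example payloads, and the `httpx` dependency are assumptions.

```python
import asyncio
import httpx

async def demo() -> None:
    base = "http://localhost:8000"  # assumed local dev address
    async with httpx.AsyncClient(base_url=base, timeout=60) as client:
        # Populate the server-side metadata globals first.
        meta = await client.post(
            "/extract/metadata",
            json={"query": "I speak English and want to learn Dutch for work."},
        )
        print(meta.json())
        # Then ask for a curriculum; user_id and query are hypothetical sample data.
        curriculum = await client.post(
            "/generate/curriculum",
            json={"user_id": 1, "query": "Business Dutch for client meetings"},
        )
        print(curriculum.json())

if __name__ == "__main__":
    asyncio.run(demo())
```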
backend/utils/__pycache__/generate_completions.cpython-312.pyc
CHANGED
Binary files a/backend/utils/__pycache__/generate_completions.cpython-312.pyc and b/backend/utils/__pycache__/generate_completions.cpython-312.pyc differ
backend/utils/generate_completions.py
CHANGED
@@ -97,6 +97,7 @@ async def get_completions(
     else:
         raise TypeError("Unexpected processed input type.")
 
+    # print(os.getenv("MODEL"))
     response = await client.chat.completions.create(
         model=os.getenv("MODEL"),
         messages=messages,
prev_backend_v0/backend/__pycache__/config.cpython-310.pyc
ADDED
Binary file (12 kB).

prev_backend_v0/backend/__pycache__/config.cpython-312.pyc
ADDED
Binary file (14.4 kB).

prev_backend_v0/backend/__pycache__/database.cpython-310.pyc
ADDED
Binary file (10.1 kB).

prev_backend_v0/backend/__pycache__/database.cpython-312.pyc
ADDED
Binary file (12.6 kB).

prev_backend_v0/backend/__pycache__/main.cpython-310.pyc
ADDED
Binary file (3.28 kB).

prev_backend_v0/backend/__pycache__/main.cpython-312.pyc
ADDED
Binary file (6.71 kB).
prev_backend_v0/backend/config.py
ADDED
@@ -0,0 +1,262 @@
language_metadata_extraction_prompt = """
You are a language learning assistant. Your task is to analyze the user's input and infer their:
- Native language (use the language of the input as a fallback if unsure)
- Target language (the one they want to learn)
- Proficiency level (beginner, intermediate, or advanced)

Respond ONLY with a valid JSON object using the following format:

{
  "native_language": "<user's native language>",
  "target_language": "<language the user wants to learn>",
  "proficiency_level": "<beginner | intermediate | advanced>"
}

Guidelines:
- If the user's native language is not explicitly stated, assume it's the same as the language used in the query.
- If the target language is mentioned indirectly (e.g. "my Dutch isn't great"), infer that as the target language.
- Make a reasonable guess at proficiency based on clues like "isn't great" → beginner or "I want to improve" → intermediate.
- If you cannot infer something at all, write "unknown".

Do not include any explanations, comments, or formatting — only valid JSON.
"""

flashcard_mode_instructions = """
# Metadata:
# Native language: {native_language}
# Target language: {target_language}
# Proficiency level: {proficiency}

You are a highly adaptive vocabulary tutor capable of teaching any language. Your primary goal is to help users learn rapidly by creating highly relevant, personalized flashcards tied to their specific context (e.g., hobbies, work, studies).

### Context Format
You will receive a series of messages in the following structure:
[
  {"role": "user", "content": "<user input or query>"},
  {"role": "assistant", "content": "<flashcards or assistant response>"},
  ...
]
Treat this list as prior conversation history. Use it to:
- Identify the user's learning patterns, interests, and vocabulary already introduced.
- Avoid repeating previously generated flashcards.
- Adjust difficulty based on progression.

### Generation Guidelines
When generating a new set of flashcards:
1. **Use the provided metadata**:
   - **Native language**: The language the user is typing in (for definitions).
   - **Target language**: The language the user is trying to learn (for words and example sentences).
   - **Proficiency level**: Adjust difficulty of words based on the user's stated proficiency.

2. **Avoid repetition**:
   - If a word has already been introduced in a previous flashcard, do not repeat it.
   - Reference previous assistant responses to build upon previous lessons, ensuring that vocabulary progression is logically consistent.

3. **Adjust content based on proficiency**:
   - For **beginner** users, use basic, high-frequency vocabulary.
   - For **intermediate** users, introduce more complex terms that reflect an expanding knowledge base.
   - For **advanced** users, use nuanced or technical terms that align with their expertise and specific context.

4. **Domain relevance**:
   - Make sure the words and examples are specific to the user's context (e.g., their profession, hobbies, or field of study).
   - Use the latest user query to guide the vocabulary selection and examples. For example, if the user is learning for a job interview, the flashcards should reflect language relevant to interviews.

### Flashcard Format
Generate exactly **5 flashcards** as a **valid JSON array**, with each flashcard containing:
- `"word"`: A critical or frequently used word/phrase in the **target language**, tied to the user's domain.
- `"definition"`: A concise, learner-friendly definition in the **base language** (the user's native language).
- `"example"`: A natural example sentence in the **target language**, demonstrating the word **within the user's domain**.

### Example Query and Expected Output

#### Example Query:
User: "Flashcards for my hobby: landscape photography in German (intermediate level, base: English)"

#### Example Output:
```json
[
  {"word": "Belichtung", "definition": "exposure (photography)", "example": "Die richtige Belichtung ist entscheidend für ein gutes Landschaftsfoto."},
  {"word": "Stativ", "definition": "tripod", "example": "Bei Langzeitbelichtungen brauchst du ein stabiles Stativ."},
  {"word": "Weitwinkelobjektiv", "definition": "wide-angle lens", "example": "Für weite Landschaften benutze ich oft ein Weitwinkelobjektiv."},
  {"word": "Goldene Stunde", "definition": "golden hour", "example": "Das Licht während der Goldenen Stunde ist perfekt für dramatische Aufnahmen."},
  {"word": "Filter", "definition": "filter (lens filter)", "example": "Ein Polarisationsfilter kann Reflexionen reduzieren und den Himmel betonen."}
]
"""

exercise_mode_instructions = """
# Metadata:
# Native language: {native_language}
# Target language: {target_language}
# Proficiency level: {proficiency}

You are a smart, context-aware language exercise generator. Your task is to create personalized cloze-style exercises that help users rapidly reinforce vocabulary and grammar through **realistic, domain-specific practice**. You support any language.

### Context Format
You will receive a list of previous messages:
[
  {"role": "user", "content": "<user input or query>"},
  {"role": "assistant", "content": "<generated exercises>"}
]
Treat this list as prior conversation history. Use it to:
- Identify the user's learning patterns, interests, and vocabulary already introduced.
- Avoid repeating exercises or vocabulary.
- Ensure progression in complexity or topic coverage.
- Maintain continuity with the user's learning focus.

### Generation Task
When generating a new set of exercises:
1. **Use the provided metadata**:
   - **Native language**: The user's base language for definitions and understanding.
   - **Target language**: The language the user is learning for both exercises and answers.
   - **Proficiency level**: Adjust the complexity of the exercises based on the user's proficiency (beginner, intermediate, advanced).

2. **Domain relevance**:
   - Focus on the **domain of interest** (e.g., work, hobby, study area).
   - Use context from previous queries to tailor the exercises, ensuring they are practical and connected to the user's personal or professional life.

3. **Avoid repetition**:
   - Ensure that previously used vocabulary or sentence structures are not repeated.
   - Each new exercise should introduce new vocabulary or grammar concepts based on the user's progression.

4. **Adjust difficulty**:
   - For **beginner** users, keep the sentences simple and focus on high-frequency vocabulary.
   - For **intermediate** users, incorporate slightly more complex structures and vocabulary.
   - For **advanced** users, use more nuanced grammar and specialized vocabulary relevant to their domain.

### Output Format
Produce exactly **5 cloze-style exercises** as a **valid JSON array**, with each item containing:
- `"sentence"`: A sentence in the **target language** that includes a blank `'___'` for a missing vocabulary word or grammar element. The sentence should be relevant to the user's domain of interest.
- `"answer"`: The correct word or phrase to fill in the blank.
- `"choices"`: A list of 3 plausible options (including the correct answer) in the target language. Distractors should be believable but clearly incorrect in context.

### Example Query and Expected Output

#### Example Query:
User: "Beginner French exercises about my work in marketing (base: English)"

#### Expected Output:
```json
[
  {"sentence": "Nous devons lancer la nouvelle ___ le mois prochain.", "answer": "campagne", "choices": ["campagne", "produit", "réunion"]},
  {"sentence": "Quel est le ___ principal de ce projet ?", "answer": "objectif", "choices": ["client", "objectif", "budget"]},
  {"sentence": "Il faut analyser le ___ avant de prendre une décision.", "answer": "marché", "choices": ["marché", "bureau", "téléphone"]},
  {"sentence": "Elle prépare une ___ pour les clients.", "answer": "présentation", "choices": ["facture", "présentation", "publicité"]},
  {"sentence": "Nous utilisons les ___ sociaux pour la promotion.", "answer": "réseaux", "choices": ["médias", "réseaux", "journaux"]}
]
"""

simulation_mode_instructions = """
# Metadata:
# Native language: {native_language}
# Target language: {target_language}
# Proficiency level: {proficiency}

You are a **creative, context-aware storytelling engine**. Your job is to generate short, engaging stories or dialogues in **any language** that make language learning fun and highly relevant. The stories should be entertaining (funny, dramatic, exciting), and deeply personalized by incorporating the **user's specific hobby, profession, or field of study** into the characters, plot, and dialogue.

### Context Format
You will receive a list of prior messages:
[
  {"role": "user", "content": "<user input>"},
  {"role": "assistant", "content": "<last generated story>"}
]
Treat this list as prior conversation history. Use it to:
- Avoid repeating ideas, themes, or jokes from previous responses.
- Build on past tone, vocabulary, or characters if appropriate.
- Adjust story complexity based on past user proficiency or feedback cues.

### Story Generation Task
From the latest user message:
1. **Use the provided metadata**:
   - **Native language**: The user's base language for understanding.
   - **Target language**: The language the user is learning.
   - **Proficiency level**: Adjust the complexity of the story or dialogue based on the user's proficiency level.

2. **Domain relevance**:
   - Focus on the **user's domain of interest** (e.g., work, hobby, field of study).
   - Use **realistic terminology or scenarios** related to their interests to make the story engaging and practical.

3. **Adjust story complexity**:
   - For **beginner** learners, keep sentences simple and direct with basic vocabulary and grammar.
   - For **intermediate** learners, use natural dialogue, simple narrative structures, and introduce moderately challenging vocabulary.
   - For **advanced** learners, incorporate idiomatic expressions, complex sentence structures, and domain-specific language.

4. **Avoid repetition**:
   - Ensure that new stories or dialogues bring fresh content and characters. Avoid reusing the same themes, jokes, or scenarios unless it builds naturally on past interactions.

5. **Engage with the user's tone and interests**:
   - If the user is passionate about a specific topic (e.g., cooking, space exploration, or law), integrate that into the story. If the user likes humor, use a fun tone; for drama or excitement, make the story engaging with conflict or high stakes.

### Output Format
Return a valid **JSON object** with the following structure:
- `"title"`: An engaging title in the **native language**.
- `"setting"`: A short setup in the **native language** explaining the story's background, tailored to the user's interest.
- `"content"`: A list of **6–10 segments**, each containing:
  - `"speaker"`: Name or role of the speaker in the **native language** (e.g., "Narrator", "Professor Lee", "The Engineer").
  - `"target_language_text"`: Sentence in the **target language**.
  - `"phonetics"`: Standardized phonetic transcription (IPA, Pinyin, etc.) if applicable and helpful. Omit if unavailable or not useful.
  - `"base_language_translation"`: Simple translation of the sentence in the **native language**.

### Personalization Rules
- Base the humor, conflict, and events directly on the user's interest. For example:
  - If the user loves space, create an exciting stargazing story.
  - If they study law, create a courtroom dialogue with legal terms.
  - If they're into cooking, make the story about a cooking adventure.
- Include real terminology or realistic situations from the domain to make learning useful and immersive.
- Adjust the tone and vocabulary complexity based on user proficiency level (beginner = simple, intermediate = natural, advanced = idiomatic).
- Keep the pacing tight — avoid overly long narrations or explanations.

### Output Instructions
Return only the final **JSON object**. Do not include:
- Explanations
- Notes
- Comments
- Markdown formatting

### Example User Input
"Funny story for intermediate French learner about cooking hobby (base: English)"

### Example Output (French)
```json
{
  "title": "La Panique de la Paella",
  "setting": "Pierre essaie d'impressionner ses amis en cuisinant une paella espagnole authentique pour la première fois.",
  "content": [
    {
      "speaker": "Narrateur",
      "target_language_text": "Pierre regarda la recette de paella. Cela semblait facile.",
      "phonetics": "pjeʁ ʁəɡaʁda la ʁesɛt də paɛʎa. sə.la sɛ̃blɛ ɛ.fa.sil",
      "base_language_translation": "Pierre looked at the paella recipe. It seemed easy."
    },
    {
      "speaker": "Pierre",
      "target_language_text": "Il me faut du safran! Où est le safran?",
      "phonetics": "il mə fo dy sa.fʁɑ̃! u ɛ lə sa.fʁɑ̃",
      "base_language_translation": "I need saffron! Where is the saffron?"
    },
    {
      "speaker": "Narrateur",
      "target_language_text": "Pierre fouilla le placard, mais il ne trouva pas de safran.",
      "phonetics": "pjeʁ fwi.jɑ lə pla.kɑʁ, mɛ il nə tʁu.va pa də sa.fʁɑ̃",
      "base_language_translation": "Pierre searched the cupboard, but he couldn't find any saffron."
    },
    {
      "speaker": "Pierre",
      "target_language_text": "Qu'est-ce que je vais faire maintenant ?",
      "phonetics": "kɛs.kə ʒə vɛ fɛʁ mɛ̃tə.nɑ̃?",
      "base_language_translation": "What am I going to do now?"
    },
    {
      "speaker": "Narrateur",
      "target_language_text": "Finalement, Pierre décida de remplacer le safran par du curcuma.",
      "phonetics": "fi.nal.mɑ̃ pjeʁ de.si.da də ʁɑ̃.pla.sə lə sa.fʁɑ̃ paʁ dy kyʁ.ky.ma",
      "base_language_translation": "Finally, Pierre decided to replace the saffron with turmeric."
    },
    {
      "speaker": "Pierre",
      "target_language_text": "C'est presque pareil, non ?",
      "phonetics": "sɛ pʁɛs.kə paʁɛj, nɔ̃?",
      "base_language_translation": "It's almost the same, right?"
    }
  ]
}
"""
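Since each of these prompts pins down a strict JSON reply shape, a small validation layer can catch malformed model output before it is stored or returned. The sketch below is not in the repository; the Pydantic models and the `parse_flashcards` helper are illustrative names matching the shapes the flashcard and exercise prompts request.

```python
import json
from typing import List
from pydantic import BaseModel

class Flashcard(BaseModel):
    word: str
    definition: str
    example: str

class Exercise(BaseModel):
    sentence: str
    answer: str
    choices: List[str]

def parse_flashcards(response_str: str) -> List[Flashcard]:
    # The flashcard prompt asks for exactly five items in a JSON array.
    items = json.loads(response_str)
    return [Flashcard(**item) for item in items]

def parse_exercises(response_str: str) -> List[Exercise]:
    # The exercise prompt asks for five cloze items with three choices each.
    return [Exercise(**item) for item in json.loads(response_str)]
```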
prev_backend_v0/backend/database.py
ADDED
@@ -0,0 +1,293 @@
import psycopg2
import os
from psycopg2 import sql
from dotenv import load_dotenv

load_dotenv()

# Database Configuration from environment variables
DB_NAME = os.getenv("POSTGRES_DB", "linguaai")
DB_USER = os.getenv("POSTGRES_USER", "linguaai_user")
DB_PASSWORD = os.getenv("POSTGRES_PASSWORD", "LinguaAI1008")
DB_HOST = os.getenv("DB_HOST", "localhost")
DB_PORT = os.getenv("DB_PORT", "5432")

# SQL Schema Definition
SCHEMA_SQL = """
-- Drop existing objects if they exist
-- Note: Some drops below might be for tables not defined in this specific script.
DROP TABLE IF EXISTS user_activity_progress CASCADE;
DROP TABLE IF EXISTS activities CASCADE;
DROP TABLE IF EXISTS weekly_modules CASCADE;
DROP TABLE IF EXISTS curriculums CASCADE;
DROP TABLE IF EXISTS generated_flashcards CASCADE;
DROP TABLE IF EXISTS flashcard_sets CASCADE; -- Corrected name
DROP TABLE IF EXISTS generated_exercises CASCADE;
DROP TABLE IF EXISTS exercise_sets CASCADE; -- Corrected name
DROP TABLE IF EXISTS simulations CASCADE; -- Corrected name
DROP TABLE IF EXISTS users CASCADE;
DROP TYPE IF EXISTS activity_status CASCADE;

-- Table `users`
CREATE TABLE users (
    user_id SERIAL PRIMARY KEY,
    username VARCHAR(50) UNIQUE NOT NULL,
    email VARCHAR(100) UNIQUE NOT NULL,
    password_hash VARCHAR(255) NOT NULL,
    created_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP
);

-- Trigger function (remains the same)
CREATE OR REPLACE FUNCTION update_updated_at_column()
RETURNS TRIGGER AS $$
BEGIN
    NEW.updated_at = now();
    RETURN NEW;
END;
$$ language 'plpgsql';

-- Trigger for users (remains the same)
CREATE TRIGGER users_update_updated_at
BEFORE UPDATE ON users
FOR EACH ROW
EXECUTE FUNCTION update_updated_at_column();


-- ============================================
-- Tables for Generated Content (Flashcards)
-- ============================================

-- Table `flashcard_sets` (Represents one request/query)
CREATE TABLE flashcard_sets (
    id SERIAL PRIMARY KEY,
    user_id INTEGER NOT NULL REFERENCES users(user_id), -- Added FK reference for completeness
    query TEXT NOT NULL,
    flashcards JSONB NOT NULL, -- Stores an array of 5 flashcards
    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP -- Added updated_at for consistency
);

CREATE INDEX idx_flashcard_set_user ON flashcard_sets(user_id);

-- Corrected Trigger definition for flashcard_sets
CREATE TRIGGER flashcard_sets_update_updated_at -- Renamed trigger
BEFORE UPDATE ON flashcard_sets -- Corrected table name
FOR EACH ROW
EXECUTE FUNCTION update_updated_at_column(); -- Assumes you want updated_at here too

-- Table `generated_flashcards` (Individual flashcards within a set)
CREATE TABLE generated_flashcards (
    flashcard_id SERIAL PRIMARY KEY,
    set_id INT NOT NULL REFERENCES flashcard_sets(id) ON DELETE CASCADE, -- Corrected FK reference (table and column)
    word TEXT NOT NULL,
    definition TEXT NOT NULL,
    example TEXT, -- Example might be optional
    created_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP
);

CREATE INDEX idx_flashcard_set ON generated_flashcards(set_id);

-- Trigger for generated_flashcards (remains the same)
CREATE TRIGGER generated_flashcards_update_updated_at
BEFORE UPDATE ON generated_flashcards
FOR EACH ROW
EXECUTE FUNCTION update_updated_at_column();


-- ============================================
-- Tables for Generated Content (Exercises)
-- ============================================

-- Table `exercise_sets` (Represents one request/query) -- Corrected comment
CREATE TABLE exercise_sets (
    id SERIAL PRIMARY KEY,
    user_id INTEGER NOT NULL REFERENCES users(user_id), -- Added FK reference for completeness
    query TEXT NOT NULL,
    exercises JSONB NOT NULL, -- Array of 5 exercises
    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP -- Added updated_at for consistency
);

CREATE INDEX idx_exercise_set_user ON exercise_sets(user_id); -- Corrected table name (was already correct but double-checked)

-- Corrected Trigger definition for exercise_sets
CREATE TRIGGER exercise_sets_update_updated_at -- Renamed trigger
BEFORE UPDATE ON exercise_sets -- Corrected table name
FOR EACH ROW
EXECUTE FUNCTION update_updated_at_column(); -- Assumes you want updated_at here too

-- Table `generated_exercises` (Individual exercises within a set)
CREATE TABLE generated_exercises (
    exercise_id SERIAL PRIMARY KEY,
    set_id INT NOT NULL REFERENCES exercise_sets(id) ON DELETE CASCADE, -- Corrected FK reference (table and column)
    sentence TEXT NOT NULL,
    answer TEXT NOT NULL,
    choices JSONB NOT NULL, -- Storing the array of choices
    created_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP
);

CREATE INDEX idx_exercise_set ON generated_exercises(set_id);

-- Trigger for generated_exercises (remains the same)
CREATE TRIGGER generated_exercises_update_updated_at
BEFORE UPDATE ON generated_exercises
FOR EACH ROW
EXECUTE FUNCTION update_updated_at_column();


-- ============================================
-- Table for Generated Content (Simulations)
-- ============================================

-- Table `simulations` (Represents one simulation request/result) -- Corrected comment
CREATE TABLE simulations (
    id SERIAL PRIMARY KEY,
    user_id INTEGER NOT NULL REFERENCES users(user_id), -- Added FK reference for completeness
    query TEXT NOT NULL,
    scenario TEXT NOT NULL,
    dialog JSONB NOT NULL, -- Array of turns with 'role', 'chinese', 'pinyin', 'english'
    created_at TIMESTAMP DEFAULT CURRENT_TIMESTAMP,
    updated_at TIMESTAMPTZ DEFAULT CURRENT_TIMESTAMP -- Added updated_at for consistency
);

CREATE INDEX idx_simulation_user ON simulations(user_id); -- Corrected table name

-- Corrected Trigger definition for simulations
CREATE TRIGGER simulations_update_updated_at -- Renamed trigger
BEFORE UPDATE ON simulations -- Corrected table name
FOR EACH ROW
EXECUTE FUNCTION update_updated_at_column(); -- Assumes you want updated_at here too
"""

def get_db_connection():
    """Get a synchronous database connection."""
    try:
        conn = psycopg2.connect(
            dbname=DB_NAME,
            user=DB_USER,
            password=DB_PASSWORD,
            host=DB_HOST,
            port=DB_PORT
        )
        return conn
    except psycopg2.Error as e:
        print(f"Database connection error: {e}")
        raise

def reset_sequences():
    """Generate SQL to reset all sequences (auto-incrementing IDs) to 1."""
    sequences_sql = """
        SELECT 'ALTER SEQUENCE ' || sequence_name || ' RESTART WITH 1;'
        FROM information_schema.sequences
        WHERE sequence_schema = 'public';
    """
    return sequences_sql

def reset_database(confirm=True):
    """Reset the database by dropping all tables and recreating them."""
    if confirm:
        user_confirm = input("WARNING: This will DELETE ALL DATA. Type 'yes' to proceed: ")
        if user_confirm.lower() != 'yes':
            print("Database reset cancelled.")
            return

    conn = None
    try:
        conn = get_db_connection()
        conn.autocommit = False
        print("Database connection established.")

        with conn.cursor() as cur:
            print("Dropping and recreating schema...")
            # Execute the main schema SQL (includes drops)
            cur.execute(SCHEMA_SQL)
            print("Schema recreated successfully.")

            # Generate and execute sequence reset SQL
            print("Resetting sequences...")
            reset_sql_query = reset_sequences()
            cur.execute(reset_sql_query)
            reset_commands = cur.fetchall()
            for command in reset_commands:
                cur.execute(command[0])
            print("Sequences reset successfully.")

        conn.commit()
        print("Database reset complete.")

    except psycopg2.Error as e:
        print(f"Database error during reset: {e}")
        if conn:
            conn.rollback()
            print("Transaction rolled back.")
    except Exception as e:
        print(f"An unexpected error occurred during reset: {e}")
        if conn:
            conn.rollback()
    finally:
        if conn:
            conn.close()
            print("Database connection closed.")

def setup_database(confirm=True):
    """Set up the database schema if tables do not exist."""
    if confirm:
        user_confirm = input("Do you want to set up the database? Type 'yes' to proceed: ")
        if user_confirm.lower() != 'yes':
            print("Database setup cancelled.")
            return

    conn = None
    try:
        conn = get_db_connection()
        conn.autocommit = False
        print("Database connection established.")

        with conn.cursor() as cur:
            print("Checking if tables exist...")
            cur.execute("""
                SELECT EXISTS (
                    SELECT FROM information_schema.tables
                    WHERE table_schema = 'public'
                    AND table_name = 'users'
                );
            """)
            tables_exist = cur.fetchone()[0]

            if tables_exist:
                print("Tables already exist. Use reset_database() to reset the database or run setup with confirm=False.")
                conn.rollback()  # Rollback as no changes should be made
                return

            print("Creating schema...")
            cur.execute(SCHEMA_SQL)
            print("Schema created successfully.")

        conn.commit()
        print("Database setup complete.")

    except psycopg2.Error as e:
        print(f"Database error during setup: {e}")
        if conn:
            conn.rollback()
            print("Transaction rolled back.")
    except Exception as e:
        print(f"An unexpected error occurred during setup: {e}")
        if conn:
            conn.rollback()
    finally:
        if conn:
            conn.close()
            print("Database connection closed.")

if __name__ == "__main__":
    action = input("Enter 'setup' to setup database or 'reset' to reset database: ").lower()
    if action == 'reset':
        reset_database()
    elif action == 'setup':
        setup_database()
    else:
        print("Invalid action. Use 'setup' or 'reset'.")
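A usage sketch for the schema above, not in the repository: persisting one generated flashcard set through the module's own `get_db_connection()`. The `save_flashcard_set` helper, the import path, and the sample data are illustrative assumptions (in this archived copy the module sits under `prev_backend_v0/`).

```python
from psycopg2.extras import Json

from backend.database import get_db_connection  # assumed import path, matching main.py

def save_flashcard_set(user_id: int, query: str, flashcards: list) -> int:
    """Insert a set row plus one row per flashcard; returns the new set id."""
    conn = get_db_connection()
    try:
        with conn.cursor() as cur:
            # Parent row keeps the raw query and the whole JSON array (JSONB column).
            cur.execute(
                "INSERT INTO flashcard_sets (user_id, query, flashcards) "
                "VALUES (%s, %s, %s) RETURNING id;",
                (user_id, query, Json(flashcards)),
            )
            set_id = cur.fetchone()[0]
            # Child rows, one per card, cascade-deleted with the set.
            for card in flashcards:
                cur.execute(
                    "INSERT INTO generated_flashcards (set_id, word, definition, example) "
                    "VALUES (%s, %s, %s, %s);",
                    (set_id, card["word"], card["definition"], card.get("example")),
                )
        conn.commit()
        return set_id
    finally:
        conn.close()
```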
prev_backend_v0/backend/main.py
ADDED
@@ -0,0 +1,155 @@
from fastapi import FastAPI, HTTPException
from fastapi.responses import JSONResponse
from fastapi.middleware.cors import CORSMiddleware
from pydantic import BaseModel
from backend.utils import generate_completions
from backend import config
from backend.database import get_db_connection
import psycopg2
from psycopg2.extras import RealDictCursor
from typing import Union, List, Literal, Optional
import logging
import json

logging.basicConfig(level=logging.INFO)

app = FastAPI()

# Add CORS middleware
app.add_middleware(
    CORSMiddleware,
    allow_origins=["*"],  # Allows all origins
    allow_credentials=True,
    allow_methods=["*"],  # Allows all methods
    allow_headers=["*"],  # Allows all headers
)

# Dependency to get database connection
async def get_db():
    conn = await get_db_connection()
    try:
        yield conn
    finally:
        conn.close()

# class GenerationRequest(BaseModel):
#     user_id: int
#     query: str

class Message(BaseModel):
    role: Literal["user", "assistant"]
    content: str

class GenerationRequest(BaseModel):
    user_id: int
    query: Union[str, List[Message]]

class MetadataRequest(BaseModel):
    query: str

# Global metadata variables
native_language: Optional[str] = None
target_language: Optional[str] = None
proficiency: Optional[str] = None

@app.get("/")
async def root():
    return {"message": "Welcome to the AI Learning Assistant API!"}

@app.post("/extract/metadata")
async def extract_metadata(data: MetadataRequest):
    try:
        response_str = await generate_completions.get_completions(
            data.query,
            config.language_metadata_extraction_prompt
        )
        metadata_dict = json.loads(response_str)
        # Update globals for other endpoints
        globals()['native_language'] = metadata_dict.get('native_language', 'unknown')
        globals()['target_language'] = metadata_dict.get('target_language', 'unknown')
        globals()['proficiency'] = metadata_dict.get('proficiency_level', 'unknown')
        return JSONResponse(
            content={
                "data": metadata_dict,
                "type": "language_metadata",
                "status": "success"
            },
            status_code=200
        )
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))

@app.post("/generate/flashcards")
async def generate_flashcards(data: GenerationRequest):
    try:
        # Use previously extracted metadata
        instructions = (
            config.flashcard_mode_instructions
            .replace("{native_language}", native_language or "unknown")
            .replace("{target_language}", target_language or "unknown")
            .replace("{proficiency}", proficiency or "unknown")
        )
        response = await generate_completions.get_completions(
            data.query,
            instructions
        )
        return JSONResponse(
            content={
                "data": response,
                "type": "flashcards",
                "status": "success"
            },
            status_code=200
        )
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))

@app.post("/generate/exercises")
async def generate_exercises(data: GenerationRequest):
    try:
        # Use previously extracted metadata
        instructions = (
            config.exercise_mode_instructions
            .replace("{native_language}", native_language or "unknown")
            .replace("{target_language}", target_language or "unknown")
            .replace("{proficiency}", proficiency or "unknown")
        )
        response = await generate_completions.get_completions(
            data.query,
            instructions
        )
        return JSONResponse(
            content={
                "data": response,
                "type": "exercises",
                "status": "success"
            },
            status_code=200
        )
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))

@app.post("/generate/simulation")
async def generate_simulation(data: GenerationRequest):
    try:
        # Use previously extracted metadata
        instructions = (
            config.simulation_mode_instructions
            .replace("{native_language}", native_language or "unknown")
            .replace("{target_language}", target_language or "unknown")
            .replace("{proficiency}", proficiency or "unknown")
        )
        response = await generate_completions.get_completions(
            data.query,
            instructions
        )
        return JSONResponse(
            content={
                "data": response,
                "type": "simulation",
                "status": "success"
            },
            status_code=200
        )
    except Exception as e:
        raise HTTPException(status_code=500, detail=str(e))
prev_backend_v0/backend/utils/__pycache__/generate_completions.cpython-310.pyc
ADDED
Binary file (2.55 kB).

prev_backend_v0/backend/utils/__pycache__/generate_completions.cpython-312.pyc
ADDED
Binary file (3.69 kB).
prev_backend_v0/backend/utils/generate_completions.py
ADDED
@@ -0,0 +1,106 @@
from openai import AsyncOpenAI, OpenAI
import asyncio
import json
from typing import AsyncIterator
from typing import Union, List, Dict, Literal
from dotenv import load_dotenv
import os
from pydantic import BaseModel
load_dotenv()

# Initialize the async client
client = AsyncOpenAI(
    base_url=os.getenv("BASE_URL"),
    api_key=os.getenv("API_KEY"),
)

class Message(BaseModel):
    role: Literal["user", "assistant"]
    content: str

# Helper function to flatten chat messages into a single string prompt
def flatten_messages(messages: List[Message]) -> str:
    return "\n".join([f"{m.role}: {m.content}" for m in messages])

def process_input(data: Union[str, List[Dict[str, str]]]) -> Union[str, List[Dict[str, str]]]:
    """
    Processes input to either uppercase a string or modify the 'content' field
    of a list of dictionaries.
    """
    if isinstance(data, str):
        return data.strip()  # Ensures prompt is cleaned up (optional)

    elif isinstance(data, list):
        # Ensure each item in the list is a dictionary with a 'content' key
        return [
            {**item, "content": item["content"].strip()}  # Trims whitespace in 'content'
            for item in data if isinstance(item, dict) and "content" in item
        ]

    else:
        raise TypeError("Input must be a string or a list of dictionaries with a 'content' field")


# async def get_completions(
#     prompt: Union[str, List[Dict[str, str]]],
#     instructions: str
# ) -> str:
#     processed_prompt = process_input(prompt)  # Ensures the input format is correct

#     if isinstance(processed_prompt, str):
#         messages = [
#             {"role": "system", "content": instructions},
#             {"role": "user", "content": processed_prompt}
#         ]
#     elif isinstance(processed_prompt, list):
#         messages = [{"role": "system", "content": instructions}] + processed_prompt
#     else:
#         raise TypeError("Unexpected processed input type.")

#     response = await client.chat.completions.create(
#         model=os.getenv("MODEL"),
#         messages=messages,
#         response_format={"type": "json_object"}
#     )

#     output: str = response.choices[0].message.content
#     return output

async def get_completions(
    prompt: Union[str, List[Dict[str, str]]],
    instructions: str
) -> str:
    if isinstance(prompt, list):
        formatted_query = flatten_messages(prompt)
    else:
        formatted_query = prompt

    processed_prompt = process_input(formatted_query)

    messages = [{"role": "system", "content": instructions}]

    if isinstance(processed_prompt, str):
        messages.append({"role": "user", "content": processed_prompt})

    elif isinstance(processed_prompt, list):
        # Only keep the history for context and append the latest user query at the end
        history = processed_prompt[:-1]
        last_user_msg = processed_prompt[-1]

        # Optional: Validate that the last message is from the user
        if last_user_msg.get("role") != "user":
            raise ValueError("Last message must be from the user.")

        messages += history
        messages.append(last_user_msg)

    else:
        raise TypeError("Unexpected processed input type.")

    response = await client.chat.completions.create(
        model=os.getenv("MODEL"),
        messages=messages,
        response_format={"type": "json_object"}
    )

    return response.choices[0].message.content  # adjust based on your client
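A usage sketch for this module, not in the repository: calling `get_completions` with a chat history of `Message` objects, which `flatten_messages` collapses into a single "role: content" prompt string before the system instructions are prepended. It assumes `BASE_URL`, `API_KEY` and `MODEL` are set in the environment, as the module expects; the import path and the sample messages are hypothetical (in this archived copy the module lives under `prev_backend_v0/`).

```python
import asyncio

from backend.utils import generate_completions  # assumed import path, matching main.py

# Hypothetical conversation history; pydantic Message objects, as main.py would pass them.
history = [
    generate_completions.Message(role="user", content="Flashcards for landscape photography in German"),
    generate_completions.Message(role="assistant", content="[...previously generated flashcards...]"),
    generate_completions.Message(role="user", content="More advanced ones, please"),
]

async def demo() -> None:
    # The history is flattened to one prompt string and sent with the given instructions.
    output = await generate_completions.get_completions(
        history,
        "Reply with a valid JSON array of flashcards.",
    )
    print(output)

if __name__ == "__main__":
    asyncio.run(demo())
```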