Spaces:

mikaelJ46
/

GoeHistBusn

Sleeping

File size: 41,335 Bytes

# --------------------------------------------------------------
# IGCSE Platform – Enhanced Past Papers System with Question Search
# Models: Gemini 2.5 (Primary) → Cohere → Z.ai → MiniMax (Fallbacks)
# --------------------------------------------------------------

import os
import json
from datetime import datetime
import gradio as gr
import PyPDF2
import time
import re
from PIL import Image
import io

# ---------- 1. Configure ALL AI Systems ----------
# Gemini (Primary)
try:
    import google.generativeai as genai
    genai.configure(api_key=os.getenv("GEMINI_API_KEY"))
    gemini_model = genai.GenerativeModel('gemini-2.5-pro')
    print("✅ Gemini AI initialized successfully (PRIMARY)")
except Exception as e:
    print(f"❌ Error initializing Gemini: {e}")
    gemini_model = None

# Cohere (Secondary)
try:
    import cohere
    cohere_client = cohere.Client(os.getenv("COHERE_API_KEY"))
    print("✅ Cohere initialized successfully (SECONDARY)")
except Exception as e:
    print(f"❌ Error initializing Cohere: {e}")
    cohere_client = None

# Z.ai (Tertiary)
try:
    from huggingface_hub import InferenceClient
    zai_client = InferenceClient(
        provider="novita",
        api_key=os.environ.get("HF_TOKEN"),
    )
    print("✅ Z.ai GLM-4.6 initialized successfully (TERTIARY)")
except Exception as e:
    print(f"❌ Error initializing Z.ai: {e}")
    zai_client = None

# MiniMax (Final Fallback)
try:
    minimax_client = InferenceClient(
        provider="novita",
        api_key=os.environ.get("HF_TOKEN"),
    )
    print("✅ MiniMax AI initialized successfully (FINAL FALLBACK)")
except Exception as e:
    print(f"❌ Error initializing MiniMax: {e}")
    minimax_client = None

# ---------- 2. Unified AI Function with Smart Fallback ----------
def ask_ai(prompt, temperature=0.7, max_retries=2):
    """
    Try models in order: Gemini → Cohere → Z.ai → MiniMax
    Returns: (response_text, source_name)
    """
    last_error = None
    
    # Try Gemini first (Primary)
    if gemini_model:
        for attempt in range(max_retries):
            try:
                response = gemini_model.generate_content(
                    prompt,
                    generation_config=genai.types.GenerationConfig(
                        temperature=temperature,
                    )
                )
                return response.text, "gemini"
            except Exception as e:
                last_error = e
                print(f"⚠ Gemini attempt {attempt+1} failed: {str(e)}")
                if attempt < max_retries - 1:
                    time.sleep(1)
    
    # Try Cohere (Secondary)
    if cohere_client:
        for attempt in range(max_retries):
            try:
                response = cohere_client.chat(
                    model="command-r-plus-08-2024",
                    message=prompt,
                    temperature=temperature
                )
                return response.text, "cohere"
            except Exception as e:
                last_error = e
                print(f"⚠ Cohere attempt {attempt+1} failed: {str(e)}")
                if attempt < max_retries - 1:
                    time.sleep(1)
    
    # Try Z.ai (Tertiary)
    if zai_client:
        for attempt in range(max_retries):
            try:
                completion = zai_client.chat.completions.create(
                    model="zai-org/GLM-4.6",
                    messages=[{"role": "user", "content": prompt}],
                    temperature=temperature
                )
                return completion.choices[0].message.content, "zai"
            except Exception as e:
                last_error = e
                print(f"⚠ Z.ai attempt {attempt+1} failed: {str(e)}")
                if attempt < max_retries - 1:
                    time.sleep(1)
    
    # Try MiniMax (Final Fallback)
    if minimax_client:
        try:
            completion = minimax_client.chat.completions.create(
                model="MiniMaxAI/MiniMax-M2",
                messages=[{"role": "user", "content": prompt}],
                temperature=temperature
            )
            return completion.choices[0].message.content, "minimax"
        except Exception as e:
            last_error = e
            print(f"⚠ MiniMax fallback failed: {str(e)}")
    
    # All failed
    error_msg = f"❌ Error: All AI services failed. Last error: {str(last_error)}"
    return error_msg, "error"

# ---------- 3. Enhanced Global Storage ----------
papers_storage = []
pdf_content_storage = {}
insert_storage = {}  # Store insert images/documents
questions_index = []  # Index of all extracted questions
ADMIN_PASSWORD = "@mikaelJ46"

# ---------- 4. Topic lists ----------
geography_topics = [
    "Population & Settlement", "Migration", "Urbanisation", "Rural Settlements",
    "Natural Hazards: Earthquakes", "Natural Hazards: Volcanoes", "Natural Hazards: Tropical Storms",
    "Rivers & Flooding", "Coasts & Coastal Management", "Weather & Climate",
    "Climate Change", "Ecosystems: Tropical Rainforests", "Ecosystems: Hot Deserts",
    "Economic Development", "Industry & Manufacturing", "Tourism", "Energy Resources",
    "Water Resources", "Agriculture & Food Production", "Environmental Risks",
    "Map Skills & Fieldwork", "GIS & Technology", "Sustainability"
]

history_topics = [
    "WWI: Causes & Origins", "WWI: Key Events & Battles", "WWI: Treaty of Versailles",
    "WWII: Causes", "WWII: Key Events", "WWII: Holocaust", "WWII: Impact & Consequences",
    "Cold War: Origins", "Cold War: Key Events", "Cold War: Cuban Missile Crisis",
    "Russian Revolution 1917", "Rise of Stalin", "Nazi Germany: Hitler's Rise",
    "Nazi Germany: Policies", "Nazi Germany: Life in Nazi Germany",
    "USA 1919-1941: Boom & Depression", "USA: New Deal", "USA: Civil Rights Movement",
    "China: Communist Revolution", "China: Mao's China",
    "Decolonisation", "United Nations", "Arab-Israeli Conflict",
    "Vietnam War", "Historical Skills & Sources", "Causation & Consequence"
]

business_topics = [
    "Business Activity & Types", "Business Objectives", "Stakeholders",
    "Business Structure & Organisation", "Recruitment & Selection", "Training & Development",
    "Motivation Theory", "Leadership & Management Styles", "Communication",
    "Marketing: Market Research", "Marketing Mix: Product", "Marketing Mix: Price",
    "Marketing Mix: Place", "Marketing Mix: Promotion", "Marketing Strategy",
    "Production Methods", "Quality Management", "Location Decisions",
    "Finance: Sources of Finance", "Finance: Cash Flow", "Finance: Break-even Analysis",
    "Finance: Financial Statements", "Business Growth", "Economics: Supply & Demand",
    "Economics: Market Structure", "International Business", "Business Ethics & Sustainability"
]

# ---------- 5. Enhanced PDF Processing with Question Extraction & Paper Intelligence ----------

def extract_text_from_pdf(pdf_file):
    """Extract text from uploaded PDF file"""
    if pdf_file is None:
        return ""
    try:
        pdf_reader = PyPDF2.PdfReader(pdf_file)
        text = ""
        for page in pdf_reader.pages:
            text += page.extract_text() + "\n"
        return text
    except Exception as e:
        return f"Error extracting PDF: {e}"

def identify_paper_details(text, filename):
    """Use AI to identify paper year, series, variant, and subject from content"""
    # Extract first 2000 characters for analysis
    sample_text = text[:2000] if len(text) > 2000 else text
    
    prompt = f"""Analyze this IGCSE past paper and identify its details.

Filename: {filename}
Paper Text Sample:
{sample_text}

Identify and return ONLY a JSON object with:
- subject: The subject name (e.g., "Mathematics", "Physics", "Chemistry", "Biology", "Geography", "History", "Business")
- year: The year (e.g., "2023", "2022")
- series: The exam series (e.g., "June", "November", "March", "May/June")
- variant: The paper variant (e.g., "1", "2", "3" or "11", "12", "21", "22")
- paper_number: The paper number (e.g., "1", "2", "3", "4")
- syllabus_code: If visible (e.g., "0580", "0625", "0610")

Look for patterns like:
- "June 2023" or "November 2022"
- "Paper 2 Variant 1" or "Paper 21"
- Subject codes like "0580/21/M/J/23"

Return ONLY valid JSON (no markdown):
{{"subject": "...", "year": "...", "series": "...", "variant": "...", "paper_number": "...", "syllabus_code": "..."}}"""
    
    try:
        response, _ = ask_ai(prompt, temperature=0.1)
        clean_txt = response.replace("```json", "").replace("```", "").strip()
        details = json.loads(clean_txt)
        return details
    except Exception as e:
        print(f"Error identifying paper details: {e}")
        # Fallback to filename parsing
        return parse_filename_for_details(filename)

def parse_filename_for_details(filename):
    """Fallback: Parse filename for paper details"""
    import re
    
    details = {
        "subject": "Unknown",
        "year": "Unknown",
        "series": "Unknown",
        "variant": "Unknown",
        "paper_number": "Unknown",
        "syllabus_code": "Unknown"
    }
    
    # Common patterns in IGCSE filenames
    # e.g., "0580_w23_qp_21.pdf" or "Physics_June_2023_P2.pdf"
    
    # Try to extract year
    year_match = re.search(r'(20\d{2})|(\d{2}(?=_[wsmj]|[WS]))', filename)
    if year_match:
        year = year_match.group(1) or ("20" + year_match.group(2))
        details["year"] = year
    
    # Try to extract series
    if re.search(r'[Jj]une?|[Mm]ay[_/-]?[Jj]une?|mj|MJ', filename):
        details["series"] = "May/June"
    elif re.search(r'[Nn]ov(ember)?|ON', filename):
        details["series"] = "October/November"
    elif re.search(r'[Mm]ar(ch)?|FM', filename):
        details["series"] = "February/March"
    
    # Try to extract variant
    variant_match = re.search(r'[Vv]ariant[_\s]?(\d)|[Pp]aper[_\s]?(\d{1,2})|_qp_(\d{1,2})', filename)
    if variant_match:
        details["variant"] = variant_match.group(1) or variant_match.group(2) or variant_match.group(3)
    
    # Try to extract syllabus code
    code_match = re.search(r'\b(0\d{3})\b', filename)
    if code_match:
        details["syllabus_code"] = code_match.group(1)
        # Map code to subject
        code_subject_map = {
            '0580': 'Mathematics', '0625': 'Physics', '0610': 'Biology',
            '0620': 'Chemistry', '0460': 'Geography', '0455': 'Economics',
            '0450': 'Business Studies', '0470': 'History'
        }
        details["subject"] = code_subject_map.get(code_match.group(1), "Unknown")
    
    return details

def extract_questions_from_text(text, paper_id, paper_title, subject, paper_details):
    """Use AI to intelligently extract questions from past paper text"""
    if not text or len(text) < 100:
        return []
    
    prompt = f"""Analyze this IGCSE {subject} past paper and extract ALL questions.

Paper Details:
- Subject: {subject}
- Year: {paper_details.get('year', 'Unknown')}
- Series: {paper_details.get('series', 'Unknown')}
- Paper: {paper_details.get('paper_number', 'Unknown')}
- Variant: {paper_details.get('variant', 'Unknown')}

Paper Text:
{text[:8000]}

Extract each question and return as JSON array. For each question include:
- question_number (e.g., "1(a)", "2(b)(i)")
- question_text (the complete question)
- marks (number of marks)
- topic (what IGCSE topic this relates to)
- requires_insert (true/false - does it reference Fig., Source, Table, etc?)

Return ONLY valid JSON array (no markdown):
[{{"question_number": "1(a)", "question_text": "...", "marks": 4, "topic": "...", "requires_insert": false}}, ...]

If text is incomplete, extract what you can find."""
    
    try:
        response, _ = ask_ai(prompt, temperature=0.2)
        clean_txt = response.replace("```json", "").replace("```", "").strip()
        questions = json.loads(clean_txt)
        
        # Add metadata to each question including paper details
        for q in questions:
            q['paper_id'] = paper_id
            q['paper_title'] = paper_title
            q['subject'] = subject
            q['year'] = paper_details.get('year', 'Unknown')
            q['series'] = paper_details.get('series', 'Unknown')
            q['variant'] = paper_details.get('variant', 'Unknown')
            q['paper_number'] = paper_details.get('paper_number', 'Unknown')
            q['syllabus_code'] = paper_details.get('syllabus_code', 'Unknown')
        
        return questions
    except Exception as e:
        print(f"Error extracting questions: {e}")
        # Fallback: simple regex extraction
        return extract_questions_fallback(text, paper_id, paper_title, subject, paper_details)

def extract_questions_fallback(text, paper_id, paper_title, subject, paper_details):
    """Fallback method using regex patterns"""
    questions = []
    # Pattern for question numbers like "1(a)", "2(b)(i)", "3", etc.
    pattern = r'(\d+(?:\([a-z]\))?(?:\([ivx]+\))?)\s+(.{20,500}?)\[(\d+)\]'
    matches = re.finditer(pattern, text, re.IGNORECASE)
    
    for match in matches:
        q_num = match.group(1)
        q_text = match.group(2).strip()
        marks = int(match.group(3))
        
        questions.append({
            'question_number': q_num,
            'question_text': q_text,
            'marks': marks,
            'topic': 'General',
            'requires_insert': bool(re.search(r'Fig\.|Source|Table|Insert|Photograph', q_text, re.IGNORECASE)),
            'paper_id': paper_id,
            'paper_title': paper_title,
            'subject': subject,
            'year': paper_details.get('year', 'Unknown'),
            'series': paper_details.get('series', 'Unknown'),
            'variant': paper_details.get('variant', 'Unknown'),
            'paper_number': paper_details.get('paper_number', 'Unknown'),
            'syllabus_code': paper_details.get('syllabus_code', 'Unknown')
        })
    
    return questions

def process_insert_file(insert_file):
    """Process insert file (PDF or image)"""
    if insert_file is None:
        return None, None
    
    try:
        file_name = insert_file.name
        file_ext = file_name.lower().split('.')[-1]
        
        if file_ext == 'pdf':
            # Extract text and try to get images from PDF
            text = extract_text_from_pdf(insert_file)
            return text, "pdf"
        elif file_ext in ['jpg', 'jpeg', 'png', 'gif']:
            # Store image
            image = Image.open(insert_file)
            return image, "image"
        else:
            return None, None
    except Exception as e:
        print(f"Error processing insert: {e}")
        return None, None

# ---------- 6. AI Tutor with Multi-Model Support ----------
def ai_tutor_chat(message, history, subject, topic):
    if not message.strip():
        return history

    subject_context = {
        "Geography": "You are an expert IGCSE Geography tutor. Focus on physical and human geography, case studies, map skills, and geographical skills. Use real-world examples and encourage critical thinking about global issues.",
        "History": "You are an expert IGCSE History tutor. Focus on historical analysis, source evaluation, causation, consequence, and continuity/change. Encourage evidence-based arguments and historical context.",
        "Business": "You are an expert IGCSE Business Studies tutor. Focus on business concepts, real-world applications, case studies, and analytical skills. Help students understand business decisions and their impacts."
    }

    system = f"""{subject_context[subject]}
Focus on {topic or 'any topic'}. Be encouraging, clear, and pedagogical.
Provide detailed explanations with examples and real-world applications.
Use case studies where appropriate and help students develop exam skills.
Encourage critical thinking and analytical skills."""
    
    # Build conversation context
    conversation = ""
    for user_msg, bot_msg in history[-5:]:
        if user_msg:
            conversation += f"Student: {user_msg}\n"
        if bot_msg:
            clean_msg = bot_msg.replace("🔵 ", "").replace("🟢 ", "").replace("🟣 ", "")
            conversation += f"Tutor: {clean_msg}\n"
    
    conversation += f"Student: {message}\nTutor:"
    full_prompt = f"{system}\n\nConversation:\n{conversation}"
    
    bot_response, source = ask_ai(full_prompt, temperature=0.7)
    
    # Add source indicator if not from Gemini
    if source == "cohere":
        bot_response = f"🔵 {bot_response}"
    elif source == "zai":
        bot_response = f"🟢 {bot_response}"
    elif source == "minimax":
        bot_response = f"🟣 {bot_response}"
    
    history.append((message, bot_response))
    return history

def clear_chat():
    return []

# ---------- 7. Case Study Generator ----------
def generate_case_study(subject, topic):
    if not topic:
        return "Select a topic first!"
    
    prompt = f"""Create a detailed IGCSE {subject} case study for the topic: "{topic}".

The case study should include:
1. Real-world example or location (be specific)
2. Background context and key facts
3. Relevant data and statistics
4. Analysis points and key issues
5. Different perspectives/stakeholders
6. Impacts (economic, social, environmental where relevant)
7. Exam-style questions students could practice

Make it engaging, factual, and exam-relevant for IGCSE level."""
    
    response, source = ask_ai(prompt, temperature=0.6)
    
    if source in ["cohere", "zai", "minimax"]:
        response = f"{response}\n\n_[Generated by {source.title()}]_"
    
    return response

# ---------- 8. Source Analysis (for History) ----------
def analyze_source(source_text, question):
    if not source_text.strip():
        return "Enter a source to analyze."
    
    prompt = f"""As an IGCSE History examiner, analyze this historical source:

SOURCE:
{source_text}

QUESTION: {question if question else "Evaluate the usefulness of this source for a historian studying this period."}

Provide:
1. **Content Analysis**: What information does the source provide?
2. **Provenance**: Origin, author, date, audience, purpose (if determinable)
3. **Reliability**: How reliable is this source? What are its limitations?
4. **Usefulness**: How useful is it for historians? What can/can't it tell us?
5. **Context**: What historical context is needed to understand this source?
6. **Cross-reference**: What other sources would help verify/challenge this?

Use IGCSE History exam criteria and techniques."""
    
    response, source = ask_ai(prompt, temperature=0.4)
    
    if source in ["cohere", "zai", "minimax"]:
        response = f"{response}\n\n_[Analysis by {source.title()}]_"
    
    return response

# ---------- 9. Business Calculator ----------
def business_calculator(calc_type, values):
    """Handle business calculations with AI explanation"""
    
    calculations = {
        "Break-even": "Fixed Costs ÷ (Selling Price - Variable Cost per unit)",
        "Profit": "Total Revenue - Total Costs",
        "Gross Profit Margin": "(Gross Profit ÷ Revenue) × 100",
        "Net Profit Margin": "(Net Profit ÷ Revenue) × 100",
        "Market Share": "(Company Sales ÷ Total Market Sales) × 100",
        "Return on Investment": "((Profit - Investment) ÷ Investment) × 100"
    }
    
    prompt = f"""Explain how to calculate {calc_type} in IGCSE Business Studies.

Formula: {calculations.get(calc_type, "Standard business formula")}

Given values: {values}

Provide:
1. Step-by-step calculation
2. Clear explanation of what each component means
3. What the result tells us about the business
4. How this metric is used in business decisions
5. Limitations of this metric"""
    
    response, source = ask_ai(prompt, temperature=0.3)
    
    if source in ["cohere", "zai", "minimax"]:
        response = f"{response}\n\n_[Explained by {source.title()}]_"
    
    return response

# ---------- 10. Practice Questions (Enhanced with PDF context) ----------
def generate_question(subject, topic):
    if not topic:
        return "Select a topic!", "", ""
    
    # Get relevant PDF content if available
    pdf_context = ""
    for paper_id, content in pdf_content_storage.items():
        paper = next((p for p in papers_storage if p['id'] == paper_id), None)
        if paper and paper['subject'] == subject:
            pdf_context += f"\n\nReference material from {paper['title']}:\n{content[:3000]}"
    
    question_guidance = {
        "Geography": "Include command words (describe, explain, evaluate). May require case study knowledge or map interpretation.",
        "History": "Include source material or ask about causation/consequence. Test historical analysis and evaluation skills.",
        "Business": "Include a business scenario or data. Test application of business concepts and analytical skills."
    }
    
    prompt = f"""Create ONE high-quality IGCSE {subject} exam question on the topic: "{topic}".
{question_guidance[subject]}
{"Base the question style on this reference material:" + pdf_context if pdf_context else "Create an authentic exam-style question."}

The question should:
- Use appropriate exam command words
- Be worth 6-8 marks
- Test both knowledge and analysis/evaluation
- Include any necessary context or data
- Be answerable in 8-12 minutes

Return ONLY valid JSON (no markdown):
{{"question": "complete question with context", "expectedAnswer": "key points a good answer should include", "markScheme": "detailed marking criteria with mark allocations"}}"""
    
    response, source = ask_ai(prompt, temperature=0.4)
    
    try:
        clean_txt = response.replace("```json", "").replace("```", "").strip()
        data = json.loads(clean_txt)
        return data["question"], data.get("expectedAnswer", ""), data.get("markScheme", "")
    except Exception as e:
        return response, "", f"Error: {e}"

def check_answer(question, expected, user_answer, subject):
    if not user_answer.strip():
        return "Write your answer first!"
    
    subject_criteria = {
        "Geography": "geographical knowledge, case study examples, use of terminology, analysis of causes/effects/solutions",
        "History": "historical knowledge, use of sources/evidence, analysis of causation/consequence, balanced evaluation",
        "Business": "business knowledge, application to scenarios, analysis using business concepts, justified recommendations"
    }
    
    prompt = f"""Evaluate this IGCSE {subject} answer using exam board criteria:

Question: {question}
Expected: {expected}

Student's answer:
{user_answer}

Assess based on: {subject_criteria[subject]}

Return JSON (no markdown):
{{"isCorrect": true/false, "score": 0-100, "marks": "X/8", "feedback": "detailed feedback on content and exam technique", "improvements": "specific suggestions", "strengths": "what was done well", "examTips": "exam-specific advice"}}"""
    
    response, source = ask_ai(prompt, temperature=0.3)
    
    try:
        clean_txt = response.replace("```json", "").replace("```", "").strip()
        fb = json.loads(clean_txt)
        result = f"""📊 Score: {fb.get('score', 'N/A')}% ({fb.get('marks', 'N/A')})

📝 Detailed Feedback:
{fb['feedback']}

✅ Your Strengths:
{fb.get('strengths', 'Good effort!')}

📈 How to Improve:
{fb['improvements']}

💡 Exam Tips:
{fb.get('examTips', 'Keep practicing!')}"""
        
        if source in ["cohere", "zai", "minimax"]:
            result += f"\n\n_[Graded by {source.title()}]_"
        
        return result
    except Exception:
        return response

# ---------- 11. Enhanced Past Papers System with Paper Intelligence ----------
def search_questions_by_topic(subject, topic):
    """Search for questions matching a specific topic"""
    if not questions_index:
        return "📭 No questions available yet. Admin needs to upload past papers first!"
    
    # Filter questions
    matching = [q for q in questions_index 
                if q['subject'] == subject and 
                (topic.lower() in q['topic'].lower() or topic.lower() in q['question_text'].lower())]
    
    if not matching:
        return f"📭 No questions found for {topic} in {subject}. Try a different topic or broader search."
    
    # Format output with paper details
    result = f"### 🎯 Found {len(matching)} question(s) on '{topic}' in {subject}\n\n"
    
    for i, q in enumerate(matching, 1):
        insert_note = " 🖼️ **[Requires Insert]**" if q.get('requires_insert') else ""
        
        # Enhanced paper info display
        paper_info = f"**{q['year']} {q['series']}** - Paper {q['paper_number']}"
        if q.get('variant') != 'Unknown':
            paper_info += f" Variant {q['variant']}"
        if q.get('syllabus_code') != 'Unknown':
            paper_info += f" ({q['syllabus_code']})"
        
        result += f"""**Question {i}** - {paper_info}
📝 **{q['question_number']}** [{q['marks']} marks]{insert_note}
{q['question_text']}

{'─'*80}
"""
    
    return result

def get_paper_insert(paper_id):
    """Retrieve insert for a specific paper"""
    if paper_id in insert_storage:
        insert_data, insert_type = insert_storage[paper_id]
        if insert_type == "image":
            return insert_data, "Image insert loaded ✅"
        elif insert_type == "pdf":
            return None, f"Insert text:\n\n{insert_data[:2000]}..."
    return None, "No insert available for this paper"

def view_papers_student(subject):
    """View all papers for a subject with detailed information"""
    filtered = [p for p in papers_storage if p["subject"] == subject]
    if not filtered:
        return f"📭 No {subject} papers available."
    
    result = ""
    for p in filtered:
        insert_note = " 🖼️ Insert Available" if p['id'] in insert_storage else ""
        q_count = len([q for q in questions_index if q['paper_id'] == p['id']])
        
        # Get paper details
        paper_details = p.get('paper_details', {})
        year = paper_details.get('year', 'Unknown')
        series = paper_details.get('series', 'Unknown')
        variant = paper_details.get('variant', 'Unknown')
        paper_num = paper_details.get('paper_number', 'Unknown')
        syllabus = paper_details.get('syllabus_code', 'Unknown')
        
        paper_info = f"**{year} {series}** - Paper {paper_num}"
        if variant != 'Unknown':
            paper_info += f" Variant {variant}"
        if syllabus != 'Unknown':
            paper_info += f" ({syllabus})"
        
        result += f"""**{p['title']}** {'📄 PDF' if p.get('has_pdf') else ''}{insert_note}
{paper_info}
⏰ Uploaded: {p['uploaded_at']} | 📝 {q_count} questions extracted
{p['content'][:200]}...

{'═'*80}
"""
    
    return result

# ---------- 12. Admin Functions with Enhanced Paper Processing ----------
def verify_admin_password(password):
    if password == ADMIN_PASSWORD:
        return gr.update(visible=True), gr.update(visible=False), "✅ Access granted!"
    return gr.update(visible=False), gr.update(visible=True), "❌ Incorrect password!"

def upload_paper(title, subject, content, pdf_file, insert_file):
    """Enhanced upload with AI-powered paper identification and question extraction"""
    if not all([title, subject, content]):
        return "⚠ Please fill all required fields!", get_papers_list(), "📊 Status: Waiting for upload"
    
    paper_id = len(papers_storage) + 1
    
    # Process PDF
    pdf_text = ""
    paper_details = {}
    if pdf_file is not None:
        pdf_text = extract_text_from_pdf(pdf_file)
        if pdf_text and not pdf_text.startswith("Error"):
            # Use AI to identify paper details
            paper_details = identify_paper_details(pdf_text, pdf_file.name)
            pdf_content_storage[paper_id] = pdf_text
            
            # Add paper details to content
            detail_str = f"\n\n📋 **Paper Details:**"
            detail_str += f"\n- Year: {paper_details.get('year', 'Unknown')}"
            detail_str += f"\n- Series: {paper_details.get('series', 'Unknown')}"
            detail_str += f"\n- Paper: {paper_details.get('paper_number', 'Unknown')}"
            detail_str += f"\n- Variant: {paper_details.get('variant', 'Unknown')}"
            if paper_details.get('syllabus_code') != 'Unknown':
                detail_str += f"\n- Syllabus Code: {paper_details.get('syllabus_code')}"
            content += detail_str
            content += f"\n[📄 PDF extracted: {len(pdf_text)} characters]"
    
    # Process Insert
    insert_data = None
    insert_type = None
    if insert_file is not None:
        insert_data, insert_type = process_insert_file(insert_file)
        if insert_data:
            insert_storage[paper_id] = (insert_data, insert_type)
            content += f"\n[🖼️ Insert attached: {insert_type}]"
    
    # Add paper to storage
    papers_storage.append({
        "id": paper_id,
        "title": title,
        "subject": subject,
        "content": content,
        "has_pdf": bool(pdf_text and not pdf_text.startswith("Error")),
        "has_insert": bool(insert_data),
        "paper_details": paper_details,
        "uploaded_at": datetime.now().strftime("%Y-%m-%d %H:%M")
    })
    
    # Extract questions from PDF using AI
    status_msg = "✅ Paper uploaded!"
    if pdf_text and not pdf_text.startswith("Error"):
        status_msg += "\n⏳ AI is extracting questions and analyzing paper structure..."
        questions = extract_questions_from_text(pdf_text, paper_id, title, subject, paper_details)
        questions_index.extend(questions)
        
        # Enhanced status with paper details
        paper_info = f"{paper_details.get('year', 'Unknown')} {paper_details.get('series', 'Unknown')}"
        if paper_details.get('variant') != 'Unknown':
            paper_info += f" Variant {paper_details.get('variant')}"
        
        status_msg += f"\n✅ Extracted {len(questions)} questions from **{paper_info}**!"
        status_msg += f"\n📋 Identified as: {subject} Paper {paper_details.get('paper_number', 'Unknown')}"
    
    return status_msg, get_papers_list(), f"📊 Total papers: {len(papers_storage)} | Total questions: {len(questions_index)}"

def get_papers_list():
    """Get formatted list of all papers with detailed information"""
    if not papers_storage:
        return "No papers yet."
    
    result = []
    for p in papers_storage:
        paper_details = p.get('paper_details', {})
        year = paper_details.get('year', 'Unknown')
        series = paper_details.get('series', 'Unknown')
        variant = paper_details.get('variant', 'Unknown')
        paper_num = paper_details.get('paper_number', 'Unknown')
        
        paper_info = f"{year} {series} - Paper {paper_num}"
        if variant != 'Unknown':
            paper_info += f" V{variant}"
        
        insert_icon = '🖼️ Insert' if p.get('has_insert') else ''
        pdf_icon = '📄 PDF' if p.get('has_pdf') else ''
        
        result.append(f"**{p['title']}** ({p['subject']}) {pdf_icon} {insert_icon}\n{paper_info}\n⏰ {p['uploaded_at']}\n{p['content'][:120]}...\n{'─'*60}")
    
    return "\n".join(result)

# ---------- 13. Gradio UI ----------
with gr.Blocks(theme=gr.themes.Soft(), title="IGCSE Platform") as app:
    gr.Markdown("""
    # 🎓 IGCSE Learning Platform
    Geography 🌍 | History 📜 | Business 💼
    _Powered by Gemini AI with intelligent multi-model fallback system_
    """)

    with gr.Tabs():
        # ───── STUDENT PORTAL ─────
        with gr.Tab("👨‍🎓 Student Portal"):
            with gr.Tabs():
                # AI TUTOR
                with gr.Tab("🤖 AI Tutor"):
                    gr.Markdown("### Chat with Your AI Tutor\n*Get expert help in Geography, History, or Business*")
                    with gr.Row():
                        subj = gr.Radio(["Geography", "History", "Business"], label="Subject", value="Geography")
                        topc = gr.Dropdown(geography_topics, label="Topic (optional)", allow_custom_value=True)

                    def update_topics(s):
                        topics = {"Geography": geography_topics, "History": history_topics, "Business": business_topics}
                        return gr.Dropdown(choices=topics[s], value=None)
                    subj.change(update_topics, subj, topc)

                    chat = gr.Chatbot(height=450, show_label=False)
                    txt = gr.Textbox(placeholder="Ask anything... e.g., 'Explain causes of earthquakes' or 'What led to WWI?'", label="Message")
                    with gr.Row():
                        send = gr.Button("Send 📤", variant="primary")
                        clr = gr.Button("Clear 🗑")
                    send.click(ai_tutor_chat, [txt, chat, subj, topc], chat)
                    txt.submit(ai_tutor_chat, [txt, chat, subj, topc], chat)
                    clr.click(clear_chat, outputs=chat)

                # PAST PAPERS BROWSER - NEW!
                with gr.Tab("📚 Past Papers Browser"):
                    gr.Markdown("""### 🎯 Search Real Exam Questions by Topic
*Find actual IGCSE questions from uploaded past papers*""")
                    
                    with gr.Row():
                        pp_subject = gr.Radio(["Geography", "History", "Business"], label="Subject", value="Geography")
                        pp_topic = gr.Dropdown(geography_topics, label="Select Topic")
                    
                    pp_subject.change(update_topics, pp_subject, pp_topic)
                    
                    search_btn = gr.Button("🔍 Search Questions", variant="primary", size="lg")
                    questions_output = gr.Markdown(label="Questions Found", value="Select a topic and click Search")
                    
                    search_btn.click(search_questions_by_topic, [pp_subject, pp_topic], questions_output)
                    
                    gr.Markdown("---\n### 📄 Browse All Papers")
                    browse_subject = gr.Radio(["Geography", "History", "Business"], label="Subject", value="Geography")
                    papers_display = gr.Markdown(label="Available Papers")
                    gr.Button("📖 Show All Papers").click(view_papers_student, browse_subject, papers_display)

                # CASE STUDIES
                with gr.Tab("📋 Case Studies"):
                    gr.Markdown("### Generate Detailed Case Studies")
                    with gr.Row():
                        cs_subj = gr.Radio(["Geography", "History", "Business"], label="Subject", value="Geography")
                        cs_topic = gr.Dropdown(geography_topics, label="Topic")
                    cs_subj.change(update_topics, cs_subj, cs_topic)
                    cs_output = gr.Textbox(lines=20, label="Case Study", interactive=False)
                    gr.Button("🔍 Generate Case Study", variant="primary").click(
                        generate_case_study, [cs_subj, cs_topic], cs_output
                    )

                # SOURCE ANALYSIS (History)
                with gr.Tab("📜 Source Analysis"):
                    gr.Markdown("### Historical Source Analysis Tool")
                    source_text = gr.Textbox(lines=8, label="📄 Paste Historical Source", 
                                            placeholder="Paste the source text here (e.g., extract from a speech, letter, document...)")
                    source_q = gr.Textbox(label="❓ Question (optional)", 
                                         placeholder="e.g., 'How useful is this source for understanding...?'")
                    source_output = gr.Textbox(lines=16, label="Analysis", interactive=False)
                    gr.Button("🔍 Analyze Source", variant="primary").click(
                        analyze_source, [source_text, source_q], source_output
                    )

                # BUSINESS CALCULATOR
                with gr.Tab("💰 Business Calculator"):
                    gr.Markdown("### Business Calculations & Explanations")
                    calc_type = gr.Dropdown(
                        ["Break-even", "Profit", "Gross Profit Margin", "Net Profit Margin", 
                         "Market Share", "Return on Investment"],
                        label="Calculation Type"
                    )
                    calc_values = gr.Textbox(lines=3, label="Values", 
                                            placeholder="e.g., Fixed Costs: $10,000, Price: $50, Variable Cost: $30")
                    calc_output = gr.Textbox(lines=14, label="Calculation & Explanation", interactive=False)
                    gr.Button("🧮 Calculate & Explain", variant="primary").click(
                        business_calculator, [calc_type, calc_values], calc_output
                    )

                # PRACTICE QUESTIONS
                with gr.Tab("✍ Practice"):
                    gr.Markdown("### Generate & Practice Exam Questions")
                    with gr.Row():
                        ps = gr.Radio(["Geography", "History", "Business"], label="Subject", value="Geography")
                        pt = gr.Dropdown(geography_topics, label="Topic")
                    ps.change(update_topics, ps, pt)

                    q = gr.Textbox(label="📝 Question", lines=6, interactive=False)
                    exp = gr.Textbox(label="Expected Answer Points", lines=3, visible=False)
                    mark = gr.Textbox(label="📊 Mark Scheme", lines=4, interactive=False)
                    ans = gr.Textbox(lines=10, label="✏ Your Answer", placeholder="Type your answer here...")
                    fb = gr.Textbox(lines=14, label="📋 Feedback", interactive=False)

                    with gr.Row():
                        gr.Button("🎲 Generate Question", variant="primary").click(
                            generate_question, [ps, pt], [q, exp, mark]
                        )
                        gr.Button("✅ Check Answer", variant="secondary").click(
                            check_answer, [q, exp, ans, ps], fb
                        )

        # ───── ADMIN PANEL ─────
        with gr.Tab("🔐 Admin Panel"):
            with gr.Column() as login_section:
                gr.Markdown("### 🔐 Admin Login")
                pwd = gr.Textbox(label="Password", type="password", placeholder="Enter admin password")
                login_btn = gr.Button("🔓 Login", variant="primary")
                login_status = gr.Textbox(label="Status", interactive=False)
            
            with gr.Column(visible=False) as admin_section:
                gr.Markdown("""### 📤 Upload Past Papers & Resources
                
**Instructions:**
1. **Title**: e.g., "Paper 2 Geography - June 2023"
2. **Subject**: Select Geography, History, or Business
3. **Content**: Add description, syllabus code, or notes
4. **PDF**: Upload the actual past paper (questions will be auto-extracted)
5. **Insert**: Upload any accompanying insert/resource booklet (images, maps, sources, etc.)

The system will automatically:
- Extract all questions from the PDF
- Index them by topic for student search
- Store insert materials for reference
""")
                
                with gr.Row():
                    with gr.Column():
                        t = gr.Textbox(label="📋 Title", placeholder="e.g., Paper 2 - June 2023")
                        s = gr.Radio(["Geography", "History", "Business"], label="Subject", value="Geography")
                        c = gr.Textbox(lines=5, label="Content/Description", 
                                      placeholder="Add notes, syllabus code, or instructions...")
                        pdf = gr.File(label="📄 Past Paper PDF (questions will be extracted)", file_types=[".pdf"])
                        insert = gr.File(label="🖼️ Insert/Resource Booklet (optional)", 
                                        file_types=[".pdf", ".jpg", ".jpeg", ".png"])
                        
                        up = gr.Button("⬆ Upload Paper", variant="primary", size="lg")
                        st = gr.Textbox(label="Upload Status", lines=3)
                        stats = gr.Textbox(label="📊 Database Statistics", value="📊 Status: No papers uploaded yet")
                    
                    with gr.Column():
                        gr.Markdown("### 📚 All Uploaded Papers")
                        lst = gr.Textbox(lines=24, label="Papers Database", value=get_papers_list(), 
                                        interactive=False, show_label=False)
                
                up.click(upload_paper, [t, s, c, pdf, insert], [st, lst, stats])
            
            login_btn.click(verify_admin_password, [pwd], [admin_section, login_section, login_status])

    gr.Markdown("""
    ---
    **System Status:** 🟢 Gemini AI (Primary) | 🔵 Cohere (Secondary) | 🟢 Z.ai (Tertiary) | 🟣 MiniMax (Fallback)
    
    **Features:**
    - 🎯 Smart question extraction from past papers
    - 🖼️ Insert/resource support for visual materials
    - 🔍 Topic-based question search
    - 🤖 Multi-AI fallback system for reliability
    """)

app.launch()