Files
ds-fire-fighter/app.py
T

437 lines
16 KiB
Python
Raw Normal View History

2025-02-06 20:22:43 +00:00
import os
from typing import Optional
from fastapi import FastAPI, HTTPException, Security, Depends
from fastapi.security import APIKeyHeader
from fastapi.middleware.cors import CORSMiddleware
from fastapi.responses import JSONResponse
from dotenv import load_dotenv
from utils.document_loader import load_document
import json
from pydantic import BaseModel
from src.llm import ai_chat
from langchain_openai import ChatOpenAI
import requests
import tempfile
from scripts.generate_pdf import create_pdf
from scripts.generate_theme import generate_theme
from scripts.generate_quiz import generate_quiz
from typing import Dict, Any
from fastapi.responses import Response
from datetime import datetime
from fastapi import HTTPException
from pydantic import BaseModel
2025-02-12 19:25:12 +00:00
from typing import Optional, Union, Dict, Any,List,Optional, List, Tuple, Any
2025-02-06 20:22:43 +00:00
import os
import requests
import os
from PyPDF2 import PdfReader
from config import QUIZ_TYPES
# Load environment variables
load_dotenv()
API_KEY = os.getenv("API_KEY_ACCESS")
base_path = os.path.join("data", "config_files")
QUESTIONS_PATH = os.path.join(base_path, "questions.json")
THEME_CONTEXT_PATH = os.path.join(base_path, "theme_context.json")
2025-02-08 02:39:43 +01:00
with open(THEME_CONTEXT_PATH, "r", encoding="utf-8") as f:
themes = json.load(f)
2025-02-06 20:22:43 +00:00
# Initialize FastAPI app
app = FastAPI(
title="Fire Fighter Interview API",
description="API For fire fighter",
version="1.0.0"
)
# Add CORS middleware
app.add_middleware(
CORSMiddleware,
allow_origins=["*"],
allow_credentials=True,
allow_methods=["*"],
allow_headers=["*"],
)
# Setup API key authentication
api_key_header = APIKeyHeader(name="Authorization", auto_error=False)
async def get_api_key(api_key_header: str = Security(api_key_header)) -> str:
"""Validate API key from header"""
if not api_key_header or not api_key_header.startswith('Bearer '):
raise HTTPException(
status_code=401,
detail={"error": "Unauthorized", "message": "API key is missing or invalid."}
)
token = api_key_header.split(' ')[1]
if token != API_KEY:
raise HTTPException(
status_code=401,
detail={"error": "Unauthorized", "message": "API key does not match."}
)
return token
class ChatRequest(BaseModel):
resume_url: Optional[str] = None
query: str=None
chat_id: int
2025-02-06 20:22:43 +00:00
theme_id: Optional[int] = 1
2025-02-08 02:39:43 +01:00
full_history_url: Optional[str] = None
form_id:Optional[int] = None
feedback: Optional[str] = None
generate_theme:str="NO"
2025-02-06 20:22:43 +00:00
class ChatResponse(BaseModel):
message: str
end: bool
2025-02-08 03:09:00 +01:00
pop_theme_generation:bool
2025-02-06 20:22:43 +00:00
error: Optional[str] = None
class GeneratePDFRequest(BaseModel):
resume_url: Optional[str] = None
chat_id: int
2025-02-11 19:20:53 +01:00
theme_id: Optional[int] = 1
2025-02-06 20:22:43 +00:00
full_history_url: Optional[str] = None
2025-02-06 21:01:22 +00:00
form_id:Optional[int] = None
2025-02-11 19:20:53 +01:00
generate_theme:str="YES"
2025-02-06 20:22:43 +00:00
class QuizRequest(BaseModel):
pdf_url: str
quiz_type: int # 1, 2, or 3 corresponding to QUIZ_TYPES
class QuizResponse(BaseModel):
success: bool
message: str
2025-02-12 19:25:12 +00:00
quiz_data: Optional[List[Any]] = None
2025-02-06 20:22:43 +00:00
error: Optional[str] = None
async def extract_pdf_text(pdf_url: str) -> Union[str, None]:
"""Extract text from PDF and handle potential errors."""
try:
response = requests.get(pdf_url)
response.raise_for_status()
# Create a temporary file
with tempfile.NamedTemporaryFile(delete=False, suffix='.pdf') as temp_pdf:
temp_pdf.write(response.content)
temp_path = temp_pdf.name
# Extract text from PDF
reader = PdfReader(temp_path)
text = "\n\n".join(
page.extract_text() for page in reader.pages if page.extract_text()
)
# Clean up temporary file
os.unlink(temp_path)
if not text.strip():
return None
return text
except requests.RequestException as e:
raise HTTPException(
status_code=400,
detail=f"Error downloading PDF: {str(e)}"
)
except Exception as e:
raise HTTPException(
status_code=500,
detail=f"Error processing PDF: {str(e)}"
)
2025-02-08 02:39:43 +01:00
@app.post("/rescue-career/chat")
2025-02-06 20:22:43 +00:00
async def chat_endpoint(
request: ChatRequest,
api_key: str = Depends(get_api_key)
):
try:
# Validate theme
2025-02-08 02:39:43 +01:00
print(f"Received request with theme_id: {request.theme_id}") # Debugging print
2025-02-06 20:22:43 +00:00
matching_themes = [t for t in themes if t["id"] == request.theme_id]
if not matching_themes:
2025-02-08 02:39:43 +01:00
print(f"No theme found with ID: {request.theme_id}") # Debugging print
2025-02-06 20:22:43 +00:00
raise HTTPException(
status_code=400,
detail=f"No theme found with ID {request.theme_id}"
)
2025-02-08 02:39:43 +01:00
print(f"Validated theme ID: {request.theme_id}") # Print statement added
2025-02-06 20:22:43 +00:00
resume_docs = ""
if request.resume_url:
2025-02-08 02:39:43 +01:00
print(f"Loading resume from URL: {request.resume_url}") # Debugging print
2025-02-06 20:22:43 +00:00
docs = load_document(request.resume_url)
if not docs:
2025-02-08 02:39:43 +01:00
print("Invalid resume URL: Unable to fetch document") # Debugging print
2025-02-06 20:22:43 +00:00
raise HTTPException(
status_code=400,
detail="Invalid resume URL: Unable to fetch document"
)
resume_docs = "\n".join(f"- {doc.page_content}" for doc in docs)
2025-02-08 02:39:43 +01:00
print(f"Loaded resume documents: {resume_docs}") # Debugging print
full_history_docs = ""
if request.full_history_url:
print(f"Loading full history from URL: {request.full_history_url}") # Debugging print
docs = load_document(request.full_history_url)
if not docs:
print("Invalid full history URL: Unable to fetch document") # Debugging print
raise HTTPException(
status_code=400,
detail="Invalid full history URL: Unable to fetch document"
)
full_history_docs = "\n".join(f"- {doc.page_content}" for doc in docs)
print(f"Loaded full history documents: {full_history_docs}") # Debugging print
2025-02-06 20:22:43 +00:00
2025-02-08 02:39:43 +01:00
form_response_docs = ""
if request.form_id:
print(f"Fetching form response for form_id: {request.form_id}") # Debugging print
try:
x_api_key = os.getenv("BACKEND_XAPI_KEY")
url = f"{os.getenv('BACKEND_BASE_URL')}/v3/api/custom/theme-document/answer/{request.form_id}?x-project={x_api_key}"
result = requests.get(url)
result.raise_for_status() # Ensure we raise an error for bad responses
form_response = result.json()["data"] # Return response in JSON format
form_response_docs = "\n".join(f"- {form_response}")
print(f"Fetched form response: {form_response}") # Debugging print
except requests.RequestException as e:
print(f"Error fetching onboarding data: {str(e)}") # Debugging print
raise HTTPException(
status_code=400,
detail="Unable to fetch onboarding data"
)
2025-02-06 20:22:43 +00:00
# Parse response
2025-02-08 02:39:43 +01:00
print("Parsing AI response...") # Debugging print
2025-02-11 19:20:53 +01:00
query = request.query
if not query:
query = "Let's get started"
2025-02-08 02:39:43 +01:00
response = ai_chat(
2025-02-11 19:20:53 +01:00
query=query,
conversation_id=request.chat_id,
2025-02-08 02:39:43 +01:00
theme_id=request.theme_id,
resume=resume_docs,
full_history=full_history_docs,
2025-02-11 19:20:53 +01:00
form_response=form_response_docs
2025-02-06 20:22:43 +00:00
)
2025-02-11 19:20:53 +01:00
print(response)
2025-02-08 02:39:43 +01:00
return ChatResponse(
2025-02-11 19:20:53 +01:00
message=response.get("message", ""),
end=response.get("end", "no") == "yes",
pop_theme_generation=response.get("pop_theme_generation","no") == "yes",
2025-02-08 02:39:43 +01:00
error=None
)
2025-02-06 20:22:43 +00:00
except Exception as e:
2025-02-08 02:39:43 +01:00
print(f"Error processing chat request: {str(e)}") # Print statement added
2025-02-06 20:22:43 +00:00
raise HTTPException(
status_code=500,
detail=f"Error processing chat request: {str(e)}"
)
2025-02-08 02:39:43 +01:00
2025-02-06 20:22:43 +00:00
@app.post("/rescue-career/generate-theme")
async def generate_pdf_endpoint(
2025-02-11 19:20:53 +01:00
request: GeneratePDFRequest,
2025-02-06 20:22:43 +00:00
api_key: str = Depends(get_api_key)
):
try:
2025-02-08 02:39:43 +01:00
print(f"Received request with theme_id: {request.theme_id}") # Debugging print
matching_themes = [t for t in themes if t["id"] == request.theme_id]
if not matching_themes:
print(f"No theme found with ID: {request.theme_id}") # Debugging print
2025-02-06 20:22:43 +00:00
raise HTTPException(
2025-02-08 02:39:43 +01:00
status_code=400,
detail=f"No theme found with ID {request.theme_id}"
2025-02-06 20:22:43 +00:00
)
2025-02-08 02:39:43 +01:00
print(f"Validated theme ID: {request.theme_id}") # Print statement added
2025-02-06 20:22:43 +00:00
resume_docs = ""
if request.resume_url:
2025-02-08 02:39:43 +01:00
print(f"Loading resume from URL: {request.resume_url}") # Debugging print
2025-02-06 20:22:43 +00:00
docs = load_document(request.resume_url)
if not docs:
2025-02-08 02:39:43 +01:00
print("Invalid resume URL: Unable to fetch document") # Debugging print
2025-02-06 20:22:43 +00:00
raise HTTPException(
status_code=400,
detail="Invalid resume URL: Unable to fetch document"
)
resume_docs = "\n".join(f"- {doc.page_content}" for doc in docs)
2025-02-08 02:39:43 +01:00
print(f"Loaded resume documents: {resume_docs}") # Debugging print
2025-02-06 20:22:43 +00:00
full_history_docs = ""
if request.full_history_url:
2025-02-08 02:39:43 +01:00
print(f"Loading full history from URL: {request.full_history_url}") # Debugging print
2025-02-06 20:22:43 +00:00
docs = load_document(request.full_history_url)
if not docs:
2025-02-08 02:39:43 +01:00
print("Invalid full history URL: Unable to fetch document") # Debugging print
2025-02-06 20:22:43 +00:00
raise HTTPException(
status_code=400,
2025-02-08 02:39:43 +01:00
detail="Invalid full history URL: Unable to fetch document"
2025-02-06 20:22:43 +00:00
)
full_history_docs = "\n".join(f"- {doc.page_content}" for doc in docs)
2025-02-08 02:39:43 +01:00
print(f"Loaded full history documents: {full_history_docs}") # Debugging print
2025-02-06 21:01:22 +00:00
form_response_docs = ""
if request.form_id:
2025-02-08 02:39:43 +01:00
print(f"Fetching form response for form_id: {request.form_id}") # Debugging print
2025-02-06 21:01:22 +00:00
try:
x_api_key = os.getenv("BACKEND_XAPI_KEY")
url = f"{os.getenv('BACKEND_BASE_URL')}/v3/api/custom/theme-document/answer/{request.form_id}?x-project={x_api_key}"
result = requests.get(url)
2025-02-08 02:39:43 +01:00
result.raise_for_status() # Ensure we raise an error for bad responses
form_response = result.json()["data"] # Return response in JSON format
form_response_docs = "\n".join(f"- {form_response}")
print(f"Fetched form response: {form_response}") # Debugging print
except requests.RequestException as e:
print(f"Error fetching onboarding data: {str(e)}") # Debugging print
2025-02-06 21:01:22 +00:00
raise HTTPException(
status_code=400,
2025-02-08 02:39:43 +01:00
detail="Unable to fetch onboarding data"
2025-02-06 21:01:22 +00:00
)
2025-02-08 02:39:43 +01:00
# Here you would fetch the conversation data using the conversation_id
# This is a placeholder - replace with your actual conversation data fetching logic
# Get AI-generated theme content
# Get AI-generated theme content
2025-02-08 02:39:43 +01:00
response = ai_chat(
2025-02-11 19:20:53 +01:00
query="NOW GENERATE THE STARTPOP FRAMEWORK",
conversation_id=request.chat_id,
2025-02-08 02:39:43 +01:00
theme_id=request.theme_id,
resume=resume_docs,
full_history=full_history_docs,
2025-02-06 21:01:22 +00:00
form_response=form_response_docs,
2025-02-08 02:39:43 +01:00
generate_theme="YES"
)
print(f"AI Response for theme: {response}")
2025-02-08 02:39:43 +01:00
# Ensure AI response is valid
if not isinstance(response, str):
raise HTTPException(status_code=500, detail="Invalid AI response format")
2025-02-06 20:22:43 +00:00
2025-02-08 02:39:43 +01:00
# Generate PDF
response_data = json.loads(response)
pdf_content = create_pdf(response_data)
2025-02-06 20:22:43 +00:00
timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
file_path = f"theme_{timestamp}.pdf"
# Save the PDF locally temporarily
with open(file_path, "wb") as file:
file.write(pdf_content)
# Upload the PDF to S3 using the API
upload_url = f"{os.getenv('BACKEND_BASE_URL')}/v3/api/custom/theme/doc-upload?x-project={x_api_key}"
with open(file_path, 'rb') as file:
files = {'file': file}
upload_response = requests.post(upload_url, files=files)
# Check if the upload was successful
if upload_response.status_code != 200:
raise HTTPException(status_code=upload_response.status_code, detail="File upload to S3 failed: " + upload_response.text)
upload_data = upload_response.json() # Get the response in JSON format
# Extract the uploaded file URL
theme_url = upload_data.get("url") # Adjust this key based on the actual API response structure
if not theme_url:
raise HTTPException(status_code=500, detail="Failed to retrieve theme URL from upload response")
# Clean up the temporary file
os.remove(file_path)
# Return JSON response with theme URL and text
return {
"theme_url": theme_url,
"theme_text": response_data
}
2025-02-06 20:22:43 +00:00
except Exception as e:
2025-02-08 02:39:43 +01:00
print(f"Error generating theme: {str(e)}")
raise HTTPException(status_code=500, detail=f"Error: {str(e)}")
2025-02-06 20:22:43 +00:00
@app.post("/rescue-career/generate-quiz", response_model=QuizResponse)
async def generate_quiz_endpoint(
request: QuizRequest,
api_key: str = Depends(get_api_key)
):
"""Generate quiz based on PDF content and quiz type."""
# Validate quiz type
if request.quiz_type not in QUIZ_TYPES:
raise HTTPException(
status_code=400,
detail=f"Invalid quiz type. Must be one of: {list(QUIZ_TYPES)}"
)
try:
# Extract text from PDF
pdf_text = await extract_pdf_text(request.pdf_url)
if not pdf_text:
return QuizResponse(
success=False,
message="PDF extraction completed but no text content found",
error="Empty PDF content"
)
# Generate quiz using the existing function
quiz_data = generate_quiz(
startpop_pdf=pdf_text,
quiz_type=request.quiz_type
)
if not quiz_data:
return QuizResponse(
success=False,
message="Quiz generation failed",
error="Unable to generate quiz from the provided content"
)
return QuizResponse(
success=True,
message="Quiz generated successfully",
quiz_data=quiz_data
)
except HTTPException as he:
raise he
except Exception as e:
raise HTTPException(
status_code=500,
detail=f"Unexpected error during quiz generation: {str(e)}"
)
async def get_conversation_data(conversation_id: str) -> dict:
"""
Fetch conversation data using the conversation ID.
Replace this with your actual implementation to fetch conversation data.
"""
try:
storage_path = "conversations.json"
with open(storage_path, 'r') as f:
convs = json.load(f)
convs_id = convs[conversation_id]
return convs_id
except Exception as e:
print(f"Error fetching conversation data: {e}")
return None
@app.on_event("startup")
async def startup_event():
"""Initialize required components on startup"""
pass
if __name__ == "__main__":
import uvicorn
2025-02-12 19:25:12 +00:00
uvicorn.run("app:app", host="0.0.0.0", port=5048, reload=True)