From 350f21637cf5f73d98e3f2f008f2250fd71605ba Mon Sep 17 00:00:00 2001
From: Ayomide <olaniyifolashadeayo@gmail.com>
Date: Thu, 10 Jul 2025 15:16:16 +0100
Subject: [PATCH] Initial commit

---
 .gitignore                                 | 109 +++++++++++++++++
 LICENSE                                    |   0
 backend/brand_style.py                     |  78 ++++++++++++
 backend/config.py                          |  11 ++
 backend/copywriter.py                      |  24 ++++
 backend/embeddings.py                      |  18 +++
 backend/main.py                            | 131 +++++++++++++++++++++
 backend/requirements.txt                   |   7 ++
 backend/vector_store.py                    |  37 ++++++
 data/style_guidelines/email_template.txt   |   1 +
 data/style_guidelines/general_template.txt |   1 +
 data/style_guidelines/social_template.txt  |   1 +
 docs/API_Documendation.md                  |   0
 docs/README.md                             |  97 +++++++++++++++
 14 files changed, 515 insertions(+)
 create mode 100644 .gitignore
 create mode 100644 LICENSE
 create mode 100644 backend/brand_style.py
 create mode 100644 backend/config.py
 create mode 100644 backend/copywriter.py
 create mode 100644 backend/embeddings.py
 create mode 100644 backend/main.py
 create mode 100644 backend/requirements.txt
 create mode 100644 backend/vector_store.py
 create mode 100644 data/style_guidelines/email_template.txt
 create mode 100644 data/style_guidelines/general_template.txt
 create mode 100644 data/style_guidelines/social_template.txt
 create mode 100644 docs/API_Documendation.md
 create mode 100644 docs/README.md

diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..fdfbea6
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,109 @@
+# Byte-compiled / optimized / DLL files
+__pycache__/
+*.py[cod]
+*$py.class
+
+# Distribution / packaging
+.Python
+build/
+develop-eggs/
+dist/
+downloads/
+eggs/
+.eggs/
+lib/
+lib64/
+parts/
+sdist/
+var/
+wheels/
+*.egg-info/
+.installed.cfg
+*.egg
+MANIFEST
+
+# Installer logs
+pip-log.txt
+pip-delete-this-directory.txt
+
+# Unit test / coverage reports
+htmlcov/
+.tox/
+.nox/
+.coverage
+*.cover
+*.py,cover
+.hypothesis/
+.pytest_cache/
+
+# Jupyter Notebook
+.ipynb_checkpoints
+
+### Environment ###
+.env
+.venv
+env/
+venv/
+ENV/
+env.bak/
+venv.bak/
+
+# Virtual environment
+pythonenv*
+
+### IDE ###
+# VS Code
+.vscode/
+!.vscode/settings.json
+!.vscode/tasks.json
+!.vscode/launch.json
+!.vscode/extensions.json
+
+# PyCharm
+.idea/
+*.iml
+*.ipr
+*.iws
+
+### Data Files ###
+# Raw and processed news
+data/raw_news/
+data/processed_news/
+*.csv
+*.json
+*.parquet
+*.feather
+*.pkl
+*.pickle
+*.db
+*.sqlite
+
+# Vector database files
+*.faiss
+*.index
+*.bin
+*.vec
+
+### Logs ###
+*.log
+logs/
+
+### OS Generated ###
+.DS_Store
+.DS_Store?
+._*
+.Spotlight-V100
+.Trashes
+ehthumbs.db
+Thumbs.db
+
+### Groq/Cohere Cache ###
+.cache/
+model_cache/
+
+### Test Files ###
+test_output/
+benchmark_results/
+
+### Documentation ###
+docs/_build/
\ No newline at end of file
diff --git a/LICENSE b/LICENSE
new file mode 100644
index 0000000..e69de29
diff --git a/backend/brand_style.py b/backend/brand_style.py
new file mode 100644
index 0000000..123f42d
--- /dev/null
+++ b/backend/brand_style.py
@@ -0,0 +1,78 @@
+from typing import Dict
+import json
+from pathlib import Path
+
+
+class BrandStyle:
+    def __init__(self):
+        self.style = self._load_style()
+        self.templates = {
+            "email": self._load_template("email"),
+            "social": self._load_template("social"),
+            "general": self._load_template("general")
+        }
+
+    def _load_style(self) -> Dict:
+        path = Path("data/style_guidelines/style.json")
+        if path.exists():
+            return json.loads(path.read_text())
+        else:
+            # Create default style if doesn't exist
+            default_style = {
+                "tone": "professional",
+                "phrases": ["innovative", "results-driven", "empowering", "transformation"],
+                "avoid": ["cheap", "guarantee", "spam", "scam"]
+            }
+            path.parent.mkdir(parents=True, exist_ok=True)
+            path.write_text(json.dumps(default_style, indent=2))
+            return default_style
+
+    def _load_template(self, name: str) -> str:
+        path = Path(f"data/style_guidelines/{name}_template.txt")
+        if path.exists():
+            return path.read_text()
+        else:
+            # Create default templates if they don't exist
+            templates = {
+                "email": "Write a professional email that engages the reader and includes a clear call-to-action.",
+                "social": "Create an engaging social media post that captures attention and encourages interaction.",
+                "general": "Generate marketing copy that is compelling, authentic, and aligned with brand values."
+            }
+            path.parent.mkdir(parents=True, exist_ok=True)
+            path.write_text(templates.get(name, ""))
+            return templates.get(name, "")
+
+    def get_prompt(self, request) -> str:
+        # Handle both dict and Pydantic model objects
+        if hasattr(request, 'dict'):
+            # It's a Pydantic model
+            request_dict = request.dict()
+            tone = request.tone or self.style['tone']
+            content_type = request.content_type
+        else:
+            # It's already a dict
+            request_dict = request
+            tone = request_dict.get('tone', self.style['tone'])
+            content_type = request_dict.get('content_type', 'general')
+
+        return f"""
+You are a marketing assistant for Adriana James. Follow these brand guidelines:
+
+TONE: {tone}
+STYLE: Professional, authentic, and empowering
+
+PREFERRED PHRASES: {', '.join(self.style['phrases'])}
+AVOID USING: {', '.join(self.style['avoid'])}
+
+CONTENT TYPE: {content_type}
+TEMPLATE GUIDANCE: {self.templates.get(content_type, self.templates['general'])}
+
+Create marketing copy that:
+1. Reflects Adriana James' brand voice
+2. Is engaging and authentic
+3. Includes a clear value proposition
+4. Has a compelling call-to-action when appropriate
+5. Feels personal and relatable
+
+Remember: Focus on transformation, empowerment, and results while maintaining professionalism.
+"""
diff --git a/backend/config.py b/backend/config.py
new file mode 100644
index 0000000..14d2d55
--- /dev/null
+++ b/backend/config.py
@@ -0,0 +1,11 @@
+import os
+from dotenv import load_dotenv
+
+load_dotenv()
+
+
+class Config:
+    OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
+    COHERE_API_KEY = os.getenv("COHERE_API_KEY")
+    DATA_PATH = "data/past_campaigns/campaigns.json"
+    FAISS_INDEX_PATH = "data/vector_store.index"
\ No newline at end of file
diff --git a/backend/copywriter.py b/backend/copywriter.py
new file mode 100644
index 0000000..7b7f705
--- /dev/null
+++ b/backend/copywriter.py
@@ -0,0 +1,24 @@
+# backend/copywriter.py
+from .vector_store import VectorStore
+from .brand_style import BrandStyle
+import openai
+
+class Copywriter:
+    def __init__(self):
+        self.vector_store = VectorStore()
+        self.brand_style = BrandStyle()
+    
+    def generate_copy(self, request):
+        # Move the generation logic from main.py here
+        similar = self.vector_store.search(request.prompt, request.content_type)
+        
+        response = openai.ChatCompletion.create(
+            model="gpt-3.5-turbo",
+            messages=[
+                {"role": "system", "content": self.brand_style.get_prompt(request)},
+                {"role": "user", "content": f"Prompt: {request.prompt}\n\nSimilar examples:\n{similar}"}
+            ],
+            temperature=0.7
+        )
+        
+        return response.choices[0].message.content
\ No newline at end of file
diff --git a/backend/embeddings.py b/backend/embeddings.py
new file mode 100644
index 0000000..4980add
--- /dev/null
+++ b/backend/embeddings.py
@@ -0,0 +1,18 @@
+from config import Config
+import cohere
+import openai
+
+class Embeddings:
+    def __init__(self):
+        self.cohere = cohere.Client(Config.COHERE_API_KEY)
+    
+    def get_embedding(self, text: str, engine: str = "cohere"):
+        if engine == "cohere":
+            response = self.cohere.embed(texts=[text], model="small")
+            return response.embeddings[0]
+        else:  # OpenAI fallback
+            response = openai.Embedding.create(
+                input=[text],
+                model="text-embedding-ada-002"
+            )
+            return response.data[0].embedding
\ No newline at end of file
diff --git a/backend/main.py b/backend/main.py
new file mode 100644
index 0000000..8729793
--- /dev/null
+++ b/backend/main.py
@@ -0,0 +1,131 @@
+from fastapi import FastAPI, HTTPException, UploadFile, File
+from fastapi.middleware.cors import CORSMiddleware
+from pydantic import BaseModel
+from typing import Optional, List
+import json
+from datetime import datetime
+from .vector_store import VectorStore
+from .brand_style import BrandStyle
+from .config import Config
+import openai
+import os
+
+# Initialize OpenAI
+openai.api_key = Config.OPENAI_API_KEY
+
+# Initialize
+app = FastAPI(title="Marketing Assistant AI", version="0.1.0")
+vector_store = VectorStore()
+brand_style = BrandStyle()
+
+# CORS
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+
+# Models
+class CampaignRequest(BaseModel):
+    prompt: str
+    content_type: str = "general"
+    tone: Optional[str] = None
+
+class Campaign(BaseModel):
+    content: str
+    content_type: str
+    metadata: dict = {}
+
+# Routes
+@app.post("/generate")
+async def generate_copy(request: CampaignRequest):
+    """Generate marketing copy based on prompt and brand guidelines"""
+    try:
+        # Get similar content from vector store
+        similar = vector_store.search(request.prompt, request.content_type)
+        
+        # Format similar content for context
+        similar_content = ""
+        if similar:
+            similar_content = "\n\nSimilar past campaigns for reference:\n"
+            for i, campaign in enumerate(similar[:3], 1):
+                similar_content += f"{i}. {campaign.get('content', '')}\n"
+        
+        # Generate with OpenAI
+        system_prompt = brand_style.get_prompt(request)
+        user_prompt = f"Create marketing copy for: {request.prompt}{similar_content}"
+        
+        response = openai.ChatCompletion.create(
+            model="gpt-3.5-turbo",
+            messages=[
+                {"role": "system", "content": system_prompt},
+                {"role": "user", "content": user_prompt}
+            ],
+            temperature=0.7,
+            max_tokens=500
+        )
+        
+        generated_copy = response.choices[0].message.content
+        
+        # Store the generated copy for future reference
+        new_campaign = {
+            "content": generated_copy,
+            "content_type": request.content_type,
+            "metadata": {
+                "prompt": request.prompt,
+                "tone": request.tone,
+                "generated_at": datetime.now().isoformat()
+            }
+        }
+        
+        # Add to vector store for future similarity searches
+        vector_store.add_campaign(new_campaign)
+        
+        return {"result": generated_copy}
+    
+    except Exception as e:
+        print(f"Error in generate_copy: {str(e)}")  # For debugging
+        raise HTTPException(status_code=500, detail=str(e))
+
+@app.post("/add-campaign")
+async def add_campaign(campaign: Campaign):
+    """Add a new campaign to the vector store"""
+    try:
+        # Add timestamp to metadata
+        campaign_data = campaign.dict()
+        campaign_data["metadata"]["added_at"] = datetime.now().isoformat()
+        
+        vector_store.add_campaign(campaign_data)
+        return {"status": "success"}
+    except Exception as e:
+        print(f"Error in add_campaign: {str(e)}")  # For debugging
+        raise HTTPException(status_code=500, detail=str(e))
+
+@app.get("/search")
+async def search_campaigns(query: str, limit: int = 5):
+    """Search for similar campaigns"""
+    try:
+        results = vector_store.search(query, k=limit)
+        return {"results": results}
+    except Exception as e:
+        print(f"Error in search_campaigns: {str(e)}")  # For debugging
+        raise HTTPException(status_code=500, detail=str(e))
+
+@app.get("/")
+async def root():
+    """Health check endpoint"""
+    return {"message": "Marketing Assistant AI is running", "version": "0.1.0"}
+
+@app.get("/health")
+async def health_check():
+    """Detailed health check"""
+    return {
+        "status": "healthy",
+        "vector_store_size": len(vector_store.campaigns),
+        "timestamp": datetime.now().isoformat()
+    }
+
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=8000)
\ No newline at end of file
diff --git a/backend/requirements.txt b/backend/requirements.txt
new file mode 100644
index 0000000..a0844b4
--- /dev/null
+++ b/backend/requirements.txt
@@ -0,0 +1,7 @@
+fastapi
+uvicorn
+openai==0.28
+cohere
+sentence-transformers
+faiss-cpu
+python-dotenv
\ No newline at end of file
diff --git a/backend/vector_store.py b/backend/vector_store.py
new file mode 100644
index 0000000..11f11ad
--- /dev/null
+++ b/backend/vector_store.py
@@ -0,0 +1,37 @@
+import faiss
+import numpy as np
+from sentence_transformers import SentenceTransformer
+from .config import Config
+import json
+from pathlib import Path
+
+
+class VectorStore:
+    def __init__(self):
+        self.model = SentenceTransformer('all-MiniLM-L6-v2')
+        self.index = faiss.IndexFlatL2(384)
+        self.campaigns = []
+        self._load_data()
+
+    def _load_data(self):
+        if Path(Config.DATA_PATH).exists():
+            with open(Config.DATA_PATH) as f:
+                self.campaigns = json.load(f)
+                if self.campaigns:
+                    embeddings = self.model.encode([c["content"] for c in self.campaigns])
+                    self.index.add(embeddings)
+
+    def add_campaign(self, campaign: dict):
+        self.campaigns.append(campaign)
+        embedding = self.model.encode([campaign["content"]])
+        self.index.add(embedding)
+        self._save_data()
+
+    def search(self, query: str, content_type: str = None, k: int = 3):
+        query_embedding = self.model.encode([query])
+        distances, indices = self.index.search(query_embedding, k)
+        return [self.campaigns[i] for i in indices[0]]
+
+    def _save_data(self):
+        with open(Config.DATA_PATH, 'w') as f:
+            json.dump(self.campaigns, f)
\ No newline at end of file
diff --git a/data/style_guidelines/email_template.txt b/data/style_guidelines/email_template.txt
new file mode 100644
index 0000000..db4abba
--- /dev/null
+++ b/data/style_guidelines/email_template.txt
@@ -0,0 +1 @@
+Write a professional email that engages the reader and includes a clear call-to-action.
\ No newline at end of file
diff --git a/data/style_guidelines/general_template.txt b/data/style_guidelines/general_template.txt
new file mode 100644
index 0000000..84dac8f
--- /dev/null
+++ b/data/style_guidelines/general_template.txt
@@ -0,0 +1 @@
+Generate marketing copy that is compelling, authentic, and aligned with brand values.
\ No newline at end of file
diff --git a/data/style_guidelines/social_template.txt b/data/style_guidelines/social_template.txt
new file mode 100644
index 0000000..c7629be
--- /dev/null
+++ b/data/style_guidelines/social_template.txt
@@ -0,0 +1 @@
+Create an engaging social media post that captures attention and encourages interaction.
\ No newline at end of file
diff --git a/docs/API_Documendation.md b/docs/API_Documendation.md
new file mode 100644
index 0000000..e69de29
diff --git a/docs/README.md b/docs/README.md
new file mode 100644
index 0000000..7f0f633
--- /dev/null
+++ b/docs/README.md
@@ -0,0 +1,97 @@
+# Marketing Assistant AI
+
+## Project Overview
+
+Marketing Assistant AI is an AI-powered tool designed to streamline the process of ideation, copywriting, and marketing campaign creation. It generates marketing content in line with the brand tone and voice of Adriana James, producing drafts that can be validated and refined by a human marketer.
+
+## Objectives
+
+* Reduce the time required to generate marketing copy.
+* Create content for emails, campaigns, social media, website copy, funnel pages, and more.
+* Ensure the AI produces copywriting that aligns with the brand tone and voice of Adriana James.
+* Allow ongoing updates to improve the AI’s performance and accuracy.
+
+## Deliverables
+
+* A custom-trained LLM fine-tuned for marketing and copywriting.
+* Ability to generate copy in the same style and brand tone of Adriana James.
+
+## Tech Stack
+
+* **LLM** : Open-source or proprietary LLM fine-tuned for marketing.
+* **Embeddings & Re-Ranking** : Cohere for embeddings and ranking results.
+* **Backend** : FastAPI for API services.
+* **Vector Database** : FAISS for content retrieval.
+* **Storage** : Local storage for historical marketing data.
+
+## File Structure
+
+```
+Marketing_Assistant_AI/
+│-- backend/
+│   │-- main.py  # FastAPI backend
+│   │-- copywriter.py  # AI-powered copy generation module
+│   │-- vector_store.py  # Manages vector database operations
+│   │-- embeddings.py  # Generates embeddings using Cohere
+│   │-- brand_style.py  # Ensures brand tone consistency
+│   │-- config.py  # Configuration settings
+│   │-- requirements.txt  # Dependencies
+│
+│-- data/
+│   │-- past_campaigns/  # Stores past marketing campaigns
+│   │-- user_queries/  # Stores past user queries for AI training
+│   │-- style_guidelines/  # Reference materials for brand tone
+│
+│-- docs/
+│   │-- README.md  # Documentation for new developers
+│   │-- API_Documentation.md  # API details
+│
+│-- .env  # Environment variables
+│-- .gitignore  # Git ignore file
+│-- LICENSE  # License information
+```
+
+## Setup & Installation
+
+### 1. Clone the Repository
+
+```bash
+git clone http://23.29.118.76:3000/Test/ds_task_marketing_assistant_ai
+cd marketing-assistant-ai
+```
+
+### 2. Set Up the Backend
+
+```bash
+cd backend
+pip install -r requirements.txt
+python main.py
+```
+
+## AI Copywriting Process
+
+1. **User Input** : The user submits a request (e.g., "Generate an email campaign for a product launch").
+2. **Preprocessing** : The AI extracts key details and matches them with past marketing data.
+3. **Generation** : The fine-tuned LLM creates a draft aligned with Adriana James' brand tone.
+4. **Refinement** : The AI applies re-ranking to prioritize relevant content.
+5. **Final Output** : The generated copy is displayed for user review and editing.
+
+### Example API Usage
+
+#### Generate Marketing Copy
+
+```python
+import requests
+
+url = "http://localhost:8000/generate-copy"
+data = {"prompt": "Write a social media post for our new product launch"}
+response = requests.post(url, json=data)
+print(response.json())
+```
+
+## Success Criteria
+
+* AI generates copywriting that accurately reflects the brand tone.
+* AI can be updated with new marketing materials.
+* CRUD functionality to manage training data.
+* AI adapts to new marketing trends and user queries.