Add requirements.txt with essential dependencies for the project

2025-10-05 11:29:45 +00:00
commit 3d48cf0385
15 changed files with 3686 additions and 0 deletions
@@ -0,0 +1,469 @@
+import logging
+import time
+from typing import List, Tuple
+
+import groq
+
+from config import settings
+from schemas import Match, Receipt, Transaction
+
+# Set up logging.
+# NOTE(review): basicConfig() runs at import time, so merely importing this
+# module configures the root logger at INFO level (basicConfig is a no-op
+# when the root logger already has handlers).
+logging.basicConfig(level=logging.INFO)
+# Module-level logger shared by everything defined below.
+logger = logging.getLogger(__name__)
+
+
+class AIMatcher:
+    def __init__(self, use_batch_matching=True):
+        self.client = groq.Groq(api_key=settings.GROQ_API_KEY)
+        self.model = "llama-3.1-8b-instant"
+        self.max_retries = 3
+        self.retry_delay = 2  # seconds - increased for rate limiting
+        self.rate_limit_delay = 1.0  # seconds between API calls
+        self.last_api_call = 0
+        self.use_batch_matching = (
+            use_batch_matching  # Toggle between new and legacy methods
+        )
+
+    def match_receipts_to_transactions(
+        self, receipts: List[Receipt], transactions: List[Transaction]
+    ) -> List[Match]:
+        """Match receipts to transactions using AI"""
+        logger.info(
+            f"Starting AI matching for {len(receipts)} receipts against {len(transactions)} transactions"
+        )
+        matches = []
+
+        for i, receipt in enumerate(receipts):
+            logger.info(
+                f"Processing receipt {i + 1}/{len(receipts)}: {receipt.vendor} - ${receipt.amount}"
+            )
+
+            # Rate limiting
+            self._rate_limit()
+
+            # Get the BEST match for this receipt (highest confidence score)
+            best_match = self._find_best_match(receipt, transactions)
+            if best_match:
+                matches.append(best_match)
+                logger.info(
+                    f"Found match: {best_match.confidence_score:.3f} - {best_match.match_reason}"
+                )
+            else:
+                logger.warning(
+                    f"No match found for receipt: {receipt.vendor} - ${receipt.amount}"
+                )
+
+        # Sort by confidence score (highest first)
+        matches = sorted(matches, key=lambda x: x.confidence_score, reverse=True)
+        logger.info(f"AI matching completed. Found {len(matches)} matches")
+        return matches
+
+    def _rate_limit(self):
+        """Implement rate limiting to avoid API quota exhaustion"""
+        current_time = time.time()
+        time_since_last_call = current_time - self.last_api_call
+
+        if time_since_last_call < self.rate_limit_delay:
+            sleep_time = self.rate_limit_delay - time_since_last_call
+            logger.debug(f"Rate limiting: sleeping for {sleep_time:.2f} seconds")
+            time.sleep(sleep_time)
+
+        self.last_api_call = time.time()
+
+    def _find_best_match(
+        self, receipt: Receipt, transactions: List[Transaction]
+    ) -> Match:
+        """Find the BEST match for a receipt using a single AI call for all candidates"""
+        candidates = self._filter_candidates(receipt, transactions)
+        if not candidates:
+            logger.warning(
+                f"No candidates found for receipt: {receipt.vendor} - ${receipt.amount}"
+            )
+            return None
+
+        logger.info(f"Found {len(candidates)} candidates for receipt: {receipt.vendor}")
+
+        # Choose matching method based on configuration
+        if self.use_batch_matching:
+            # New efficient method: single AI call for all candidates
+            best_match = self._find_best_match_single_call(receipt, candidates)
+        else:
+            # Legacy method: individual AI calls (fallback)
+            best_match = self._find_best_match_legacy(receipt, candidates)
+
+        return best_match
+
+    def _find_best_match_single_call(
+        self, receipt: Receipt, candidates: List[Transaction]
+    ) -> Match:
+        """Find the best match using a single AI call to evaluate all candidates.
+
+        Args:
+            receipt: Receipt to match.
+            candidates: Transactions to present to the model. At most 10 are
+                sent; when more are given, the ones closest in amount win.
+
+        Returns:
+            A ``Match`` for the candidate the model selected, or ``None`` when
+            there are no candidates, the reply cannot be parsed, the model
+            names a candidate number outside the list, or every API attempt
+            raised an exception.
+        """
+        if not candidates:
+            return None
+
+        # Limit candidates to avoid token limits (adjust based on your needs)
+        max_candidates = 10
+        if len(candidates) > max_candidates:
+            # Sort by amount similarity and take top candidates
+            candidates = sorted(
+                candidates, key=lambda t: abs(receipt.amount - abs(t.amount))
+            )[:max_candidates]
+            logger.info(
+                f"Limited candidates to top {max_candidates} by amount similarity"
+            )
+
+        # Build comprehensive prompt with all candidates
+        candidates_text = ""
+        for i, transaction in enumerate(candidates):
+            # Transaction amounts are compared by magnitude (sign ignored).
+            transaction_amount_abs = abs(transaction.amount)
+            date_diff = abs((receipt.receipt_date - transaction.transaction_date).days)
+            amount_diff = abs(receipt.amount - transaction_amount_abs)
+            # Guard against division by zero for non-positive receipt amounts.
+            amount_percent_diff = (
+                (amount_diff / receipt.amount) * 100 if receipt.amount > 0 else 0
+            )
+
+            # Candidates are numbered from 1 in the prompt; the parsed reply
+            # is converted back to a 0-based index.
+            candidates_text += f"""
+Candidate {i + 1}:
+- Vendor: {transaction.vendor}
+- Amount: ${transaction.amount} (absolute: ${transaction_amount_abs})
+- Date: {transaction.transaction_date.strftime("%Y-%m-%d")} ({date_diff} days difference)
+- Notes: {transaction.notes}
+- Amount difference: ${amount_diff} ({amount_percent_diff:.1f}%)
+"""
+
+        prompt = f"""
+You are an expert at matching receipts to bank transactions. Analyze the receipt below against ALL the candidate transactions and return the BEST match.
+
+RECEIPT TO MATCH:
+- Vendor: {receipt.vendor}
+- Amount: ${receipt.amount}
+- Date: {receipt.receipt_date.strftime("%Y-%m-%d")}
+- Description: {receipt.description}
+- Category: {receipt.category}
+
+CANDIDATE TRANSACTIONS:
+{candidates_text}
+
+SCORING CRITERIA:
+- Perfect matches (same vendor, amount, date): 0.95-1.0
+- High confidence (minor differences): 0.8-0.94
+- Medium confidence (moderate differences): 0.6-0.79
+- Low confidence (significant differences): 0.4-0.59
+- Very low confidence (major differences): 0.2-0.39
+- Minimal similarity: 0.1-0.19
+- No meaningful similarity: 0.0-0.09
+
+Consider vendor name similarity, amount accuracy, date proximity, and description/notes relevance.
+
+IMPORTANT: You MUST return the candidate with the highest match score, even if it's very low. Never return NONE.
+Return ONLY the best match in this exact format:
+CANDIDATE_NUMBER|CONFIDENCE_SCORE|REASON
+
+Example: 3|0.87|Same vendor name, exact amount match, 1 day apart
+Example of low match: 5|0.15|Best available option despite significant differences in vendor and amount
+"""
+
+        # Only exceptions trigger a retry; an unparseable reply or an
+        # out-of-range candidate number returns None immediately.
+        for attempt in range(self.max_retries):
+            try:
+                result = self._call_groq_api_with_timeout(
+                    prompt, timeout=45
+                )  # Longer timeout for complex prompt
+
+                # Parse the single result
+                candidate_num, score, reason = self._parse_single_match_response(result)
+
+                if candidate_num == -1:  # Parsing error occurred
+                    logger.warning(
+                        f"Failed to parse AI response for receipt: {receipt.vendor}"
+                    )
+                    return None
+
+                # candidate_num is 0-based here and must index into candidates.
+                if 0 <= candidate_num < len(candidates):
+                    best_transaction = candidates[candidate_num]
+                    logger.info(
+                        f"AI selected candidate {candidate_num + 1}: {best_transaction.vendor} (score: {score:.3f})"
+                    )
+                    return Match(receipt, best_transaction, score, reason)
+                else:
+                    logger.warning(
+                        f"AI returned invalid candidate number: {candidate_num}"
+                    )
+                    return None
+
+            except Exception as e:
+                logger.warning(
+                    f"Attempt {attempt + 1} failed for receipt {receipt.id}: {str(e)}"
+                )
+                if attempt < self.max_retries - 1:
+                    # Exponential backoff: retry_delay, 2x, 4x, ...
+                    sleep_time = self.retry_delay * (2**attempt)
+                    logger.info(f"Waiting {sleep_time} seconds before retry...")
+                    time.sleep(sleep_time)
+                else:
+                    logger.error(f"All attempts failed for receipt {receipt.id}")
+                    return None
+
+        # Reached only when the retry loop never ran (max_retries == 0).
+        return None
+
+    def _parse_single_match_response(self, result: str) -> Tuple[int, float, str]:
+        """Parse AI response for single best match"""
+        result = result.strip()
+        logger.debug(f"Parsing single match response: {result}")
+
+        try:
+            if result.upper().startswith("NONE"):
+                # This should not happen with new prompt, but handle as parsing error
+                logger.warning(
+                    "AI returned NONE despite being instructed to always return best match"
+                )
+                return -1, 0.0, "AI returned NONE unexpectedly"
+
+            if "|" in result:
+                parts = result.split("|")
+                if len(parts) >= 3:
+                    candidate_str = parts[0].strip()
+                    score_str = parts[1].strip()
+                    reason = "|".join(parts[2:]).strip()
+
+                    # Extract candidate number
+                    import re
+
+                    candidate_match = re.search(r"\d+", candidate_str)
+                    if candidate_match:
+                        candidate_num = (
+                            int(candidate_match.group()) - 1
+                        )  # Convert to 0-based index
+                    else:
+                        raise ValueError("No candidate number found")
+
+                    # Extract score
+                    score_clean = "".join(
+                        c for c in score_str if c.isdigit() or c == "."
+                    )
+                    score = float(score_clean) if score_clean else 0.0
+
+                    # Ensure score is in valid range
+                    score = max(0.0, min(1.0, score))
+
+                    logger.debug(
+                        f"Parsed: candidate={candidate_num}, score={score}, reason={reason}"
+                    )
+                    return candidate_num, score, reason
+
+        except Exception as e:
+            logger.warning(f"Error parsing single match response: {e}")
+
+        # Fallback
+        logger.warning(f"Could not parse single match response: {result}")
+        return -1, 0.0, f"Parse error: {result[:50]}..."
+
+    def _filter_candidates(
+        self, receipt: Receipt, transactions: List[Transaction]
+    ) -> List[Transaction]:
+        """Filter transactions to create a reasonable candidate list"""
+        candidates = []
+        amount_threshold = receipt.amount * 2.0  # 200% threshold - very inclusive
+
+        for transaction in transactions:
+            # Use absolute value for transaction amount comparison
+            transaction_amount_abs = abs(transaction.amount)
+
+            # Only exclude transactions with obviously different amounts
+            if abs(receipt.amount - transaction_amount_abs) <= amount_threshold:
+                candidates.append(transaction)
+
+        logger.debug(
+            f"Filtered {len(transactions)} transactions to {len(candidates)} candidates"
+        )
+        return candidates
+
+    def _find_best_match_legacy(
+        self, receipt: Receipt, transactions: List[Transaction]
+    ) -> Match:
+        """Legacy method: Find the best match using individual API calls (kept as fallback)"""
+        candidates = self._filter_candidates(receipt, transactions)
+        if not candidates:
+            return None
+
+        best_match = None
+        highest_score = 0
+
+        for transaction in candidates:
+            score, reason = self._calculate_match_score(receipt, transaction)
+            logger.debug(
+                f"Score {score:.3f} for transaction {transaction.vendor}: {reason}"
+            )
+
+            if score > highest_score:
+                highest_score = score
+                best_match = Match(receipt, transaction, score, reason)
+
+        return best_match
+
+    def _calculate_match_score(
+        self, receipt: Receipt, transaction: Transaction
+    ) -> Tuple[float, str]:
+        """Calculate match score using AI.
+
+        Builds a prompt describing one receipt/transaction pair (including
+        pre-computed date and amount differences), sends it to the model and
+        parses the ``score|reason`` reply.
+
+        Returns:
+            ``(score, reason)``. If every attempt raises, the score is ``0.0``
+            and the reason carries the last error message.
+        """
+        # Calculate differences for the AI to consider
+        date_diff = abs((receipt.receipt_date - transaction.transaction_date).days)
+        # Transaction amounts are compared by magnitude (sign ignored).
+        transaction_amount_abs = abs(transaction.amount)
+        amount_diff = abs(receipt.amount - transaction_amount_abs)
+        # Guard against division by zero for non-positive receipt amounts.
+        amount_percent_diff = (
+            (amount_diff / receipt.amount) * 100 if receipt.amount > 0 else 0
+        )
+
+        prompt = f"""
+        Compare this receipt with this transaction and provide a confidence score (0-1) and brief reason, the reason must be a single sentence without any special formatting.
+        
+        Receipt: {receipt.vendor}, ${receipt.amount}, {receipt.receipt_date.strftime("%Y-%m-%d")}
+        Receipt Description: {receipt.description}
+        Receipt Category: {receipt.category}
+        Transaction: {transaction.vendor}, ${transaction.amount} (absolute: ${transaction_amount_abs}), {transaction.transaction_date.strftime("%Y-%m-%d")}
+        Transaction Notes: {transaction.notes}
+        
+        Differences:
+        - Date difference: {date_diff} days
+        - Amount difference: ${amount_diff} ({amount_percent_diff:.1f}%)
+        - Vendor comparison: "{receipt.vendor}" vs "{transaction.vendor}"
+        - Description/Notes comparison: "{receipt.description}" vs "{transaction.notes}"
+        - Category: {receipt.category}
+        
+        Score this potential match based on how likely it is the correct match:
+        
+        - Perfect matches (same vendor, amount, date): 0.95-1.0
+        - High confidence (minor differences): 0.8-0.94
+        - Medium confidence (moderate differences): 0.6-0.79
+        - Low confidence (significant differences): 0.4-0.59
+        - Very low confidence (major differences): 0.2-0.39
+        - Minimal similarity: 0.1-0.19
+        - No meaningful similarity: 0.0-0.09
+        
+        Consider description and category similarity in your scoring.
+        
+        IMPORTANT: Return ONLY the score and reason separated by a pipe character.
+        Format: [score]|[reason]
+        Example: 0.85|Same vendor, same amount, 2 days apart
+        """
+
+        # Retry on any exception; a successfully parsed reply returns at once.
+        # NOTE(review): if max_retries were 0 the loop would not run and the
+        # method would fall through and return None instead of a tuple.
+        for attempt in range(self.max_retries):
+            try:
+                result = self._call_groq_api_with_timeout(
+                    prompt, timeout=30
+                )  # Increased timeout
+
+                # Parse the result - handle multiple formats
+                score, reason = self._parse_ai_response(result)
+
+                logger.debug(f"AI Response: {result}")
+                logger.debug(f"Parsed: score={score}, reason={reason}")
+
+                return score, reason
+
+            except Exception as e:
+                logger.warning(
+                    f"Attempt {attempt + 1} failed for receipt {receipt.id}: {str(e)}"
+                )
+                if attempt < self.max_retries - 1:
+                    # Exponential backoff for rate limiting
+                    sleep_time = self.retry_delay * (2**attempt)
+                    logger.info(f"Waiting {sleep_time} seconds before retry...")
+                    time.sleep(sleep_time)
+                else:
+                    # Last attempt failed: report a zero score with the error.
+                    logger.error(f"All attempts failed for receipt {receipt.id}")
+                    return 0.0, f"AI error after {self.max_retries} attempts: {str(e)}"
+
+    def _parse_ai_response(self, result: str) -> Tuple[float, str]:
+        """Parse AI response with robust error handling"""
+        result = result.strip()
+        logger.debug(f"Parsing AI response: {result}")
+
+        # Try to find score in various formats
+        if "|" in result:
+            parts = result.split("|")
+            logger.debug(f"Split response into {len(parts)} parts: {parts}")
+
+            # Look for a numeric score in any part
+            for i, part in enumerate(parts):
+                part = part.strip()
+                try:
+                    # Remove any non-numeric characters except decimal point
+                    score_str_clean = "".join(
+                        c for c in part if c.isdigit() or c == "."
+                    )
+                    if score_str_clean:
+                        score = float(score_str_clean)
+                        if 0 <= score <= 1:  # Valid confidence score
+                            # Get reason from other parts
+                            reason_parts = [
+                                p.strip()
+                                for j, p in enumerate(parts)
+                                if j != i and p.strip()
+                            ]
+                            reason = (
+                                " | ".join(reason_parts)
+                                if reason_parts
+                                else "Score extracted"
+                            )
+                            logger.debug(
+                                f"Found score {score} in part {i}, reason: {reason}"
+                            )
+                            return score, reason
+                except ValueError:
+                    continue
+
+        # Try to extract just a number from the response
+        try:
+            import re
+
+            numbers = re.findall(r"\d+\.?\d*", result)
+            if numbers:
+                for num_str in numbers:
+                    score = float(num_str)
+                    if 0 <= score <= 1:  # Valid confidence score
+                        logger.debug(f"Extracted score {score} from response")
+                        return score, f"Extracted from response: {result[:50]}..."
+        except (ValueError, IndexError):
+            pass
+
+        # Fallback - try to find any number and normalize it
+        try:
+            import re
+
+            numbers = re.findall(r"\d+\.?\d*", result)
+            if numbers:
+                score = float(numbers[0])
+                # Normalize to 0-1 range if it's a percentage or other scale
+                if score > 1:
+                    score = score / 100  # Assume percentage
+                score = max(0, min(1, score))  # Clamp to 0-1
+                logger.debug(f"Normalized score {score} from response")
+                return score, f"Normalized from response: {result[:50]}..."
+        except (ValueError, IndexError):
+            pass
+
+        # Final fallback
+        logger.warning(f"Could not parse AI response: {result}")
+        return 0.0, f"Unparseable response: {result[:50]}..."
+
+    def _call_groq_api_with_timeout(self, prompt: str, timeout: int = 15) -> str:
+        """Make API call with timeout and retry logic"""
+        import concurrent.futures
+
+        def api_call():
+            try:
+                response = self.client.chat.completions.create(
+                    model=self.model,
+                    messages=[{"role": "user", "content": prompt}],
+                    max_tokens=200,
+                    temperature=0.1,
+                )
+                return response.choices[0].message.content.strip()
+            except Exception as e:
+                raise e
+
+        try:
+            with concurrent.futures.ThreadPoolExecutor() as executor:
+                future = executor.submit(api_call)
+                return future.result(timeout=timeout)
+        except concurrent.futures.TimeoutError:
+            raise Exception(f"API call timed out after {timeout} seconds")
+        except Exception as e:
+            raise e
@@ -0,0 +1,175 @@
+from dataclasses import dataclass
+from typing import Any, Dict, List
+
+from schemas import Receipt, Transaction
+from services.tax_rules_engine import TaxRulesEngine
+
+
+@dataclass
+class AIRule:
+    # A declarative rule: when `condition` holds for a receipt/transaction
+    # pair, `action` is applied to the results built by AIRulesEngine.
+    name: str  # identifier; AIRulesEngine.remove_rule() filters on it
+    condition: str  # condition string interpreted by _evaluate_condition()
+    action: str  # action keyword dispatched by _execute_action()
+    source: str  # origin label; the default rules use "system" / "tax_system"
+    status: str = "active"  # apply_rules() skips rules that are not "active"
+
+
+class AIRulesEngine:
+    def __init__(self):
+        self.rules: List[AIRule] = []
+        self.tax_rules_engine = TaxRulesEngine()
+        self._load_default_rules()
+
+    def _load_default_rules(self):
+        self.rules = [
+            AIRule(
+                "exact_amount_match", "amount_diff <= 0.01", "auto_approve", "system"
+            ),
+            AIRule(
+                "same_vendor_same_date",
+                "vendor_match and date_diff <= 1",
+                "high_confidence",
+                "system",
+            ),
+            AIRule(
+                "gas_station_pattern",
+                "vendor_contains_gas_or_fuel",
+                "categorize_transport",
+                "system",
+            ),
+            # Tax-related rules
+            AIRule(
+                "fx_currency_mismatch",
+                "currency_mismatch",
+                "flag_fx_review",
+                "tax_system",
+            ),
+            AIRule(
+                "meals_entertainment",
+                "is_meals_entertainment",
+                "apply_me_tax_rule",
+                "tax_system",
+            ),
+            AIRule(
+                "provincial_tax_calculation",
+                "has_address_info",
+                "calculate_provincial_tax",
+                "tax_system",
+            ),
+        ]
+
+    def apply_rules(self, receipt: Receipt, transaction: Transaction) -> Dict[str, Any]:
+        results = {
+            "auto_approve": False,
+            "confidence_boost": 0,
+            "category": None,
+            "tax_analysis": {},
+        }
+
+        for rule in self.rules:
+            if rule.status != "active":
+                continue
+
+            if self._evaluate_condition(rule.condition, receipt, transaction):
+                self._execute_action(rule.action, results, receipt, transaction)
+
+        return results
+
+    def _evaluate_condition(
+        self, condition: str, receipt: Receipt, transaction: Transaction
+    ) -> bool:
+        """Safely evaluate rule conditions without using eval()"""
+        amount_diff = abs(receipt.amount - abs(transaction.amount))
+        date_diff = abs((receipt.receipt_date - transaction.transaction_date).days)
+        vendor_match = (
+            receipt.vendor.lower() in transaction.vendor.lower()
+            or transaction.vendor.lower() in receipt.vendor.lower()
+        )
+        vendor_lower = receipt.vendor.lower()
+        vendor_contains_gas_or_fuel = "gas" in vendor_lower or "fuel" in vendor_lower
+
+        # Tax-related conditions
+        currency_mismatch = receipt.currency != transaction.currency
+        is_meals_entertainment = receipt.is_meals_entertainment
+        has_address_info = (
+            receipt.billing_address is not None or receipt.shipping_address is not None
+        )
+
+        # Handle specific condition types safely
+        if condition == "amount_diff <= 0.01":
+            return amount_diff <= 0.01
+        elif condition == "vendor_match and date_diff <= 1":
+            return vendor_match and date_diff <= 1
+        elif condition == "vendor_contains_gas_or_fuel":
+            return vendor_contains_gas_or_fuel
+        elif condition == "currency_mismatch":
+            return currency_mismatch
+        elif condition == "is_meals_entertainment":
+            return is_meals_entertainment
+        elif condition == "has_address_info":
+            return has_address_info
+        else:
+            # For any other conditions, try to evaluate them safely
+            try:
+                # Only allow safe operations
+                safe_globals = {
+                    "amount_diff": amount_diff,
+                    "date_diff": date_diff,
+                    "vendor_match": vendor_match,
+                    "vendor_contains_gas_or_fuel": vendor_contains_gas_or_fuel,
+                    "currency_mismatch": currency_mismatch,
+                    "is_meals_entertainment": is_meals_entertainment,
+                    "has_address_info": has_address_info,
+                    "receipt": receipt,
+                    "transaction": transaction,
+                    "abs": abs,
+                    "len": len,
+                    "min": min,
+                    "max": max,
+                    "sum": sum,
+                    "round": round,
+                }
+                return eval(condition, safe_globals, {})
+            except (SyntaxError, NameError, TypeError) as e:
+                print(f"Warning: Invalid condition '{condition}': {e}")
+                return False
+
+    def _execute_action(
+        self,
+        action: str,
+        results: Dict[str, Any],
+        receipt: Receipt,
+        transaction: Transaction,
+    ):
+        if action == "auto_approve":
+            results["auto_approve"] = True
+        elif action == "high_confidence":
+            results["confidence_boost"] += 0.2
+        elif action == "categorize_transport":
+            results["category"] = "Transportation"
+        elif action == "flag_fx_review":
+            # Apply FX rule and flag for review
+            fx_result = self.tax_rules_engine.apply_fx_rule(receipt, transaction)
+            results["tax_analysis"]["fx"] = fx_result
+            if fx_result.get("requires_manual_review", False):
+                results["confidence_boost"] -= 0.1  # Reduce confidence for FX issues
+        elif action == "apply_me_tax_rule":
+            # Apply meals & entertainment rule
+            me_result = self.tax_rules_engine.apply_meals_entertainment_rule(receipt)
+            results["tax_analysis"]["meals_entertainment"] = me_result
+        elif action == "calculate_provincial_tax":
+            # Calculate provincial tax
+            tax_result = self.tax_rules_engine.apply_sales_tax_rule(receipt)
+            results["tax_analysis"]["sales_tax"] = tax_result
+
+    def add_rule(self, rule: AIRule):
+        self.rules.append(rule)
+
+    def remove_rule(self, rule_name: str):
+        self.rules = [r for r in self.rules if r.name != rule_name]
+
+    def apply_tax_rules(
+        self, receipt: Receipt, transaction: Transaction = None
+    ) -> Dict[str, Any]:
+        """Apply all tax rules to a receipt/transaction pair"""
+        return self.tax_rules_engine.apply_all_tax_rules(receipt, transaction)
@@ -0,0 +1,547 @@
+import base64
+import logging
+import os
+from datetime import datetime
+from typing import Any, Dict
+
+import aiofiles
+import groq
+import PyPDF2
+
+from config import settings
+
+logger = logging.getLogger(__name__)
+
+
+class DocumentProcessor:
+    def __init__(self):
+        """Create the Groq client and select the model used for every request."""
+        # The API key is read from the project settings object.
+        self.client = groq.Groq(api_key=settings.GROQ_API_KEY)
+        self.model = "meta-llama/llama-4-scout-17b-16e-instruct"  # Vision model
+
+    async def process_file(self, file_path: str, file_type: str) -> Dict[str, Any]:
+        """Process uploaded file and extract receipt data"""
+        try:
+            if file_type.lower() in ["jpg", "jpeg", "png", "gif", "bmp"]:
+                return await self._process_image(file_path)
+            elif file_type.lower() == "pdf":
+                return await self._process_pdf(file_path)
+            else:
+                raise ValueError(f"Unsupported file type: {file_type}")
+        except Exception as e:
+            return {"error": str(e)}
+
+    async def _process_image(self, image_path: str) -> Dict[str, Any]:
+        """Extract data from image using Groq vision"""
+        try:
+            # Encode image to base64
+            base64_image = self._encode_image(image_path)
+
+            # Create Groq vision prompt
+            prompt = """
+            Analyze this receipt image and extract the following information in JSON format:
+            {
+                "vendor": "Store/company name",
+                "description": "Detailed description of items/services purchased",
+                "total_amount": 0.00,
+                "tax_amount": 0.00,
+                "date": "YYYY-MM-DD",
+                "category": "Food/Transport/Office/Other",
+                "confidence": 0.95,
+                "currency": "USD"
+            }
+            
+            Rules:
+            - Extract vendor name as it appears on receipt
+            - Extract description of items/services purchased (e.g., "Coffee and sandwich", "Gasoline", "Office supplies")
+            - Total amount should be the final total including tax
+            - Tax amount is separate tax line if available
+            - Date should be the date on the receipt
+            - Categorize based on vendor type (Starbucks=Food, Shell=Transport, etc.)
+            - Confidence score 0-1 based on how clear the receipt is
+            - Currency should be the currency used on the receipt (e.g., "USD", "EUR")
+
+            Return only valid JSON.
+            """
+
+            # Call Groq vision API with correct format
+            response = self.client.chat.completions.create(
+                messages=[
+                    {
+                        "role": "user",
+                        "content": [
+                            {"type": "text", "text": prompt},
+                            {
+                                "type": "image_url",
+                                "image_url": {
+                                    "url": f"data:image/jpeg;base64,{base64_image}",
+                                },
+                            },
+                        ],
+                    }
+                ],
+                model=self.model,
+                max_tokens=500,
+                temperature=0.1,
+            )
+
+            # Parse response
+            result_text = response.choices[0].message.content.strip()
+            return self._parse_extraction_result(result_text)
+
+        except Exception as e:
+            return {"error": f"Image processing error: {str(e)}"}
+
+    def _encode_image(self, image_path: str) -> str:
+        """Encode image to base64 string"""
+        with open(image_path, "rb") as image_file:
+            return base64.b64encode(image_file.read()).decode("utf-8")
+
+    async def _process_pdf(self, pdf_path: str) -> Dict[str, Any]:
+        """Extract data from PDF by converting to image first"""
+        try:
+            # For now, extract text from PDF and process as text
+            text_content = self._extract_text_from_pdf(pdf_path)
+            return self._process_text_content(text_content)
+
+        except Exception as e:
+            return {"error": f"PDF processing error: {str(e)}"}
+
+    def _extract_text_from_pdf(self, pdf_path: str) -> str:
+        """Extract text from PDF"""
+        try:
+            with open(pdf_path, "rb") as file:
+                pdf_reader = PyPDF2.PdfReader(file)
+                text = ""
+                for page in pdf_reader.pages:
+                    text += page.extract_text() + "\n"
+                return text
+        except Exception:
+            return ""
+
+    def _process_text_content(self, text_content: str) -> Dict[str, Any]:
+        """Process text content using Groq (fallback for PDFs)"""
+        try:
+            prompt = f"""
+            Analyze this receipt text and extract the following information in JSON format:
+            
+            Receipt Text:
+            {text_content}
+            
+            Extract:
+            {{
+                "vendor": "Store/company name",
+                "description": "Detailed description of items/services purchased",
+                "total_amount": 0.00,
+                "tax_amount": 0.00,
+                "date": "YYYY-MM-DD",
+                "category": "Food/Transport/Office/Other",
+                "confidence": 0.95,
+                "currency": "USD"
+            }}
+            
+            Rules:
+            - Extract vendor name as it appears on receipt
+            - Extract description of items/services purchased (e.g., "Coffee and sandwich", "Gasoline", "Office supplies")
+            - Total amount should be the final total including tax
+            - Tax amount is separate tax line if available
+            - Date should be the date on the receipt
+            - Categorize based on vendor type
+            - Confidence score 0-1 based on clarity
+            - Currency should be the currency used on the receipt (e.g., "USD", "EUR")
+            
+            Return only valid JSON.
+            """
+
+            response = self.client.chat.completions.create(
+                model=self.model,
+                messages=[{"role": "user", "content": prompt}],
+                max_tokens=500,
+                temperature=0.1,
+            )
+
+            result_text = response.choices[0].message.content.strip()
+            return self._parse_extraction_result(result_text)
+
+        except Exception as e:
+            return {"error": f"Text processing error: {str(e)}"}
+
+    def _parse_extraction_result(self, result_text: str) -> Dict[str, Any]:
+        """Parse Groq response and extract JSON data"""
+        try:
+            # Clean up response and extract JSON
+            import json
+            import re
+
+            # Find JSON in response - try multiple patterns
+            json_match = re.search(r"\{.*\}", result_text, re.DOTALL)
+            if json_match:
+                json_str = json_match.group()
+
+                # Clean up common JSON issues
+                json_str = re.sub(
+                    r",\s*([}\]])", r"\1", json_str
+                )  # Remove trailing commas
+                json_str = re.sub(
+                    r"([{,])\s*([a-zA-Z_][a-zA-Z0-9_]*)\s*:", r'\1"\2":', json_str
+                )  # Quote unquoted keys
+
+                try:
+                    data = json.loads(json_str)
+                except json.JSONDecodeError as e:
+                    # Try to fix common JSON issues
+                    logger.warning(f"Initial JSON parsing failed: {e}")
+
+                    # Try to extract individual fields using regex
+                    vendor_match = re.search(r'"vendor"\s*:\s*"([^"]*)"', json_str)
+                    description_match = re.search(
+                        r'"description"\s*:\s*"([^"]*)"', json_str
+                    )
+                    total_amount_match = re.search(
+                        r'"total_amount"\s*:\s*([0-9.]+)', json_str
+                    )
+                    tax_amount_match = re.search(
+                        r'"tax_amount"\s*:\s*([0-9.]+)', json_str
+                    )
+                    date_match = re.search(r'"date"\s*:\s*"([^"]*)"', json_str)
+                    category_match = re.search(r'"category"\s*:\s*"([^"]*)"', json_str)
+                    confidence_match = re.search(
+                        r'"confidence"\s*:\s*([0-9.]+)', json_str
+                    )
+                    currency_match = re.search(
+                        r'"currency"\s*:\s*"([^"]*)"', json_str
+                    )
+
+                    data = {
+                        "vendor": vendor_match.group(1) if vendor_match else "",
+                        "description": description_match.group(1)
+                        if description_match
+                        else "",
+                        "total_amount": float(total_amount_match.group(1))
+                        if total_amount_match
+                        else 0.0,
+                        "tax_amount": float(tax_amount_match.group(1))
+                        if tax_amount_match
+                        else 0.0,
+                        "date": date_match.group(1) if date_match else "",
+                        "category": category_match.group(1)
+                        if category_match
+                        else "Other",
+                        "confidence": float(confidence_match.group(1))
+                        if confidence_match
+                        else 0.5,
+                        "currency": currency_match.group(1) if currency_match else "CAD"
+                    }
+
+                # Validate and clean data
+                return {
+                    "vendor": str(data.get("vendor", "")).strip(),
+                    "description": str(data.get("description", "")).strip(),
+                    "total_amount": float(data.get("total_amount", 0)),
+                    "tax_amount": float(data.get("tax_amount", 0)),
+                    "date": str(data.get("date", "")).strip(),
+                    "category": str(data.get("category", "Other")).strip(),
+                    "confidence": float(data.get("confidence", 0.5)),
+                    "extraction_success": True,
+                    "currency": data.get("currency", "CAD").strip(),
+                }
+            else:
+                # Try to extract fields from plain text
+                logger.warning("No JSON found in response, attempting text extraction")
+                return self._extract_from_plain_text(result_text)
+
+        except Exception as e:
+            logger.error(f"JSON parsing error: {str(e)}")
+            return {
+                "error": f"JSON parsing error: {str(e)}",
+                "extraction_success": False,
+            }
+
+    def _extract_from_plain_text(self, text: str) -> Dict[str, Any]:
+        """Extract receipt data from plain text when JSON parsing fails"""
+        try:
+            import re
+
+            # Extract vendor (look for common patterns)
+            vendor_patterns = [
+                r"(?:vendor|store|merchant|company)\s*[:\-]?\s*([A-Za-z0-9\s&.,]+)",
+                r"([A-Z][A-Za-z0-9\s&.,]{3,30})",  # Capitalized words
+            ]
+
+            vendor = ""
+            for pattern in vendor_patterns:
+                match = re.search(pattern, text, re.IGNORECASE)
+                if match:
+                    vendor = match.group(1).strip()
+                    break
+
+            # Extract amount (look for currency patterns)
+            amount_patterns = [
+                r"\$?\s*([0-9,]+\.?[0-9]*)",
+                r"(?:total|amount|sum)\s*[:\-]?\s*\$?\s*([0-9,]+\.?[0-9]*)",
+            ]
+
+            total_amount = 0.0
+            for pattern in amount_patterns:
+                match = re.search(pattern, text, re.IGNORECASE)
+                if match:
+                    try:
+                        total_amount = float(match.group(1).replace(",", ""))
+                        break
+                    except ValueError:
+                        continue
+
+            # Extract date
+            date_patterns = [
+                r"(\d{4}-\d{2}-\d{2})",
+                r"(\d{1,2}/\d{1,2}/\d{2,4})",
+                r"(Jan|Feb|Mar|Apr|May|Jun|Jul|Aug|Sep|Oct|Nov|Dec)\s+\d{1,2},?\s+\d{4}",
+            ]
+
+            date = ""
+            for pattern in date_patterns:
+                match = re.search(pattern, text, re.IGNORECASE)
+                if match:
+                    date = match.group(0)
+                    break
+
+            return {
+                "vendor": vendor or "Unknown",
+                "total_amount": total_amount,
+                "tax_amount": 0.0,
+                "date": date or "",
+                "category": "Other",
+                "confidence": 0.3,  # Low confidence for text extraction
+                "extraction_success": True,
+            }
+
+        except Exception as e:
+            logger.error(f"Text extraction error: {str(e)}")
+            return {
+                "vendor": "Unknown",
+                "total_amount": 0.0,
+                "tax_amount": 0.0,
+                "date": "",
+                "category": "Other",
+                "confidence": 0.1,
+                "extraction_success": False,
+                "error": f"Text extraction failed: {str(e)}",
+            }
+
+    async def save_uploaded_file(self, file_content: bytes, filename: str) -> str:
+        """Save uploaded file to temporary storage"""
+        try:
+            # Create uploads directory if it doesn't exist
+            upload_dir = "uploads"
+            os.makedirs(upload_dir, exist_ok=True)
+
+            # Generate unique filename
+            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+            safe_filename = f"{timestamp}_{filename.replace(' ', '_')}"
+            file_path = os.path.join(upload_dir, safe_filename)
+
+            # Save file
+            async with aiofiles.open(file_path, "wb") as f:
+                await f.write(file_content)
+
+            return file_path
+
+        except Exception as e:
+            raise Exception(f"Failed to save file: {str(e)}")
+
+    async def extract_transactions_from_image(self, image_path: str) -> Dict[str, Any]:
+        """Extract multiple transactions from an image (bank statement, credit card statement, etc.)"""
+        try:
+            # Encode image to base64
+            base64_image = self._encode_image(image_path)
+
+            # Create Groq vision prompt for transaction extraction
+            prompt = """
+            Analyze this financial document image (bank statement, credit card statement, etc.) and extract ALL transactions in JSON format.
+            
+            Look for transaction lists, payment records, or any financial entries that show:
+            - Date
+            - Amount (positive or negative)
+            - Vendor/Description/Payee name
+            - Any additional notes or memo
+            
+            Return the transactions as a JSON array:
+            {
+                "extraction_success": true,
+                "transactions": [
+                    {
+                        "date": "YYYY-MM-DD",
+                        "amount": 0.00,
+                        "vendor": "Vendor name",
+                        "memo": "Additional notes"
+                    },
+                    {
+                        "date": "YYYY-MM-DD", 
+                        "amount": -0.00,
+                        "vendor": "Another vendor",
+                        "memo": "Payment or charge description"
+                    }
+                ]
+            }
+            
+            Rules:
+            - Extract ALL visible transactions
+            - Include both positive (credits) and negative (debits) amounts
+            - Use the actual date format from the document
+            - Vendor should be the merchant/payee name
+            - Memo can include transaction type, reference numbers, etc.
+            - If no transactions found, return empty array but set extraction_success to true
+            
+            Return only valid JSON.
+            """
+
+            # Call Groq vision API
+            response = self.client.chat.completions.create(
+                messages=[
+                    {
+                        "role": "user",
+                        "content": [
+                            {"type": "text", "text": prompt},
+                            {
+                                "type": "image_url",
+                                "image_url": {
+                                    "url": f"data:image/jpeg;base64,{base64_image}",
+                                },
+                            },
+                        ],
+                    }
+                ],
+                model=self.model,
+                max_tokens=2000,  # Higher token limit for multiple transactions
+                temperature=0.1,
+            )
+
+            # Parse response
+            result_text = response.choices[0].message.content.strip()
+            return self._parse_transaction_extraction_result(result_text)
+
+        except Exception as e:
+            return {
+                "extraction_success": False,
+                "error": f"Transaction extraction error: {str(e)}",
+                "transactions": [],
+            }
+
+    def _parse_transaction_extraction_result(self, result_text: str) -> Dict[str, Any]:
+        """Parse Groq response for transaction extraction"""
+        try:
+            import json
+            import re
+
+            # Find the first '{' and last '}'
+            start = result_text.find("{")
+            end = result_text.rfind("}")
+            if start == -1 or end == -1 or end <= start:
+                return {
+                    "extraction_success": False,
+                    "error": "Could not find JSON object in AI response",
+                    "transactions": [],
+                }
+            json_str = result_text[start : end + 1]
+
+            # Remove trailing commas before } or ]
+            json_str = re.sub(r",\s*([}\]])", r"\1", json_str)
+
+            try:
+                data = json.loads(json_str)
+            except Exception as e:
+                import logging
+
+                logging.error(f"JSON parsing error: {str(e)}")
+                logging.error(f"Offending JSON string:\n{json_str}")
+                return {
+                    "extraction_success": False,
+                    "error": f"JSON parsing error: {str(e)}",
+                    "transactions": [],
+                }
+
+            # Validate and clean data
+            transactions = data.get("transactions", [])
+            cleaned_transactions = []
+            for txn in transactions:
+                try:
+                    cleaned_txn = {
+                        "date": str(txn.get("date", "")).strip(),
+                        "amount": float(
+                            str(txn.get("amount", 0)).replace("$", "").replace(",", "")
+                        ),
+                        "vendor": str(txn.get("vendor", "")).strip(),
+                        "memo": str(txn.get("memo", "")).strip(),
+                    }
+                    cleaned_transactions.append(cleaned_txn)
+                except Exception:
+                    continue
+            return {
+                "extraction_success": data.get("extraction_success", True),
+                "transactions": cleaned_transactions,
+                "total_transactions": len(cleaned_transactions),
+            }
+        except Exception as e:
+            import logging
+
+            logging.error(f"JSON parsing error (outer): {str(e)}")
+            return {
+                "extraction_success": False,
+                "error": f"JSON parsing error: {str(e)}",
+                "transactions": [],
+            }
+
+    def _parse_date_to_iso(self, date_str: str) -> str:
+        """Parse various date formats and convert to YYYY-MM-DD"""
+        try:
+            import re
+            from datetime import datetime
+
+            date_str = date_str.strip().upper()
+
+            # Handle formats like "MAY 22", "JUN 01", "MAY 22, 2024"
+            month_pattern = r"(JAN|FEB|MAR|APR|MAY|JUN|JUL|AUG|SEP|OCT|NOV|DEC)\s+(\d{1,2})(?:,\s*(\d{4}))?"
+            match = re.match(month_pattern, date_str)
+
+            if match:
+                month_abbr, day, year = match.groups()
+                month_map = {
+                    "JAN": 1,
+                    "FEB": 2,
+                    "MAR": 3,
+                    "APR": 4,
+                    "MAY": 5,
+                    "JUN": 6,
+                    "JUL": 7,
+                    "AUG": 8,
+                    "SEP": 9,
+                    "OCT": 10,
+                    "NOV": 11,
+                    "DEC": 12,
+                }
+
+                month = month_map[month_abbr]
+                day = int(day)
+                year = int(year) if year else datetime.now().year
+
+                # Handle 2-digit years
+                if year < 100:
+                    year += 2000
+
+                return f"{year:04d}-{month:02d}-{day:02d}"
+
+            # Handle YYYY-MM-DD format
+            if re.match(r"\d{4}-\d{2}-\d{2}", date_str):
+                return date_str
+
+            # Handle MM/DD/YYYY format
+            if re.match(r"\d{1,2}/\d{1,2}/\d{4}", date_str):
+                return datetime.strptime(date_str, "%m/%d/%Y").strftime("%Y-%m-%d")
+
+            # Handle MM/DD/YY format
+            if re.match(r"\d{1,2}/\d{1,2}/\d{2}", date_str):
+                return datetime.strptime(date_str, "%m/%d/%y").strftime("%Y-%m-%d")
+
+            return None
+
+        except Exception:
+            return None
@@ -0,0 +1,76 @@
+import json
+import os
+from dataclasses import dataclass
+from datetime import datetime, timedelta
+from typing import List
+
+
+@dataclass
+class FeedbackLog:
+    transaction_id: str
+    original_match: str
+    correction: str
+    reason: str
+    timestamp: datetime
+    user_id: str
+
+
+class FeedbackLogger:
+    def __init__(self, log_file: str = "feedback_logs.json"):
+        self.log_file = log_file
+        self.logs: List[FeedbackLog] = self._load_logs()
+
+    def _load_logs(self) -> List[FeedbackLog]:
+        if not os.path.exists(self.log_file):
+            return []
+
+        try:
+            with open(self.log_file, "r") as f:
+                data = json.load(f)
+                return [FeedbackLog(**log) for log in data]
+        except Exception:
+            return []
+
+    def _save_logs(self):
+        with open(self.log_file, "w") as f:
+            json.dump(
+                [
+                    {
+                        "transaction_id": log.transaction_id,
+                        "original_match": log.original_match,
+                        "correction": log.correction,
+                        "reason": log.reason,
+                        "timestamp": log.timestamp.isoformat(),
+                        "user_id": log.user_id,
+                    }
+                    for log in self.logs
+                ],
+                f,
+                indent=2,
+            )
+
+    def log_override(
+        self,
+        transaction_id: str,
+        original_match: str,
+        correction: str,
+        reason: str,
+        user_id: str,
+    ):
+        log = FeedbackLog(
+            transaction_id=transaction_id,
+            original_match=original_match,
+            correction=correction,
+            reason=reason,
+            timestamp=datetime.now(),
+            user_id=user_id,
+        )
+        self.logs.append(log)
+        self._save_logs()
+
+    def get_logs_by_transaction(self, transaction_id: str) -> List[FeedbackLog]:
+        return [log for log in self.logs if log.transaction_id == transaction_id]
+
+    def get_recent_logs(self, days: int = 30) -> List[FeedbackLog]:
+        cutoff = datetime.now() - timedelta(days=days)
+        return [log for log in self.logs if log.timestamp > cutoff]
@@ -0,0 +1,89 @@
+from typing import Any, Dict, List
+
+from services.ai_matcher import AIMatcher
+from services.ai_rules import AIRulesEngine
+from services.feedback_logger import FeedbackLogger
+from schemas import Match, Receipt, Transaction
+
+
+class MatchingEngine:
+    def __init__(self):
+        self.ai_matcher = AIMatcher()
+        self.rules_engine = AIRulesEngine()
+        self.feedback_logger = FeedbackLogger()
+
+    def process_matching(
+        self, receipts: List[Receipt], transactions: List[Transaction]
+    ) -> List[Match]:
+        # Get AI matches
+        ai_matches = self.ai_matcher.match_receipts_to_transactions(
+            receipts, transactions
+        )
+
+        # Apply rules and enhance matches
+        enhanced_matches = []
+        for match in ai_matches:
+            enhanced_match = self._enhance_match_with_rules(match)
+            enhanced_matches.append(enhanced_match)
+
+        return enhanced_matches
+
+    def _enhance_match_with_rules(self, match: Match) -> Match:
+        rule_results = self.rules_engine.apply_rules(match.receipt, match.transaction)
+
+        # Apply confidence boost from rules
+        if rule_results["confidence_boost"] > 0:
+            match.confidence_score = min(
+                1.0, match.confidence_score + rule_results["confidence_boost"]
+            )
+
+        # Auto-approve if rules say so
+        if rule_results["auto_approve"]:
+            match.confidence_score = 1.0
+            match.match_reason += " (Auto-approved by rules)"
+
+        # Add tax analysis to match
+        if rule_results.get("tax_analysis"):
+            match.tax_analysis = rule_results["tax_analysis"]
+
+        return match
+
+    def approve_match(self, match: Match, user_id: str):
+        # Log the approval
+        self.feedback_logger.log_override(
+            transaction_id=match.transaction.id,
+            original_match=f"AI Score: {match.confidence_score}",
+            correction="Approved",
+            reason="User approved match",
+            user_id=user_id,
+        )
+
+    def reject_match(self, match: Match, reason: str, user_id: str):
+        # Log the rejection
+        self.feedback_logger.log_override(
+            transaction_id=match.transaction.id,
+            original_match=f"AI Score: {match.confidence_score}",
+            correction="Rejected",
+            reason=reason,
+            user_id=user_id,
+        )
+
+    def get_matching_stats(self, matches: List[Match]) -> Dict[str, Any]:
+        if not matches:
+            return {
+                "total": 0,
+                "high_confidence": 0,
+                "low_confidence": 0,
+                "avg_score": 0,
+            }
+
+        high_confidence = len([m for m in matches if m.confidence_score >= 0.8])
+        low_confidence = len([m for m in matches if m.confidence_score < 0.8])
+        avg_score = sum(m.confidence_score for m in matches) / len(matches)
+
+        return {
+            "total": len(matches),
+            "high_confidence": high_confidence,
+            "low_confidence": low_confidence,
+            "avg_score": round(avg_score, 3),
+        }
@@ -0,0 +1,276 @@
+import logging
+from typing import Any, Dict, Optional
+
+from schemas import Address, Asset, Receipt, Transaction
+
+logger = logging.getLogger(__name__)
+
+
+class TaxRulesEngine:
+    """Engine to handle tax calculations based on the four tax rules"""
+
+    # Provincial tax rates (simplified - in production, use a tax rate API)
+    PROVINCIAL_TAX_RATES = {
+        "ON": 0.13,  # Ontario HST
+        "QC": 0.14975,  # Quebec QST
+        "BC": 0.12,  # British Columbia
+        "AB": 0.05,  # Alberta
+        "SK": 0.11,  # Saskatchewan
+        "MB": 0.12,  # Manitoba
+        "NS": 0.15,  # Nova Scotia
+        "NB": 0.15,  # New Brunswick
+        "NL": 0.15,  # Newfoundland and Labrador
+        "PE": 0.15,  # Prince Edward Island
+        "NT": 0.05,  # Northwest Territories
+        "NU": 0.05,  # Nunavut
+        "YT": 0.05,  # Yukon
+    }
+
+    def __init__(self):
+        self.logger = logging.getLogger(__name__)
+
+    def apply_sales_tax_rule(self, receipt: Receipt) -> Dict[str, Any]:
+        """
+        Sales Tax Rule: Apply correct sales tax based on billing vs shipping addresses
+        """
+        try:
+            # Determine which address to use for tax calculation
+            tax_address = self._get_tax_address(receipt)
+
+            if not tax_address:
+                return {
+                    "success": False,
+                    "error": "No valid address found for tax calculation",
+                    "calculated_tax": 0.0,
+                    "tax_rate": 0.0,
+                }
+
+            # Get tax rate for the province
+            tax_rate = self.PROVINCIAL_TAX_RATES.get(tax_address.province, 0.0)
+
+            # Calculate tax amount
+            calculated_tax = receipt.amount * tax_rate
+
+            return {
+                "success": True,
+                "calculated_tax": calculated_tax,
+                "tax_rate": tax_rate,
+                "tax_address": tax_address.province,
+                "rule_applied": "Sales Tax Rule",
+            }
+
+        except Exception as e:
+            self.logger.error(f"Error applying sales tax rule: {str(e)}")
+            return {
+                "success": False,
+                "error": str(e),
+                "calculated_tax": 0.0,
+                "tax_rate": 0.0,
+            }
+
+    def _get_tax_address(self, receipt: Receipt) -> Optional[Address]:
+        """Determine which address to use for tax calculation"""
+        # Rule: Use shipping address if different from billing, otherwise use billing
+        if receipt.shipping_address and receipt.billing_address:
+            if self._addresses_different(
+                receipt.billing_address, receipt.shipping_address
+            ):
+                return receipt.shipping_address
+            else:
+                return receipt.billing_address
+        elif receipt.shipping_address:
+            return receipt.shipping_address
+        elif receipt.billing_address:
+            return receipt.billing_address
+        else:
+            return None
+
+    def _addresses_different(self, billing: Address, shipping: Address) -> bool:
+        """Check if billing and shipping addresses are different"""
+        return (
+            billing.province != shipping.province
+            or billing.city != shipping.city
+            or billing.postal_code != shipping.postal_code
+        )
+
+    def apply_fx_rule(
+        self, receipt: Receipt, transaction: Transaction
+    ) -> Dict[str, Any]:
+        """
+        Foreign Exchange Rule: Handle currency mismatches
+        """
+        try:
+            # Check for currency mismatch
+            if receipt.currency != transaction.currency:
+                fx_discrepancy = abs(receipt.amount - abs(transaction.amount))
+
+                return {
+                    "success": True,
+                    "fx_discrepancy": fx_discrepancy,
+                    "receipt_currency": receipt.currency,
+                    "transaction_currency": transaction.currency,
+                    "receipt_amount": receipt.amount,
+                    "transaction_amount": abs(transaction.amount),
+                    "requires_manual_review": True,
+                    "rule_applied": "Foreign Exchange Rule",
+                }
+            else:
+                return {
+                    "success": True,
+                    "fx_discrepancy": 0.0,
+                    "requires_manual_review": False,
+                    "rule_applied": "No FX Rule (same currency)",
+                }
+
+        except Exception as e:
+            self.logger.error(f"Error applying FX rule: {str(e)}")
+            return {
+                "success": False,
+                "error": str(e),
+                "fx_discrepancy": 0.0,
+                "requires_manual_review": False,
+            }
+
+    def calculate_straight_line_depreciation(
+        self, asset: Asset, year: int
+    ) -> Dict[str, Any]:
+        """
+        Straight-Line Depreciation for accounting purposes
+        """
+        try:
+            if year > asset.useful_life_years:
+                return {
+                    "success": False,
+                    "error": f"Year {year} exceeds useful life of {asset.useful_life_years} years",
+                    "depreciation": 0.0,
+                }
+
+            # Straight-line formula: (Cost - Residual Value) / Useful Life
+            annual_depreciation = (
+                asset.purchase_amount - asset.residual_value
+            ) / asset.useful_life_years
+
+            return {
+                "success": True,
+                "depreciation": annual_depreciation,
+                "book_value": asset.purchase_amount - (annual_depreciation * year),
+                "method": "Straight-Line",
+                "rule_applied": "Depreciation Rule (Accounting)",
+            }
+
+        except Exception as e:
+            self.logger.error(f"Error calculating straight-line depreciation: {str(e)}")
+            return {"success": False, "error": str(e), "depreciation": 0.0}
+
+    def calculate_cca_depreciation(self, asset: Asset, year: int) -> Dict[str, Any]:
+        """
+        CCA (Capital Cost Allowance) Depreciation for tax purposes
+        """
+        try:
+            if year < 1:
+                return {
+                    "success": False,
+                    "error": "Year must be at least 1",
+                    "depreciation": 0.0,
+                }
+
+            # CCA uses declining balance method
+            book_value = asset.purchase_amount
+            total_depreciation = 0.0
+
+            for current_year in range(1, year + 1):
+                # CCA is calculated on the declining balance
+                cca_amount = book_value * asset.cca_rate
+                book_value -= cca_amount
+                total_depreciation += cca_amount
+
+                # Stop if book value reaches residual value
+                if book_value <= asset.residual_value:
+                    break
+
+            return {
+                "success": True,
+                "depreciation": cca_amount,  # Current year depreciation
+                "total_depreciation": total_depreciation,
+                "book_value": max(book_value, asset.residual_value),
+                "method": "CCA Declining Balance",
+                "rule_applied": "Depreciation Rule (Tax)",
+            }
+
+        except Exception as e:
+            self.logger.error(f"Error calculating CCA depreciation: {str(e)}")
+            return {"success": False, "error": str(e), "depreciation": 0.0}
+
+    def apply_meals_entertainment_rule(self, receipt: Receipt) -> Dict[str, Any]:
+        """
+        Meals & Entertainment Tax Deduction Rule
+        """
+        try:
+            if not receipt.is_meals_entertainment:
+                return {
+                    "success": True,
+                    "tax_deduction": receipt.amount,
+                    "accounting_deduction": receipt.amount,
+                    "rule_applied": "No M&E Rule (not meals/entertainment)",
+                }
+
+            # For tax purposes: 50% deductible
+            tax_deduction = receipt.amount * 0.5
+
+            # For accounting purposes: 100% deductible
+            accounting_deduction = receipt.amount
+
+            # Sales tax is fully deductible for accounting
+            tax_on_meal = receipt.tax
+
+            return {
+                "success": True,
+                "tax_deduction": tax_deduction,
+                "accounting_deduction": accounting_deduction,
+                "tax_on_meal": tax_on_meal,
+                "rule_applied": "Meals & Entertainment Rule",
+            }
+
+        except Exception as e:
+            self.logger.error(f"Error applying meals & entertainment rule: {str(e)}")
+            return {
+                "success": False,
+                "error": str(e),
+                "tax_deduction": 0.0,
+                "accounting_deduction": 0.0,
+            }
+
+    def apply_all_tax_rules(
+        self, receipt: Receipt, transaction: Transaction = None
+    ) -> Dict[str, Any]:
+        """
+        Apply all tax rules to a receipt
+        """
+        results = {
+            "receipt_id": receipt.id,
+            "rules_applied": [],
+            "sales_tax": {},
+            "fx_analysis": {},
+            "meals_entertainment": {},
+        }
+
+        # Apply Sales Tax Rule
+        sales_tax_result = self.apply_sales_tax_rule(receipt)
+        results["sales_tax"] = sales_tax_result
+        if sales_tax_result["success"]:
+            results["rules_applied"].append("Sales Tax Rule")
+
+        # Apply FX Rule (if transaction provided)
+        if transaction:
+            fx_result = self.apply_fx_rule(receipt, transaction)
+            results["fx_analysis"] = fx_result
+            if fx_result["success"]:
+                results["rules_applied"].append("Foreign Exchange Rule")
+
+        # Apply Meals & Entertainment Rule
+        me_result = self.apply_meals_entertainment_rule(receipt)
+        results["meals_entertainment"] = me_result
+        if me_result["success"]:
+            results["rules_applied"].append("Meals & Entertainment Rule")
+
+        return results