diff --git a/config/categories.yaml b/config/categories.yaml
new file mode 100644
index 0000000..56efc6e
--- /dev/null
+++ b/config/categories.yaml
@@ -0,0 +1,138 @@
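+# Field semantics (how the code uses each key):
+#   description - human-readable summary; also injected into the LLM review prompt
+#   patterns    - indicative substrings, intended for the rule/calibration layers
+#   threshold   - minimum ML confidence to accept a label without LLM review
+#   priority    - processing precedence (1 = highest); reserved, not yet consumed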
"qwen3:1.7b" + temperature: 0.1 + max_tokens: 500 + timeout: 30 + retry_attempts: 3 + + openai: + base_url: "https://api.openai.com/v1" + api_key: "${OPENAI_API_KEY}" + calibration_model: "gpt-4o-mini" + classification_model: "gpt-4o-mini" + temperature: 0.1 + max_tokens: 500 + +email_providers: + gmail: + batch_size: 100 + microsoft: + batch_size: 100 + imap: + timeout: 30 + batch_size: 50 + +features: + text_features: + max_vocab_size: 10000 + ngram_range: [1, 2] + min_df: 2 + max_df: 0.95 + embedding_model: "all-MiniLM-L6-v2" + embedding_batch_size: 32 + +export: + format: "json" + include_confidence: true + create_report: true + output_dir: "results" + +logging: + level: "INFO" + file: "logs/email-sorter.log" + +cleanup: + delete_temp_files: true + delete_repo_after: false + temp_dir: ".email-sorter-tmp" diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..3c1a0ad --- /dev/null +++ b/requirements.txt @@ -0,0 +1,48 @@ +# Core dependencies +python-dotenv>=1.0.0 +pyyaml>=6.0 +pydantic>=2.0.0 + +# Email Providers +google-api-python-client>=2.100.0 +google-auth-httplib2>=0.1.1 +google-auth-oauthlib>=1.1.0 +msal>=1.24.0 +imapclient>=2.3.1 + +# Machine Learning +scikit-learn>=1.3.0 +lightgbm>=4.0.0 +pandas>=2.0.0 +numpy>=1.24.0 +sentence-transformers>=2.2.0 + +# LLM Integration +ollama>=0.1.0 +openai>=1.0.0 + +# Text Processing & Attachments +nltk>=3.8 +beautifulsoup4>=4.12.0 +lxml>=4.9.0 +PyPDF2>=3.0.0 +python-docx>=0.8.11 +openpyxl>=3.0.10 + +# Utilities +tqdm>=4.66.0 +click>=8.1.0 +rich>=13.0.0 +joblib>=1.3.0 +tenacity>=8.2.0 + +# Testing +pytest>=7.4.0 +pytest-cov>=4.1.0 +pytest-mock>=3.11.0 +faker>=19.0.0 + +# Development +black>=23.0.0 +isort>=5.12.0 +flake8>=6.0.0 diff --git a/setup.py b/setup.py new file mode 100644 index 0000000..bcb4ae4 --- /dev/null +++ b/setup.py @@ -0,0 +1,100 @@ +"""Setup configuration for email-sorter.""" +from setuptools import setup, find_packages +from pathlib import Path + +# Read README +readme_file = Path(__file__).parent / "README.md" +long_description = readme_file.read_text() if readme_file.exists() else "" + +setup( + name="email-sorter", + version="1.0.0", + description="Hybrid ML/LLM Email Classification System", + long_description=long_description, + long_description_content_type="text/markdown", + author="Your Name", + author_email="your.email@example.com", + url="https://github.com/yourusername/email-sorter", + license="MIT", + packages=find_packages(), + include_package_data=True, + python_requires=">=3.8", + install_requires=[ + # Core + "python-dotenv>=1.0.0", + "pyyaml>=6.0", + "pydantic>=2.0.0", + + # Email Providers + "google-api-python-client>=2.100.0", + "google-auth-httplib2>=0.1.1", + "google-auth-oauthlib>=1.1.0", + "msal>=1.24.0", + "imapclient>=2.3.1", + + # Machine Learning + "scikit-learn>=1.3.0", + "lightgbm>=4.0.0", + "pandas>=2.0.0", + "numpy>=1.24.0", + "sentence-transformers>=2.2.0", + + # LLM Integration + "ollama>=0.1.0", + "openai>=1.0.0", + + # Text Processing + "nltk>=3.8", + "beautifulsoup4>=4.12.0", + "lxml>=4.9.0", + + # Attachments + "PyPDF2>=3.0.0", + "python-docx>=0.8.11", + "openpyxl>=3.0.10", + + # CLI & Utilities + "click>=8.1.0", + "rich>=13.0.0", + "tqdm>=4.66.0", + "joblib>=1.3.0", + "tenacity>=8.2.0", + ], + extras_require={ + "dev": [ + "pytest>=7.4.0", + "pytest-cov>=4.1.0", + "pytest-mock>=3.11.0", + "black>=23.0.0", + "isort>=5.12.0", + "flake8>=6.0.0", + ], + "gmail": [ + "google-api-python-client>=2.100.0", + "google-auth-oauthlib>=1.1.0", + ], + "ollama": [ + 
"ollama>=0.1.0", + ], + "openai": [ + "openai>=1.0.0", + ], + }, + entry_points={ + "console_scripts": [ + "email-sorter=src.cli:cli", + ], + }, + classifiers=[ + "Development Status :: 3 - Alpha", + "Intended Audience :: Developers", + "License :: OSI Approved :: MIT License", + "Programming Language :: Python :: 3", + "Programming Language :: Python :: 3.8", + "Programming Language :: Python :: 3.9", + "Programming Language :: Python :: 3.10", + "Programming Language :: Python :: 3.11", + "Programming Language :: Python :: 3.12", + "Programming Language :: Python :: 3.13", + ], +) diff --git a/src/__init__.py b/src/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/__main__.py b/src/__main__.py new file mode 100644 index 0000000..abc6f80 --- /dev/null +++ b/src/__main__.py @@ -0,0 +1,5 @@ +"""Entry point for email-sorter module.""" +from src.cli import cli + +if __name__ == '__main__': + cli() diff --git a/src/adjustment/__init__.py b/src/adjustment/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/calibration/__init__.py b/src/calibration/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/classification/__init__.py b/src/classification/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/classification/adaptive_classifier.py b/src/classification/adaptive_classifier.py new file mode 100644 index 0000000..47274e6 --- /dev/null +++ b/src/classification/adaptive_classifier.py @@ -0,0 +1,294 @@ +""" +Adaptive classifier that orchestrates ML + LLM classification. + +Strategy: +1. Hard rules: Fast pattern matching -> instant classification (10% of emails) +2. ML classifier: LightGBM with confidence threshold (85% of emails) +3. LLM review: Low-confidence emails sent for LLM review (5% of emails) +4. Dynamic threshold adjustment: Learn from LLM feedback +""" +import logging +from typing import Dict, List, Any, Optional +from dataclasses import dataclass + +from src.email_providers.base import Email, ClassificationResult +from src.classification.feature_extractor import FeatureExtractor +from src.classification.ml_classifier import MLClassifier +from src.classification.llm_classifier import LLMClassifier + +logger = logging.getLogger(__name__) + + +@dataclass +class ClassificationStats: + """Track classification statistics.""" + total_emails: int = 0 + rule_matched: int = 0 + ml_classified: int = 0 + llm_classified: int = 0 + needs_review: int = 0 + + def accuracy_estimate(self) -> float: + """Estimate accuracy based on classification method distribution.""" + if self.total_emails == 0: + return 0.0 + + # Conservative estimate + rule_accuracy = 0.99 # Hard rules are very accurate + ml_accuracy = 0.92 # ML classifier baseline + llm_accuracy = 0.95 # LLM is very accurate + + weighted = ( + (self.rule_matched * rule_accuracy + + self.ml_classified * ml_accuracy + + self.llm_classified * llm_accuracy) / self.total_emails + ) + return weighted + + def __str__(self) -> str: + return ( + f"Stats: {self.total_emails} emails | " + f"Rules: {self.rule_matched} | " + f"ML: {self.ml_classified} | " + f"LLM: {self.llm_classified} | " + f"Est. Accuracy: {self.accuracy_estimate():.1%}" + ) + + +class AdaptiveClassifier: + """ + Hybrid classifier combining hard rules, ML, and LLM. + + This is the main classification orchestrator. 
+ """ + + def __init__( + self, + feature_extractor: FeatureExtractor, + ml_classifier: MLClassifier, + llm_classifier: Optional[LLMClassifier], + categories: Dict[str, Dict], + config: Dict[str, Any] + ): + """Initialize adaptive classifier.""" + self.feature_extractor = feature_extractor + self.ml_classifier = ml_classifier + self.llm_classifier = llm_classifier + self.categories = categories + self.config = config + + self.thresholds = self._init_thresholds() + self.stats = ClassificationStats() + + def _init_thresholds(self) -> Dict[str, float]: + """Initialize classification thresholds per category.""" + thresholds = {} + + for category, cat_config in self.categories.items(): + threshold = cat_config.get('threshold', 0.75) + thresholds[category] = threshold + + default = self.config.get('classification', {}).get('default_threshold', 0.75) + thresholds['default'] = default + + logger.info(f"Initialized thresholds: {thresholds}") + return thresholds + + def classify(self, email: Email) -> ClassificationResult: + """ + Classify an email using adaptive strategy. + + Process: + 1. Try hard rules first + 2. If no rule match: ML classification + 3. If low confidence: Queue for LLM + """ + self.stats.total_emails += 1 + + # Step 1: Try hard rules + rule_result = self._try_hard_rules(email) + if rule_result: + self.stats.rule_matched += 1 + return rule_result + + # Step 2: ML classification + try: + features = self.feature_extractor.extract(email) + ml_result = self.ml_classifier.predict(features.get('embedding')) + + if not ml_result or ml_result.get('error'): + logger.warning(f"ML classification error for {email.id}") + return ClassificationResult( + email_id=email.id, + category='unknown', + confidence=0.0, + method='error', + error='ML classification failed' + ) + + category = ml_result.get('category', 'unknown') + confidence = ml_result.get('confidence', 0.0) + + # Check if above threshold + threshold = self.thresholds.get(category, self.thresholds['default']) + + if confidence >= threshold: + # High confidence: Accept ML classification + self.stats.ml_classified += 1 + return ClassificationResult( + email_id=email.id, + category=category, + confidence=confidence, + method='ml', + probabilities=ml_result.get('probabilities', {}) + ) + else: + # Low confidence: Queue for LLM + logger.debug(f"Low confidence for {email.id}: {category} ({confidence:.2f})") + self.stats.needs_review += 1 + return ClassificationResult( + email_id=email.id, + category=category, + confidence=confidence, + method='ml', + needs_review=True, + probabilities=ml_result.get('probabilities', {}) + ) + + except Exception as e: + logger.error(f"Classification error for {email.id}: {e}") + return ClassificationResult( + email_id=email.id, + category='unknown', + confidence=0.0, + method='error', + error=str(e) + ) + + def classify_batch(self, emails: List[Email]) -> List[ClassificationResult]: + """Classify batch of emails.""" + results = [] + for email in emails: + result = self.classify(email) + results.append(result) + return results + + def classify_with_llm(self, ml_result: ClassificationResult, email: Email) -> ClassificationResult: + """ + Use LLM to review low-confidence classification. 
+    """
+
+    def __init__(
+        self,
+        feature_extractor: FeatureExtractor,
+        ml_classifier: MLClassifier,
+        llm_classifier: Optional[LLMClassifier],
+        categories: Dict[str, Dict],
+        config: Dict[str, Any]
+    ):
+        """Initialize adaptive classifier."""
+        self.feature_extractor = feature_extractor
+        self.ml_classifier = ml_classifier
+        self.llm_classifier = llm_classifier
+        self.categories = categories
+        self.config = config
+
+        self.thresholds = self._init_thresholds()
+        self.stats = ClassificationStats()
+
+    def _init_thresholds(self) -> Dict[str, float]:
+        """Initialize classification thresholds per category."""
+        thresholds = {}
+
+        for category, cat_config in self.categories.items():
+            threshold = cat_config.get('threshold', 0.75)
+            thresholds[category] = threshold
+
+        default = self.config.get('classification', {}).get('default_threshold', 0.75)
+        thresholds['default'] = default
+
+        logger.info(f"Initialized thresholds: {thresholds}")
+        return thresholds
+
+    def classify(self, email: Email) -> ClassificationResult:
+        """
+        Classify an email using the adaptive strategy.
+
+        Process:
+        1. Try hard rules first
+        2. If no rule match: ML classification
+        3. If low confidence: queue for LLM
+        """
+        self.stats.total_emails += 1
+
+        # Step 1: Try hard rules
+        rule_result = self._try_hard_rules(email)
+        if rule_result:
+            self.stats.rule_matched += 1
+            return rule_result
+
+        # Step 2: ML classification
+        try:
+            features = self.feature_extractor.extract(email)
+            ml_result = self.ml_classifier.predict(features.get('embedding'))
+
+            if not ml_result or ml_result.get('error'):
+                logger.warning(f"ML classification error for {email.id}")
+                return ClassificationResult(
+                    email_id=email.id,
+                    category='unknown',
+                    confidence=0.0,
+                    method='error',
+                    error='ML classification failed'
+                )
+
+            category = ml_result.get('category', 'unknown')
+            confidence = ml_result.get('confidence', 0.0)
+
+            # Check if above threshold
+            threshold = self.thresholds.get(category, self.thresholds['default'])
+
+            if confidence >= threshold:
+                # High confidence: accept ML classification
+                self.stats.ml_classified += 1
+                return ClassificationResult(
+                    email_id=email.id,
+                    category=category,
+                    confidence=confidence,
+                    method='ml',
+                    probabilities=ml_result.get('probabilities', {})
+                )
+            else:
+                # Low confidence: queue for LLM
+                logger.debug(f"Low confidence for {email.id}: {category} ({confidence:.2f})")
+                self.stats.needs_review += 1
+                return ClassificationResult(
+                    email_id=email.id,
+                    category=category,
+                    confidence=confidence,
+                    method='ml',
+                    needs_review=True,
+                    probabilities=ml_result.get('probabilities', {})
+                )
+
+        except Exception as e:
+            logger.error(f"Classification error for {email.id}: {e}")
+            return ClassificationResult(
+                email_id=email.id,
+                category='unknown',
+                confidence=0.0,
+                method='error',
+                error=str(e)
+            )
+
+    def classify_batch(self, emails: List[Email]) -> List[ClassificationResult]:
+        """Classify a batch of emails."""
+        results = []
+        for email in emails:
+            result = self.classify(email)
+            results.append(result)
+        return results
+
+    def classify_with_llm(self, ml_result: ClassificationResult, email: Email) -> ClassificationResult:
+        """
+        Use the LLM to review a low-confidence classification.
+
+        Args:
+            ml_result: Result from ML classifier
+            email: Original email
+
+        Returns:
+            Updated classification with LLM input
+        """
+        if not self.llm_classifier or not self.llm_classifier.llm_available:
+            logger.warning(f"LLM not available for {email.id}, keeping ML result")
+            return ml_result
+
+        try:
+            email_dict = {
+                'email_id': email.id,
+                'subject': email.subject,
+                'sender': email.sender,
+                'body_snippet': email.body_snippet,
+                'has_attachments': email.has_attachments,
+                'ml_prediction': {
+                    'category': ml_result.category,
+                    'confidence': ml_result.confidence
+                }
+            }
+
+            llm_result = self.llm_classifier.classify(email_dict)
+
+            self.stats.llm_classified += 1
+
+            return ClassificationResult(
+                email_id=email.id,
+                category=llm_result.get('category', ml_result.category),
+                confidence=llm_result.get('confidence', 0.8),
+                method='llm',
+                metadata={
+                    'llm_reasoning': llm_result.get('reasoning', ''),
+                    'ml_original': ml_result.category,
+                    'ml_confidence': ml_result.confidence
+                }
+            )
+
+        except Exception as e:
+            logger.error(f"LLM review failed for {email.id}: {e}")
+            # Fall back to ML result
+            return ml_result
+
+    def _try_hard_rules(self, email: Email) -> Optional[ClassificationResult]:
+        """Apply hard pattern-matching rules."""
+        subject = (email.subject or "").lower()
+        body = (email.body_snippet or "").lower()
+        combined = f"{subject} {body}"
+
+        # Auth emails - high priority
+        if any(p in combined for p in ['verification code', 'otp', 'reset password', 'confirm identity']):
+            return ClassificationResult(
+                email_id=email.id,
+                category='auth',
+                confidence=0.99,
+                method='rule'
+            )
+
+        # Finance - high priority
+        if email.sender_name and any(p in email.sender_name.lower() for p in ['bank', 'credit card', 'payment']):
+            if any(p in combined for p in ['statement', 'balance', 'account', 'invoice']):
+                return ClassificationResult(
+                    email_id=email.id,
+                    category='finance',
+                    confidence=0.98,
+                    method='rule'
+                )
+
+        # Invoices/Receipts - transactional
+        if any(p in combined for p in ['invoice #', 'receipt #', 'order #', 'tracking #']):
+            return ClassificationResult(
+                email_id=email.id,
+                category='transactional',
+                confidence=0.97,
+                method='rule'
+            )
+
+        # Obvious spam
+        if any(p in combined for p in ['unsubscribe', 'click here now', 'limited time offer']):
+            return ClassificationResult(
+                email_id=email.id,
+                category='junk',
+                confidence=0.96,
+                method='rule'
+            )
+
+        # Meeting/Calendar
+        if any(p in combined for p in ['meeting at', 'zoom link', 'teams meeting', 'calendar invite']):
+            return ClassificationResult(
+                email_id=email.id,
+                category='work',
+                confidence=0.95,
+                method='rule'
+            )
+
+        return None
+
+    def get_stats(self) -> ClassificationStats:
+        """Get classification statistics."""
+        return self.stats
+
+    def adjust_threshold(self, category: str, adjustment: float) -> None:
+        """Dynamically adjust a category's classification threshold."""
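+        # e.g. adjust_threshold('junk', +0.05) tightens 'junk' after repeated
+        # LLM disagreement; a negative adjustment loosens it again.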
+        current = self.thresholds.get(category, self.thresholds['default'])
+        new_threshold = max(
+            self.config['classification']['min_threshold'],
+            min(
+                self.config['classification']['max_threshold'],
+                current + adjustment
+            )
+        )
+        self.thresholds[category] = new_threshold
+        logger.debug(f"Adjusted threshold for {category}: {current:.2f} -> {new_threshold:.2f}")
diff --git a/src/classification/feature_extractor.py b/src/classification/feature_extractor.py
new file mode 100644
index 0000000..1284153
--- /dev/null
+++ b/src/classification/feature_extractor.py
@@ -0,0 +1,313 @@
+"""Feature extraction from emails for classification."""
+import re
+import logging
+from typing import Dict, List, Any, Optional, Tuple
+from datetime import datetime
+import numpy as np
+
+try:
+    import pandas as pd
+except ImportError:
+    pd = None
+
+try:
+    from sklearn.feature_extraction.text import TfidfVectorizer
+except ImportError:
+    TfidfVectorizer = None
+
+try:
+    from sentence_transformers import SentenceTransformer
+except ImportError:
+    SentenceTransformer = None
+
+from src.email_providers.base import Email
+
+logger = logging.getLogger(__name__)
+
+
+class FeatureExtractor:
+    """
+    Extract features from emails for classification.
+
+    Combines three feature types:
+    1. Semantic embeddings (384 dimensions)
+    2. Hard pattern detection (20+ boolean features)
+    3. Structural metadata (20+ categorical/numerical)
+    """
+
+    def __init__(self, config: Optional[Dict] = None):
+        """Initialize feature extractor."""
+        self.config = config or self._default_config()
+        self.embedder = None
+        self.text_vectorizer = None
+        self._initialize_embedder()
+        self._initialize_vectorizer()
+
+    def _default_config(self) -> Dict:
+        """Default configuration."""
+        return {
+            'embedding_model': 'all-MiniLM-L6-v2',
+            'embedding_batch_size': 32,
+            'text_features': {
+                'max_features': 10000,
+                'ngram_range': [1, 2],
+                'min_df': 2,
+                'max_df': 0.95,
+            }
+        }
+
+    def _initialize_embedder(self) -> None:
+        """Initialize sentence embedding model."""
+        if SentenceTransformer is None:
+            logger.warning("sentence-transformers not installed, embeddings will be unavailable")
+            self.embedder = None
+            return
+
+        try:
+            model_name = self.config.get('embedding_model', 'all-MiniLM-L6-v2')
+            logger.info(f"Loading embedding model: {model_name}")
+            self.embedder = SentenceTransformer(model_name)
+            logger.info(f"Embedder initialized ({self.embedder.get_sentence_embedding_dimension()} dims)")
+        except Exception as e:
+            logger.error(f"Failed to initialize embedder: {e}")
+            self.embedder = None
+
+    def _initialize_vectorizer(self) -> None:
+        """Initialize TF-IDF vectorizer."""
+        if TfidfVectorizer is None:
+            logger.warning("scikit-learn not installed, text vectorization unavailable")
+            self.text_vectorizer = None
+            return
+
+        try:
+            text_config = self.config.get('text_features', {})
+            self.text_vectorizer = TfidfVectorizer(
+                max_features=text_config.get('max_features', 10000),
+                ngram_range=tuple(text_config.get('ngram_range', [1, 2])),
+                min_df=text_config.get('min_df', 2),
+                max_df=text_config.get('max_df', 0.95),
+                sublinear_tf=True
+            )
+            logger.info("TF-IDF vectorizer initialized")
+        except Exception as e:
+            logger.error(f"Failed to initialize vectorizer: {e}")
+            self.text_vectorizer = None
+
+    def extract(self, email: Email) -> Dict[str, Any]:
+        """Extract all features from a single email."""
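+        # Selected keys in the returned dict (illustrative, not exhaustive):
+        #   'embedding'          -> np.ndarray of shape (384,)
+        #   'link_count'         -> int, count of http(s) URLs in the text
+        #   'sender_domain_type' -> 'freemail' | 'corporate' | 'noreply' | 'unknown'
+        #   'has_otp_pattern'    -> bool, a 4-6 digit code was detected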
+        features = {}
+
+        # Basic email content
+        features['subject'] = email.subject
+        features['body_snippet'] = email.body_snippet
+        features['full_body'] = email.body
+
+        # Structural features
+        features.update(self._extract_structural(email))
+
+        # Sender features
+        features.update(self._extract_sender(email))
+
+        # Pattern features
+        features.update(self._extract_patterns(email))
+
+        # Embedding (if available)
+        if self.embedder:
+            features['embedding'] = self._extract_embedding(email)
+        else:
+            logger.debug("Embedding model not available, using zeros")
+            features['embedding'] = np.zeros(384)  # Default MiniLM dimension
+
+        return features
+
+    def _extract_structural(self, email: Email) -> Dict[str, Any]:
+        """Extract structural/metadata features."""
+        features = {}
+
+        # Attachments
+        features['has_attachments'] = email.has_attachments
+        features['attachment_count'] = email.attachment_count
+        features['attachment_types'] = email.attachment_types
+
+        # Links and images
+        body = email.body or email.body_snippet or ""
+        subject = email.subject or ""
+        combined = f"{subject} {body}"
+
+        features['link_count'] = len(re.findall(r'https?://', combined))
+        features['image_count'] = len(re.findall(r'<img', combined, re.I))
+
+        # Length and reply features
+        features['body_length'] = len(body)
+        features['subject_length'] = len(subject)
+        features['has_reply_prefix'] = subject.lower().startswith(('re:', 'fw:', 'fwd:'))
+
+        # Temporal features: bucket the send hour into coarse periods
+        if email.date:
+            hour = email.date.hour
+            if 5 <= hour < 12:
+                features['time_of_day'] = 'morning'
+            elif 12 <= hour < 17:
+                features['time_of_day'] = 'afternoon'
+            elif 17 <= hour < 22:
+                features['time_of_day'] = 'evening'
+            else:
+                features['time_of_day'] = 'night'
+            features['day_of_week'] = email.date.strftime('%A').lower()
+        else:
+            features['time_of_day'] = 'unknown'
+            features['day_of_week'] = 'unknown'
+
+        return features
+
+    def _extract_sender(self, email: Email) -> Dict[str, Any]:
+        """Extract sender-based features."""
+        features = {}
+
+        sender = email.sender or ""
+        if '@' in sender:
+            # Take the part after '@'; strip a trailing '>' from "Name <a@b.com>" forms
+            domain = sender.split('@')[-1].strip('>').lower()
+            features['sender_domain'] = domain
+
+            # Classify domain type
+            freemail_domains = {'gmail.com', 'yahoo.com', 'hotmail.com', 'outlook.com', 'icloud.com', 'protonmail.com'}
+            noreply_patterns = ['noreply', 'no-reply', 'donotreply', 'no_reply']
+
+            if domain in freemail_domains:
+                features['sender_domain_type'] = 'freemail'
+            elif any(p in sender.lower() for p in noreply_patterns):
+                features['sender_domain_type'] = 'noreply'
+            else:
+                features['sender_domain_type'] = 'corporate'
+
+            features['is_noreply'] = any(p in sender.lower() for p in noreply_patterns)
+        else:
+            features['sender_domain'] = 'unknown'
+            features['sender_domain_type'] = 'unknown'
+            features['is_noreply'] = False
+
+        return features
+
+    def _extract_patterns(self, email: Email) -> Dict[str, Any]:
+        """Extract hard pattern-based features."""
+        features = {}
+
+        body = (email.body or email.body_snippet or "").lower()
+        subject = (email.subject or "").lower()
+        combined = f"{subject} {body}"
+
+        # Authentication patterns
+        features['has_otp_pattern'] = bool(re.search(r'\b\d{4,6}\b', combined))
+        features['has_verification'] = 'verification' in combined
+        features['has_reset_password'] = 'reset password' in combined
+
+        # Transactional patterns
+        features['has_invoice_pattern'] = bool(re.search(r'(invoice|bill|receipt)\s*#?\d+', combined, re.I))
+        features['has_price'] = bool(re.search(r'\$[\d,]+\.?\d*', combined))
+        features['has_order_number'] = bool(re.search(r'order\s*#?\d+', combined, re.I))
+        features['has_tracking'] = bool(re.search(r'tracking\s*(number|#)', combined, re.I))
+
+        # Marketing patterns
+        features['has_unsubscribe'] = 'unsubscribe' in combined
+        features['has_view_in_browser'] = 'view in browser' in combined
+        features['has_promotional'] = any(p in combined for p in ['limited time', 'special offer', 'sale', 'discount'])
+
+        # Meeting patterns
+        features['has_meeting'] = bool(re.search(r'(meeting|call|zoom|teams|conference)', combined, re.I))
+        features['has_calendar'] = 'calendar' in combined
+
+        # Signature patterns
+        features['has_signature'] = bool(re.search(r'(regards|sincerely|best|cheers|thanks)', combined, re.I))
+
+        return features
+
+    def _extract_embedding(self, email: Email) -> np.ndarray:
+        """Generate a semantic embedding for the email."""
+        if not self.embedder:
+            return np.zeros(384)
+
+        try:
+            # Build structured text for embedding
+            text = self._build_embedding_text(email)
+            embedding = self.embedder.encode(text, convert_to_numpy=True)
+            return embedding
+        except Exception as e:
+            logger.error(f"Error generating embedding: {e}")
+            return np.zeros(384)
+
+    def _build_embedding_text(self, email: Email) -> str:
+        """Build structured text for embedding."""
+        # Collect basic patterns
+        patterns = self._extract_patterns(email)
+        structural = self._extract_structural(email)
+
+        # Build structured text with headers
+        text = f"""[EMAIL_METADATA]
+sender_type: {structural.get('sender_domain_type', 'unknown')}
+time_of_day: {structural.get('time_of_day', 'unknown')}
+has_attachments: {structural.get('has_attachments', False)}
+attachment_count: {structural.get('attachment_count', 0)}
+
+[DETECTED_PATTERNS]
+has_otp: {patterns.get('has_otp_pattern', False)}
+has_invoice: {patterns.get('has_invoice_pattern', False)}
+has_unsubscribe: {patterns.get('has_unsubscribe', False)}
+is_noreply: {structural.get('is_noreply', False)}
+has_meeting: {patterns.get('has_meeting', False)}
+
+[CONTENT]
+subject: {email.subject[:100]}
+body: {email.body_snippet[:300]}
+"""
+        return text
+
+    def extract_batch(self, emails: List[Email]) -> Optional[Any]:
+        """Extract features from a batch of emails."""
+        if not pd:
+            logger.error("pandas not available for batch extraction")
+            return None
+
+        try:
+            feature_dicts = []
+            for email in emails:
+                features = self.extract(email)
+                feature_dicts.append(features)
+
+            # Convert to DataFrame
+            df = pd.DataFrame(feature_dicts)
+            logger.info(f"Extracted features for {len(df)} emails ({df.shape[1]} features)")
+            return df
+
+        except Exception as e:
+            logger.error(f"Error in batch extraction: {e}")
+            return None
+
+    def fit_text_vectorizer(self, emails: List[Email]) -> bool:
+        """Fit the TF-IDF vectorizer on an email corpus."""
+        if not self.text_vectorizer:
+            logger.error("Text vectorizer not available")
+            return False
+
+        try:
+            texts = [f"{e.subject} {e.body_snippet}" for e in emails]
+            self.text_vectorizer.fit(texts)
+            logger.info(f"Fitted TF-IDF vectorizer with {len(self.text_vectorizer.vocabulary_)} features")
+            return True
+        except Exception as e:
+            logger.error(f"Error fitting vectorizer: {e}")
+            return False
+
+    def get_feature_names(self) -> List[str]:
+        """Get list of all feature names."""
+        names = [
+            'has_attachments', 'attachment_count', 'link_count', 'image_count',
+            'body_length', 'subject_length', 'has_reply_prefix',
+            'time_of_day', 'day_of_week', 'sender_domain_type', 'is_noreply',
+            'has_otp_pattern', 'has_verification', 'has_reset_password',
+            'has_invoice_pattern', 'has_price', 'has_order_number', 'has_tracking',
+            'has_unsubscribe', 'has_view_in_browser', 'has_promotional',
+            'has_meeting', 'has_calendar', 'has_signature'
+        ]
+        return names
diff --git a/src/classification/llm_classifier.py b/src/classification/llm_classifier.py
new file mode 100644
index 0000000..93a395a
--- /dev/null
+++ b/src/classification/llm_classifier.py
@@ -0,0 +1,176 @@
+"""LLM-based email classifier."""
+import logging
+import json
+import re
+from typing import Dict, List, Any, Optional
+
+from src.llm.base import BaseLLMProvider
+
+logger = logging.getLogger(__name__)
+
+
+class LLMClassifier:
+    """
+    Email classifier using an LLM for uncertain cases.
+
+    Usage:
+    - Only called for emails with low ML confidence
+    - Batches emails for efficiency
+    - Gracefully degrades if the LLM is unavailable
+    """
+
+    def __init__(
+        self,
+        provider: BaseLLMProvider,
+        categories: Dict[str, Dict],
+        config: Dict[str, Any]
+    ):
+        """Initialize LLM classifier."""
+        self.provider = provider
+        self.categories = categories
+        self.config = config
+        self.llm_available = provider.is_available()
+
+        if not self.llm_available:
+            logger.warning("LLM provider not available, LLM classification will be disabled")
+
+        self.classification_prompt = self._load_prompt_template()
+
+    def _load_prompt_template(self) -> str:
+        """Load or create the classification prompt."""
+        # Try to load from file
+        try:
+            with open('prompts/classification.txt', 'r') as f:
+                return f.read()
+        except FileNotFoundError:
+            pass
+
+        # Default prompt
+        return """You are an expert email classifier. Analyze the email and classify it.
+
+CATEGORIES:
+{categories}
+
+EMAIL:
+Subject: {subject}
+From: {sender}
+Has Attachments: {has_attachments}
+Body (first 300 chars): {body_snippet}
+
+ML Prediction: {ml_prediction} (confidence: {ml_confidence:.2f})
+
+Respond with ONLY valid JSON (no markdown, no extra text):
+{{
+  "category": "category_name",
+  "confidence": 0.95,
+  "reasoning": "brief reason"
+}}
+"""
+
+    def classify(self, email: Dict[str, Any]) -> Dict[str, Any]:
+        """
+        Classify an email using the LLM.
+
+        Args:
+            email: Email data with subject, sender, body_snippet, ml_prediction
+
+        Returns:
+            Classification result with category, confidence, reasoning
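+
+        Example input (sketch):
+            {'subject': 'Your code is 123456', 'sender': 'noreply@example.com',
+             'body_snippet': '...', 'has_attachments': False,
+             'ml_prediction': {'category': 'auth', 'confidence': 0.55}}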
+        """
+        if not self.llm_available:
+            logger.warning("LLM not available, returning ML prediction")
+            return {
+                'category': email.get('ml_prediction', {}).get('category', 'unknown'),
+                'confidence': 0.5,
+                'reasoning': 'LLM not available, using ML prediction',
+                'method': 'ml_fallback'
+            }
+
+        try:
+            # Build prompt
+            categories_str = "\n".join([
+                f"- {name}: {info.get('description', 'N/A')}"
+                for name, info in self.categories.items()
+            ])
+
+            ml_pred = email.get('ml_prediction', {})
+
+            prompt = self.classification_prompt.format(
+                categories=categories_str,
+                subject=email.get('subject', 'N/A')[:100],
+                sender=email.get('sender', 'N/A')[:50],
+                has_attachments=email.get('has_attachments', False),
+                body_snippet=email.get('body_snippet', '')[:300],
+                ml_prediction=ml_pred.get('category', 'unknown'),
+                ml_confidence=ml_pred.get('confidence', 0.0)
+            )
+
+            logger.debug(f"LLM classifying: {email.get('subject', 'No subject')[:50]}")
+
+            # Get LLM response
+            response = self.provider.complete(
+                prompt,
+                temperature=self.config.get('llm', {}).get('temperature', 0.1),
+                max_tokens=self.config.get('llm', {}).get('max_tokens', 500)
+            )
+
+            # Parse response
+            result = self._parse_response(response)
+            result['method'] = 'llm'
+            return result
+
+        except Exception as e:
+            logger.error(f"LLM classification failed: {e}")
+            return {
+                'category': 'unknown',
+                'confidence': 0.5,
+                'reasoning': f'LLM error: {str(e)[:100]}',
+                'method': 'llm_error',
+                'error': True
+            }
+
+    def classify_batch(self, emails: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
+        """Classify a batch of emails (individually for now; can be optimized later)."""
+        results = []
+        for email in emails:
+            result = self.classify(email)
+            results.append(result)
+        return results
+
+    def _parse_response(self, response: str) -> Dict[str, Any]:
+        """Parse the LLM's JSON response."""
+        try:
+            # Try to extract a JSON block
+            json_match = re.search(r'\{.*\}', response, re.DOTALL)
+            if json_match:
+                json_str = json_match.group()
+                parsed = json.loads(json_str)
+
+                return {
+                    'category': parsed.get('category', 'unknown'),
+                    'confidence': float(parsed.get('confidence', 0.5)),
+                    'reasoning': parsed.get('reasoning', '')
+                }
+        except json.JSONDecodeError as e:
+            logger.debug(f"JSON parsing error: {e}")
+        except Exception as e:
+            logger.debug(f"Response parsing error: {e}")
+
+        # Fallback: no structured output could be parsed
+        logger.warning("Failed to parse LLM response, using fallback parsing")
+        logger.debug(f"Response was: {response[:200]}")
+
+        return {
+            'category': 'unknown',
+            'confidence': 0.5,
+            'reasoning': response[:100]
+        }
+
+    def get_status(self) -> Dict[str, Any]:
+        """Get classifier status."""
+        return {
+            'llm_available': self.llm_available,
+            'provider': self.provider.name if self.provider else 'none',
+            'categories': len(self.categories),
+            'status': 'ready' if self.llm_available else 'degraded'
+        }
diff --git a/src/classification/ml_classifier.py b/src/classification/ml_classifier.py
new file mode 100644
index 0000000..e2facc2
--- /dev/null
+++ b/src/classification/ml_classifier.py
@@ -0,0 +1,233 @@
+"""
+ML-based email classifier.
+
+MOCK STATUS: This module currently ships a mock Random Forest model for
+demonstration. It is NOT the production model: it is trained on synthetic
+data only and will NOT reach the targeted 94-96% accuracy. For production,
+retrain with LightGBM on the Enron dataset (or your own emails) with real
+tuning. Use this mock ONLY for framework testing and integration
+validation; do not run it against production data.
+"""
+import logging
+import pickle
+import warnings
+from typing import Dict, List, Any, Optional, Tuple
+from pathlib import Path
+
+import numpy as np
+
+logger = logging.getLogger(__name__)
+
+# Suppress warnings
+warnings.filterwarnings('ignore')
+
+
+class MLClassifier:
+    """
+    Wrapper for ML-based email classification.
+
+    MOCK IMPLEMENTATION: Uses a Random Forest on synthetic data.
+    Replace with a real LightGBM model trained on the Enron dataset.
+    """
+
+    def __init__(self, model_path: Optional[str] = None):
+        """Initialize ML classifier."""
+        self.model = None
+        self.categories = []
+        self.feature_names = []
+        self.is_mock = False
+        self.model_path = model_path or "src/models/pretrained/classifier.pkl"
+
+        # Try to load a pre-trained model
+        if model_path and Path(model_path).exists():
+            self._load_model(model_path)
+        else:
+            logger.warning("Pre-trained model not found, creating MOCK model for testing")
+            self._create_mock_model()
+
+    def _load_model(self, model_path: str) -> None:
+        """Load a pre-trained model from file."""
+        try:
+            logger.info(f"Loading ML model from: {model_path}")
+            with open(model_path, 'rb') as f:
+                model_data = pickle.load(f)
+
+            self.model = model_data.get('model')
+            self.categories = model_data.get('categories', [])
+            self.feature_names = model_data.get('feature_names', [])
+            self.is_mock = model_data.get('is_mock', False)
+
+            if self.is_mock:
+                logger.warning("USING MOCK ML MODEL - Not for production!")
+
+            logger.info(f"ML model loaded: {len(self.categories)} categories")
+
+        except Exception as e:
+            logger.error(f"Error loading model: {e}")
+            logger.warning("Falling back to MOCK model")
+            self._create_mock_model()
+
+    def _create_mock_model(self) -> None:
+        """Create a mock Random Forest model for testing."""
+        try:
+            from sklearn.ensemble import RandomForestClassifier
+        except ImportError:
+            logger.error("scikit-learn required for mock model")
+            self.model = None
+            return
+
+        logger.info("Creating MOCK Random Forest model for framework testing")
+        logger.warning("=" * 80)
+        logger.warning("MOCK MODEL WARNING")
+        logger.warning("=" * 80)
+        logger.warning("This is a MOCK model trained on synthetic data")
+        logger.warning("It will NOT provide accurate classifications")
+        logger.warning("Framework testing ONLY - do not use for production")
+        logger.warning("TODO: retrain with LightGBM on the Enron dataset")
+        logger.warning("=" * 80)
+
+        # Define categories
+        self.categories = [
+            'junk', 'transactional', 'auth', 'newsletters',
+            'social', 'automated', 'conversational', 'work',
+            'personal', 'finance', 'travel', 'unknown'
+        ]
+
+        # Create synthetic training data sized to match the 384-dim MiniLM
+        # embeddings that FeatureExtractor passes into predict()
+        n_samples = 500
+        n_features = 384
+
+        X_mock = np.random.rand(n_samples, n_features)
+        y_mock = np.random.randint(0, len(self.categories), n_samples)
+
+        # Train mock model
+        try:
+            self.model = RandomForestClassifier(
+                n_estimators=50,
+                max_depth=15,
+                random_state=42,
+                n_jobs=-1
+            )
+            self.model.fit(X_mock, y_mock)
+
+            self.feature_names = [f'feature_{i}' for i in range(n_features)]
+            self.is_mock = True
+
+            logger.info(f"Mock model created: {len(self.categories)} categories, {n_features} features")
+            logger.warning("REMEMBER: This mock model is for framework testing only!")
+
+        except Exception as e:
+            logger.error(f"Error creating mock model: {e}")
+            self.model = None
+
+    def predict(self, features: np.ndarray) -> Dict[str, Any]:
+        """
+        Predict category for email features.
+
+        Args:
+            features: Feature vector (numpy array)
+
+        Returns:
+            {
+                'category': str (predicted category),
+                'confidence': float (0-1),
+                'probabilities': Dict[category -> confidence],
+                'is_mock': bool (True if using mock model),
+                'warning': str (warning if using mock)
+            }
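+
+        Example (mock model, illustrative only):
+            >>> clf = MLClassifier()            # falls back to the mock model
+            >>> out = clf.predict(np.zeros(384))
+            >>> out['category'] in clf.categories
+            True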
+        """
+        if self.model is None:
+            logger.error("Model not loaded")
+            return {
+                'category': 'unknown',
+                'confidence': 0.0,
+                'probabilities': {c: 0.0 for c in self.categories},
+                'error': 'Model not available',
+                'is_mock': False
+            }
+
+        try:
+            # Ensure feature vector is correct shape
+            if len(features.shape) == 1:
+                features = features.reshape(1, -1)
+
+            # Get probabilities
+            probs = self.model.predict_proba(features)[0]
+            pred_class = np.argmax(probs)
+            category = self.categories[pred_class]
+            confidence = float(probs[pred_class])
+
+            # Build probabilities dict
+            prob_dict = {
+                self.categories[i]: float(probs[i])
+                for i in range(len(self.categories))
+            }
+
+            result = {
+                'category': category,
+                'confidence': confidence,
+                'probabilities': prob_dict,
+                'is_mock': self.is_mock
+            }
+
+            if self.is_mock:
+                result['warning'] = 'Using mock model - inaccurate for production'
+
+            return result
+
+        except Exception as e:
+            logger.error(f"Prediction error: {e}")
+            return {
+                'category': 'unknown',
+                'confidence': 0.0,
+                'probabilities': {c: 0.0 for c in self.categories},
+                'error': str(e),
+                'is_mock': self.is_mock
+            }
+
+    def predict_batch(self, features: np.ndarray) -> List[Dict[str, Any]]:
+        """Predict for a batch of feature vectors."""
+        return [self.predict(f if f.ndim > 1 else f.reshape(1, -1)) for f in features]
+
+    def save_model(self, output_path: str) -> bool:
+        """Save the current model to file."""
+        if self.model is None:
+            logger.error("No model to save")
+            return False
+
+        try:
+            Path(output_path).parent.mkdir(parents=True, exist_ok=True)
+
+            model_data = {
+                'model': self.model,
+                'categories': self.categories,
+                'feature_names': self.feature_names,
+                'is_mock': self.is_mock,
+                'warning': 'Mock model - for testing only' if self.is_mock else 'Production model'
+            }
+
+            with open(output_path, 'wb') as f:
+                pickle.dump(model_data, f)
+
+            logger.info(f"Model saved to: {output_path}")
+            return True
+
+        except Exception as e:
+            logger.error(f"Error saving model: {e}")
+            return False
+
+    def get_info(self) -> Dict[str, Any]:
+        """Get model information."""
+        return {
+            'is_loaded': self.model is not None,
+            'is_mock': self.is_mock,
+            'categories': self.categories,
+            'n_categories': len(self.categories),
+            'n_features': len(self.feature_names),
+            'feature_names': self.feature_names[:10],  # First 10 for brevity
+            'model_type': 'RandomForest' if self.is_mock else 'LightGBM (production)'
+        }
diff --git a/src/cli.py b/src/cli.py
new file mode 100644
index 0000000..de01391
--- /dev/null
+++ b/src/cli.py
@@ -0,0 +1,263 @@
+"""Command-line interface for email-sorter."""
+import logging
+import sys
+from pathlib import Path
+from typing import Optional
+
+import click
+
+from src.utils.config import load_config, load_categories
+from src.utils.logging import setup_logging
+from src.email_providers.base import MockProvider
+from src.email_providers.gmail import GmailProvider
+from src.email_providers.imap import IMAPProvider
+from src.classification.feature_extractor import FeatureExtractor
+from src.classification.ml_classifier import MLClassifier
+from src.classification.llm_classifier import LLMClassifier
+from src.classification.adaptive_classifier import AdaptiveClassifier
+from src.llm.ollama import OllamaProvider
+from src.llm.openai_compat import OpenAIProvider
+
+
+@click.group()
+def cli():
+    """Email Sorter - Hybrid ML/LLM Email Classification System.
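+
+    Example (mock run, no real mailbox or credentials needed):
+
+        email-sorter run --source mock --limit 100 --verbose
+    """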
+    pass
+
+
+@cli.command()
+@click.option('--source', type=click.Choice(['gmail', 'imap', 'mock']), default='mock',
+              help='Email provider')
+@click.option('--credentials', type=click.Path(exists=False),
+              help='Path to credentials file')
+@click.option('--output', type=click.Path(), default='results/',
+              help='Output directory')
+@click.option('--config', type=click.Path(exists=False), default='config/default_config.yaml',
+              help='Config file')
+@click.option('--limit', type=int, default=None,
+              help='Limit number of emails')
+@click.option('--llm-provider', type=click.Choice(['ollama', 'openai']), default='ollama',
+              help='LLM provider')
+@click.option('--dry-run', is_flag=True,
+              help='Do not sync results back')
+@click.option('--verbose', is_flag=True,
+              help='Verbose logging')
+def run(
+    source: str,
+    credentials: Optional[str],
+    output: str,
+    config: str,
+    limit: Optional[int],
+    llm_provider: str,
+    dry_run: bool,
+    verbose: bool
+):
+    """Run the email sorter pipeline."""
+
+    # Setup logging
+    log_level = 'DEBUG' if verbose else 'INFO'
+    setup_logging(level=log_level)
+    logger = logging.getLogger(__name__)
+
+    logger.info("=" * 80)
+    logger.info("EMAIL SORTER v1.0")
+    logger.info("=" * 80)
+
+    # Load config
+    logger.info(f"Loading config from: {config}")
+    cfg = load_config(config)
+    categories = load_categories()
+
+    # Setup email provider
+    logger.info(f"Setting up email provider: {source}")
+    if source == 'gmail':
+        provider = GmailProvider()
+        if not credentials:
+            logger.error("Gmail provider requires --credentials")
+            sys.exit(1)
+    elif source == 'imap':
+        provider = IMAPProvider()
+        if not credentials:
+            logger.error("IMAP provider requires --credentials")
+            sys.exit(1)
+    else:  # mock
+        logger.warning("Using MOCK provider for testing")
+        provider = MockProvider()
+        credentials = None
+
+    # Connect provider
+    creds_dict = {'credentials_path': credentials} if credentials else {}
+    if not provider.connect(creds_dict):
+        logger.error("Failed to connect to email provider")
+        sys.exit(1)
+
+    # Setup LLM provider
+    logger.info(f"Setting up LLM provider: {llm_provider}")
+    if llm_provider == 'ollama':
+        llm = OllamaProvider(
+            base_url=cfg.llm.ollama.base_url,
+            model=cfg.llm.ollama.classification_model,
+            temperature=cfg.llm.ollama.temperature,
+            max_tokens=cfg.llm.ollama.max_tokens
+        )
+    else:  # openai
+        llm = OpenAIProvider(
+            base_url=cfg.llm.openai.base_url,
+            model=cfg.llm.openai.classification_model,
+            temperature=cfg.llm.openai.temperature,
+            max_tokens=cfg.llm.openai.max_tokens
+        )
+
+    if not llm.is_available():
+        logger.warning(f"LLM provider ({llm_provider}) not available, running in degraded mode")
+
+    # Setup classifiers
+    logger.info("Setting up classifiers")
+    feature_extractor = FeatureExtractor(cfg.features.dict())
+    ml_classifier = MLClassifier()
+    llm_classifier = LLMClassifier(llm, categories, cfg.dict())
+    adaptive_classifier = AdaptiveClassifier(
+        feature_extractor,
+        ml_classifier,
+        llm_classifier,
+        categories,
+        cfg.dict()
+    )
+
+    # Fetch emails
+    logger.info(f"Fetching emails (limit: {limit})")
+    emails = provider.fetch_emails(limit=limit)
+
+    if not emails:
+        logger.error("No emails fetched")
+        sys.exit(1)
+
+    logger.info(f"Fetched {len(emails)} emails")
+
+    # Classify emails
+    logger.info("Starting classification")
+    results = []
+
+    for i, email in enumerate(emails):
+        if (i + 1) % 100 == 0:
+            logger.info(f"Progress: {i + 1}/{len(emails)}")
+
+        result = adaptive_classifier.classify(email)
+
+        # If low confidence and LLM available: use the LLM
+        if result.needs_review and llm.is_available():
+            result = adaptive_classifier.classify_with_llm(result, email)
+
+        results.append(result)
+
+    # Export results
+    logger.info("Exporting results")
+    Path(output).mkdir(parents=True, exist_ok=True)
+
+    import json
+    stats = adaptive_classifier.get_stats()
+    results_data = {
+        'metadata': {
+            'total_emails': len(emails),
+            'accuracy_estimate': stats.accuracy_estimate(),
+            'classification_stats': {
+                'rule_matched': stats.rule_matched,
+                'ml_classified': stats.ml_classified,
+                'llm_classified': stats.llm_classified,
+                'needs_review': stats.needs_review,
+            }
+        },
+        'classifications': [
+            {
+                'email_id': r.email_id,
+                'category': r.category,
+                'confidence': r.confidence,
+                'method': r.method
+            }
+            for r in results
+        ]
+    }
+
+    results_file = Path(output) / 'results.json'
+    with open(results_file, 'w') as f:
+        json.dump(results_data, f, indent=2)
+
+    logger.info(f"Results saved to: {results_file}")
+    logger.info(f"\n{stats}")
+
+    # Print summary
+    logger.info("=" * 80)
+    logger.info("Classification complete!")
+    logger.info(f"Accuracy estimate: {stats.accuracy_estimate():.1%}")
+    logger.info("=" * 80)
+
+    provider.disconnect()
+
+
+@cli.command()
+def test_config():
+    """Test configuration loading."""
+    logger = logging.getLogger(__name__)
+    setup_logging()
+
+    logger.info("Testing configuration...")
+
+    cfg = load_config()
+    logger.info(f"Config loaded: {cfg.version}")
+
+    categories = load_categories()
+    logger.info(f"Categories loaded: {len(categories)} categories")
+
+    logger.info("Configuration test passed!")
+
+
+@cli.command()
+def test_ollama():
+    """Test Ollama connection."""
+    logger = logging.getLogger(__name__)
+    setup_logging()
+
+    logger.info("Testing Ollama connection...")
+
+    from src.utils.config import load_config
+    cfg = load_config()
+
+    llm = OllamaProvider(
+        base_url=cfg.llm.ollama.base_url,
+        model=cfg.llm.ollama.classification_model
+    )
+
+    if llm.is_available():
+        logger.info("Ollama connection successful!")
+        logger.info(f"Model: {llm.model}")
+
+        # Try a simple prompt
+        logger.info("Testing inference...")
+        response = llm.complete("Classify this email: 'Your verification code is 123456'")
+        logger.info(f"Response: {response[:100]}...")
+    else:
+        logger.error("Ollama not available")
+        sys.exit(1)
+
+
+@cli.command()
+def test_gmail():
+    """Test Gmail connection."""
+    logger = logging.getLogger(__name__)
+    setup_logging()
+
+    logger.info("Testing Gmail connection...")
+
+    provider = GmailProvider()
+
+    if provider.connect({'credentials_path': 'credentials.json'}):
+        logger.info("Gmail connection successful!")
+        emails = provider.fetch_emails(limit=5)
+        logger.info(f"Fetched {len(emails)} test emails")
+        provider.disconnect()
+    else:
+        logger.error("Gmail connection failed")
+        sys.exit(1)
+
+
+if __name__ == '__main__':
+    cli()
diff --git a/src/email_providers/__init__.py b/src/email_providers/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/src/email_providers/base.py b/src/email_providers/base.py
new file mode 100644
index 0000000..0ff9406
--- /dev/null
+++ b/src/email_providers/base.py
@@ -0,0 +1,205 @@
+"""Base email provider interface and data models."""
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from datetime import datetime
+from typing import List, Dict, Any, Optional
+import logging
+
+logger = logging.getLogger(__name__)
+
+
+@dataclass
+class Attachment:
+    """Email attachment metadata."""
+    filename: str
+    mime_type: str
+    size: int  # in bytes
+    attachment_id: Optional[str] = None
+
+    def __repr__(self) -> str:
+        return f"Attachment({self.filename}, {self.mime_type}, {self.size}B)"
+
+
+@dataclass
+class Email:
+    """Unified email data model."""
+    id: str
+    subject: str
+    sender: str
+    sender_name: Optional[str] = None
+    date: Optional[datetime] = None
+    body: str = ""
+    body_snippet: str = ""
+    has_attachments: bool = False
+    attachments: List[Attachment] = field(default_factory=list)
+    headers: Dict[str, str] = field(default_factory=dict)
+    labels: List[str] = field(default_factory=list)
+    is_read: bool = False
+    provider: str = "unknown"  # gmail, imap, microsoft, etc.
+
+    def __post_init__(self):
+        """Generate body_snippet if not provided."""
+        if not self.body_snippet and self.body:
+            self.body_snippet = self.body[:500]
+
+    def __repr__(self) -> str:
+        return f"Email(id={self.id}, from={self.sender}, subject={self.subject[:50]})"
+
+    @property
+    def attachment_types(self) -> List[str]:
+        """Get list of attachment types."""
+        return [a.mime_type.split('/')[-1] for a in self.attachments]
+
+    @property
+    def attachment_count(self) -> int:
+        """Get count of attachments."""
+        return len(self.attachments)
+
+
+@dataclass
+class ClassificationResult:
+    """Result from email classification."""
+    email_id: str
+    category: str
+    confidence: float
+    method: str  # 'rule', 'ml', 'llm'
+    probabilities: Dict[str, float] = field(default_factory=dict)
+    needs_review: bool = False
+    metadata: Dict[str, Any] = field(default_factory=dict)
+    error: Optional[str] = None
+
+    def __repr__(self) -> str:
+        return f"ClassificationResult(id={self.email_id}, category={self.category}, conf={self.confidence:.2f})"
+
+
+class BaseProvider(ABC):
+    """Abstract base class for email providers."""
+
+    def __init__(self, name: str = "base"):
+        """Initialize provider."""
+        self.name = name
+        self.logger = logging.getLogger(f"{__name__}.{self.__class__.__name__}")
+
+    @abstractmethod
+    def connect(self, credentials: Dict[str, Any]) -> bool:
+        """Establish connection to the email provider.
+
+        Args:
+            credentials: Provider-specific credentials
+
+        Returns:
+            True if connected, False otherwise
+        """
+        pass
+
+    @abstractmethod
+    def disconnect(self) -> bool:
+        """Close connection."""
+        pass
+
+    @abstractmethod
+    def fetch_emails(
+        self,
+        limit: Optional[int] = None,
+        filters: Optional[Dict[str, Any]] = None
+    ) -> List[Email]:
+        """Fetch emails from the provider.
+
+        Args:
+            limit: Maximum number of emails to fetch
+            filters: Provider-specific filters
+
+        Returns:
+            List of Email objects
+        """
+        pass
+
+    @abstractmethod
+    def update_labels(self, email_id: str, labels: List[str]) -> bool:
+        """Update email labels/folders.
+
+        Args:
+            email_id: Email identifier
+            labels: List of labels to set
+
+        Returns:
+            True if successful
+        """
+        pass
+
+    @abstractmethod
+    def batch_update(self, updates: List[Dict[str, Any]]) -> bool:
+        """Batch update multiple emails.
+
+        Args:
+            updates: List of update dictionaries with email_id and labels
+
+        Returns:
+            True if successful
+        """
+        pass
+
+    def is_connected(self) -> bool:
+        """Check if provider is connected."""
+        raise NotImplementedError
+
+
+class MockProvider(BaseProvider):
+    """
+    Mock email provider for testing.
+
+    IMPORTANT: This is a MOCK implementation for testing only.
+    It does not connect to any real email service.
+    All emails returned are synthetic/test data.
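+
+    Example:
+
+        >>> provider = MockProvider()
+        >>> provider.connect({})
+        True
+        >>> provider.add_mock_email(Email(id='1', subject='Hi', sender='a@b.com'))
+        >>> len(provider.fetch_emails())
+        1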
+    """
+
+    def __init__(self):
+        """Initialize mock provider."""
+        super().__init__(name="mock")
+        self.connected = False
+        self.mock_emails: List[Email] = []
+        self.logger.warning("Using MOCK email provider - no real emails will be fetched")
+
+    def connect(self, credentials: Dict[str, Any]) -> bool:
+        """Mock connection."""
+        self.logger.info("Mock provider: simulated connection")
+        self.connected = True
+        return True
+
+    def disconnect(self) -> bool:
+        """Mock disconnection."""
+        self.logger.info("Mock provider: simulated disconnection")
+        self.connected = False
+        return True
+
+    def fetch_emails(
+        self,
+        limit: Optional[int] = None,
+        filters: Optional[Dict[str, Any]] = None
+    ) -> List[Email]:
+        """Return mock emails."""
+        if not self.connected:
+            self.logger.warning("Mock provider: not connected, returning empty list")
+            return []
+
+        result = self.mock_emails[:limit] if limit else self.mock_emails
+        self.logger.info(f"Mock provider: returning {len(result)} mock emails")
+        return result
+
+    def update_labels(self, email_id: str, labels: List[str]) -> bool:
+        """Mock label update."""
+        self.logger.debug(f"Mock provider: label update for {email_id}")
+        return True
+
+    def batch_update(self, updates: List[Dict[str, Any]]) -> bool:
+        """Mock batch update."""
+        self.logger.info(f"Mock provider: batch update for {len(updates)} emails")
+        return True
+
+    def is_connected(self) -> bool:
+        """Check mock connection."""
+        return self.connected
+
+    def add_mock_email(self, email: Email) -> None:
+        """Add a mock email for testing."""
+        self.mock_emails.append(email)
diff --git a/src/email_providers/gmail.py b/src/email_providers/gmail.py
new file mode 100644
index 0000000..a99f141
--- /dev/null
+++ b/src/email_providers/gmail.py
@@ -0,0 +1,276 @@
+"""Gmail API provider implementation.
+
+IMPORTANT: This is a STUB implementation.
+- Requires valid Gmail OAuth credentials
+- The credentials file should be provided in config or via the command line
+- When credentials are not available, this provider raises clear errors
+- A mock provider is available for testing without credentials
+"""
+import base64
+import logging
+from typing import List, Dict, Optional, Any
+from datetime import datetime
+from email.utils import parsedate_to_datetime
+
+from .base import BaseProvider, Email, Attachment
+
+logger = logging.getLogger(__name__)
+
+
+class GmailProvider(BaseProvider):
+    """
+    Gmail API email provider.
+
+    STUB STATUS: Requires Gmail OAuth credentials setup
+    - Credentials file: credentials.json
+    - Scopes: gmail.readonly, gmail.modify
+    - When credentials are missing: fails gracefully with a clear error
+    """
+
+    def __init__(self):
+        """Initialize Gmail provider."""
+        super().__init__(name="gmail")
+        self.service = None
+        self.user_id = 'me'
+        self._credentials_configured = False
+
+    def connect(self, credentials: Dict[str, Any]) -> bool:
+        """
+        Connect to the Gmail API using OAuth credentials.
+
+        STUB: This requires credentials setup. When unavailable:
+        - Returns False
+        - Logs a clear error message
+        - Does not attempt a connection
+        """
+        try:
+            credentials_path = credentials.get('credentials_path')
+            if not credentials_path:
+                logger.error(
+                    "GMAIL OAUTH NOT CONFIGURED: "
+                    "credentials_path required in config. "
+                    "Set up Gmail OAuth at: "
+                    "https://developers.google.com/gmail/api/quickstart/python"
+                )
+                return False
+
+            # Try import - fails if google-auth is not installed properly
+            try:
+                from google.oauth2.credentials import Credentials
+                from google_auth_oauthlib.flow import InstalledAppFlow
+                from googleapiclient.discovery import build
+            except ImportError as e:
+                logger.error(f"GMAIL DEPENDENCIES MISSING: {e}")
+                logger.error("Install with: pip install google-api-python-client google-auth-oauthlib")
+                return False
+
+            # Try connection - fails if the credentials file is invalid
+            logger.info(f"Attempting Gmail OAuth with credentials from: {credentials_path}")
+
+            SCOPES = [
+                'https://www.googleapis.com/auth/gmail.readonly',
+                'https://www.googleapis.com/auth/gmail.modify'
+            ]
+
+            try:
+                flow = InstalledAppFlow.from_client_secrets_file(
+                    credentials_path, SCOPES
+                )
+                creds = flow.run_local_server(port=0)
+                self.service = build('gmail', 'v1', credentials=creds)
+                self._credentials_configured = True
+                logger.info("Successfully connected to Gmail API")
+                return True
+
+            except FileNotFoundError:
+                logger.error(f"CREDENTIALS FILE NOT FOUND: {credentials_path}")
+                logger.error("Set up Gmail OAuth and download credentials.json")
+                return False
+
+        except Exception as e:
+            logger.error(f"GMAIL CONNECTION FAILED: {e}")
+            return False
+
+    def disconnect(self) -> bool:
+        """Close Gmail connection."""
+        self.service = None
+        self._credentials_configured = False
+        logger.info("Disconnected from Gmail")
+        return True
+
+    def fetch_emails(
+        self,
+        limit: Optional[int] = None,
+        filters: Optional[Dict[str, Any]] = None
+    ) -> List[Email]:
+        """
+        Fetch emails from Gmail.
+
+        STUB: Returns an empty list if not connected
+        """
+        if not self._credentials_configured or not self.service:
+            logger.error("GMAIL NOT CONFIGURED: Cannot fetch emails without OAuth setup")
+            return []
+
+        emails = []
+        try:
+            query = filters.get('query', '') if filters else ''
+
+            results = self.service.users().messages().list(
+                userId=self.user_id,
+                q=query,
+                maxResults=min(limit, 500) if limit else 500
+            ).execute()
+
+            messages = results.get('messages', [])
+
+            for msg_info in messages:
+                email = self._fetch_message(msg_info['id'])
+                if email:
+                    emails.append(email)
+                if limit and len(emails) >= limit:
+                    break
+
+            logger.info(f"Fetched {len(emails)} emails from Gmail")
+            return emails
+
+        except Exception as e:
+            logger.error(f"GMAIL FETCH ERROR: {e}")
+            return emails
+
+    def _fetch_message(self, msg_id: str) -> Optional[Email]:
+        """Fetch and parse a single message."""
+        try:
+            msg = self.service.users().messages().get(
+                userId=self.user_id,
+                id=msg_id,
+                format='full'
+            ).execute()
+            return self._parse_message(msg)
+        except Exception as e:
+            logger.error(f"Error fetching message {msg_id}: {e}")
+            return None
+
+    def _parse_message(self, msg: Dict) -> Email:
+        """Parse a Gmail message into an Email object."""
+        headers = {h['name']: h['value'] for h in msg['payload'].get('headers', [])}
+
+        body = self._get_body(msg['payload'])
+        date = self._parse_date(headers.get('Date'))
+
+        # Check attachments
+        attachments = self._parse_attachments(msg['payload'])
+
+        return Email(
+            id=msg['id'],
+            subject=headers.get('Subject', 'No Subject'),
+            sender=headers.get('From', ''),
+            date=date,
+            body=body,
+            has_attachments=len(attachments) > 0,
+            attachments=attachments,
+            headers=headers,
+            labels=msg.get('labelIds', []),
+            is_read='UNREAD' not in msg.get('labelIds', []),
+            provider='gmail'
+        )
+
+    def _get_body(self, payload: Dict) -> str:
+        """Extract the email body from the payload."""
+        body = ""
+
+        if 'body' in payload and 'data' in payload['body']:
+            try:
+                body = base64.urlsafe_b64decode(payload['body']['data']).decode('utf-8', errors='ignore')
+            except Exception as e:
+                logger.debug(f"Error decoding body: {e}")
+
+        elif 'parts' in payload:
+            for part in payload['parts']:
+                if part.get('mimeType') == 'text/plain' and 'data' in part.get('body', {}):
+                    try:
+                        body = base64.urlsafe_b64decode(part['body']['data']).decode('utf-8', errors='ignore')
+                        break
+                    except Exception as e:
+                        logger.debug(f"Error decoding part: {e}")
+
+        return body
+
+    def _parse_date(self, date_str: Optional[str]) -> Optional[datetime]:
+        """Parse the email date."""
+        if not date_str:
+            return None
+        try:
+            return parsedate_to_datetime(date_str)
+        except Exception:
+            return None
+
+    def _parse_attachments(self, payload: Dict) -> List[Attachment]:
+        """Extract attachment metadata."""
+        attachments = []
+
+        if 'parts' not in payload:
+            return attachments
+
+        for part in payload['parts']:
+            if part.get('filename'):
+                attachments.append(Attachment(
+                    filename=part['filename'],
+                    mime_type=part.get('mimeType', 'application/octet-stream'),
+                    size=part.get('body', {}).get('size', 0),
+                    attachment_id=part.get('body', {}).get('attachmentId')
+                ))
+
+        return attachments
+
+    def update_labels(self, email_id: str, labels: List[str]) -> bool:
+        """Update labels for a single email."""
+        if not self._credentials_configured or not self.service:
+            logger.error("GMAIL NOT CONFIGURED: Cannot update labels")
+            return False
+
+        try:
+            self.service.users().messages().modify(
+                userId=self.user_id,
+                id=email_id,
+                body={'addLabelIds': labels}
+            ).execute()
+            return True
+        except Exception as e:
+            logger.error(f"Error updating labels: {e}")
+            return False
+
+    def batch_update(self, updates: List[Dict[str, Any]]) -> bool:
+        """Batch update multiple emails."""
+        if not self._credentials_configured or not self.service:
+            logger.error("GMAIL NOT CONFIGURED: Cannot batch update")
+            return False
+
+        try:
+            batch_size = 100
+            successful = 0
+
+            for i in range(0, len(updates), batch_size):
+                batch = updates[i:i + batch_size]
+                email_ids = [u['email_id'] for u in batch]
+                labels = list(set([l for u in batch for l in u.get('labels', [])]))
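+                # NOTE: addLabelIds is the union across this slice, so every
+                # email in the batch receives the combined label set.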
+
+                self.service.users().messages().batchModify(
+                    userId=self.user_id,
+                    body={
+                        'ids': email_ids,
+                        'addLabelIds': labels
+                    }
+                ).execute()
+                successful += len(batch)
+
+            logger.info(f"Batch updated {successful} emails")
+            return True
+
+        except Exception as e:
+            logger.error(f"Batch update error: {e}")
+            return False
+
+    def is_connected(self) -> bool:
+        """Check if connected."""
+        return self._credentials_configured and self.service is not None
diff --git a/src/email_providers/imap.py b/src/email_providers/imap.py
new file mode 100644
index 0000000..68dd850
--- /dev/null
+++ b/src/email_providers/imap.py
@@ -0,0 +1,274 @@
+"""IMAP email provider implementation.
+
+STUB STATUS: Requires IMAP server credentials
+- Supports any IMAP server (Gmail, Outlook, custom, etc.)
+- Credentials: host, username, password, port
+- When credentials are missing: the provider fails gracefully
+"""
+import logging
+import email
+from typing import List, Dict, Optional, Any
+from datetime import datetime
+from email.utils import parsedate_to_datetime
+
+from .base import BaseProvider, Email, Attachment
+
+logger = logging.getLogger(__name__)
+
+
+class IMAPProvider(BaseProvider):
+    """
+    IMAP email provider for generic IMAP servers.
+
+    STUB STATUS: Requires IMAP server configuration
+    - Works with Gmail, Outlook, or any IMAP server
+    - Credentials required: host, username, password, port (optional)
+    - When credentials are missing: returns a clear error
+    """
+
+    def __init__(self):
+        """Initialize IMAP provider."""
+        super().__init__(name="imap")
+        self.client = None
+        self._credentials_configured = False
+        self.host = None
+        self.username = None
+
+    def connect(self, credentials: Dict[str, Any]) -> bool:
+        """
+        Connect to the IMAP server.
+
+        STUB: Requires credentials. When unavailable:
+        - Returns False with a clear error
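+
+        Expected credentials shape (sketch):
+            {'host': 'imap.example.com', 'username': 'user',
+             'password': '...', 'port': 993}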
+ # Setup classifiers + logger.info("Setting up classifiers") + feature_extractor = FeatureExtractor(cfg.features.dict()) + ml_classifier = MLClassifier() + llm_classifier = LLMClassifier(llm, categories, cfg.dict()) + adaptive_classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + llm_classifier, + categories, + cfg.dict() + ) + + # Fetch emails + logger.info(f"Fetching emails (limit: {limit})") + emails = provider.fetch_emails(limit=limit) + + if not emails: + logger.error("No emails fetched") + sys.exit(1) + + logger.info(f"Fetched {len(emails)} emails") + + # Classify emails + logger.info("Starting classification") + results = [] + + for i, email in enumerate(emails): + if (i + 1) % 100 == 0: + logger.info(f"Progress: {i+1}/{len(emails)}") + + result = adaptive_classifier.classify(email) + + # If low confidence and LLM available: Use LLM + if result.needs_review and llm.is_available(): + result = adaptive_classifier.classify_with_llm(result, email) + + results.append(result) + + # Export results + logger.info("Exporting results") + Path(output).mkdir(parents=True, exist_ok=True) + + import json + results_data = { + 'metadata': { + 'total_emails': len(emails), + 'accuracy_estimate': adaptive_classifier.get_stats().accuracy_estimate(), + 'classification_stats': { + 'rule_matched': adaptive_classifier.get_stats().rule_matched, + 'ml_classified': adaptive_classifier.get_stats().ml_classified, + 'llm_classified': adaptive_classifier.get_stats().llm_classified, + 'needs_review': adaptive_classifier.get_stats().needs_review, + } + }, + 'classifications': [ + { + 'email_id': r.email_id, + 'category': r.category, + 'confidence': r.confidence, + 'method': r.method + } + for r in results + ] + } + + results_file = Path(output) / 'results.json' + with open(results_file, 'w') as f: + json.dump(results_data, f, indent=2) + + logger.info(f"Results saved to: {results_file}") + logger.info(f"\n{adaptive_classifier.get_stats()}") + + # Print summary + logger.info("=" * 80) + logger.info(f"Classification complete!") + logger.info(f"Accuracy estimate: {adaptive_classifier.get_stats().accuracy_estimate():.1%}") + logger.info("=" * 80) + + provider.disconnect() + + +@cli.command() +def test_config(): + """Test configuration loading.""" + logger = logging.getLogger(__name__) + setup_logging() + + logger.info("Testing configuration...") + + cfg = load_config() + logger.info(f"Config loaded: {cfg.version}") + + categories = load_categories() + logger.info(f"Categories loaded: {len(categories)} categories") + + logger.info("Configuration test passed!") + + +@cli.command() +def test_ollama(): + """Test Ollama connection.""" + logger = logging.getLogger(__name__) + setup_logging() + + logger.info("Testing Ollama connection...") + + from src.utils.config import load_config + cfg = load_config() + + llm = OllamaProvider( + base_url=cfg.llm.ollama.base_url, + model=cfg.llm.ollama.classification_model + ) + + if llm.is_available(): + logger.info("Ollama connection successful!") + logger.info(f"Model: {llm.model}") + + # Try a simple prompt + logger.info("Testing inference...") + response = llm.complete("Classify this email: 'Your verification code is 123456'") + logger.info(f"Response: {response[:100]}...") + else: + logger.error("Ollama not available") + sys.exit(1) + + +@cli.command() +def test_gmail(): + """Test Gmail connection.""" + logger = logging.getLogger(__name__) + setup_logging() + + logger.info("Testing Gmail connection...") + + provider = GmailProvider() + + if 
provider.connect({'credentials_path': 'credentials.json'}): + logger.info("Gmail connection successful!") + emails = provider.fetch_emails(limit=5) + logger.info(f"Fetched {len(emails)} test emails") + provider.disconnect() + else: + logger.error("Gmail connection failed") + sys.exit(1) + + +if __name__ == '__main__': + cli() diff --git a/src/email_providers/__init__.py b/src/email_providers/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/email_providers/base.py b/src/email_providers/base.py new file mode 100644 index 0000000..0ff9406 --- /dev/null +++ b/src/email_providers/base.py @@ -0,0 +1,205 @@ +"""Base email provider interface and data models.""" +from abc import ABC, abstractmethod +from dataclasses import dataclass, field +from datetime import datetime +from typing import List, Dict, Any, Optional +import logging + +logger = logging.getLogger(__name__) + + +@dataclass +class Attachment: + """Email attachment metadata.""" + filename: str + mime_type: str + size: int # in bytes + attachment_id: Optional[str] = None + + def __repr__(self) -> str: + return f"Attachment({self.filename}, {self.mime_type}, {self.size}B)" + + +@dataclass +class Email: + """Unified email data model.""" + id: str + subject: str + sender: str + sender_name: Optional[str] = None + date: Optional[datetime] = None + body: str = "" + body_snippet: str = "" + has_attachments: bool = False + attachments: List[Attachment] = field(default_factory=list) + headers: Dict[str, str] = field(default_factory=dict) + labels: List[str] = field(default_factory=list) + is_read: bool = False + provider: str = "unknown" # gmail, imap, microsoft, etc. + + def __post_init__(self): + """Generate body_snippet if not provided.""" + if not self.body_snippet and self.body: + self.body_snippet = self.body[:500] + + def __repr__(self) -> str: + return f"Email(id={self.id}, from={self.sender}, subject={self.subject[:50]})" + + @property + def attachment_types(self) -> List[str]: + """Get list of attachment types.""" + return [a.mime_type.split('/')[-1] for a in self.attachments] + + @property + def attachment_count(self) -> int: + """Get count of attachments.""" + return len(self.attachments) + + +@dataclass +class ClassificationResult: + """Result from email classification.""" + email_id: str + category: str + confidence: float + method: str # 'rule', 'ml', 'llm' + probabilities: Dict[str, float] = field(default_factory=dict) + needs_review: bool = False + metadata: Dict[str, Any] = field(default_factory=dict) + error: Optional[str] = None + + def __repr__(self) -> str: + return f"ClassificationResult(id={self.email_id}, category={self.category}, conf={self.confidence:.2f})" + + +class BaseProvider(ABC): + """Abstract base class for email providers.""" + + def __init__(self, name: str = "base"): + """Initialize provider.""" + self.name = name + self.logger = logging.getLogger(f"{__name__}.{self.__class__.__name__}") + + @abstractmethod + def connect(self, credentials: Dict[str, Any]) -> bool: + """Establish connection to email provider. + + Args: + credentials: Provider-specific credentials + + Returns: + True if connected, False otherwise + """ + pass + + @abstractmethod + def disconnect(self) -> bool: + """Close connection.""" + pass + + @abstractmethod + def fetch_emails( + self, + limit: Optional[int] = None, + filters: Optional[Dict[str, Any]] = None + ) -> List[Email]: + """Fetch emails from provider. 
+ + Args: + limit: Maximum number of emails to fetch + filters: Provider-specific filters + + Returns: + List of Email objects + """ + pass + + @abstractmethod + def update_labels(self, email_id: str, labels: List[str]) -> bool: + """Update email labels/folders. + + Args: + email_id: Email identifier + labels: List of labels to set + + Returns: + True if successful + """ + pass + + @abstractmethod + def batch_update(self, updates: List[Dict[str, Any]]) -> bool: + """Batch update multiple emails. + + Args: + updates: List of update dictionaries with email_id and labels + + Returns: + True if successful + """ + pass + + def is_connected(self) -> bool: + """Check if provider is connected.""" + raise NotImplementedError + + +class MockProvider(BaseProvider): + """ + Mock email provider for testing. + + IMPORTANT: This is a MOCK implementation for testing only. + It does not connect to any real email service. + All emails returned are synthetic/test data. + """ + + def __init__(self): + """Initialize mock provider.""" + super().__init__(name="mock") + self.connected = False + self.mock_emails: List[Email] = [] + self.logger.warning("Using MOCK email provider - no real emails will be fetched") + + def connect(self, credentials: Dict[str, Any]) -> bool: + """Mock connection.""" + self.logger.info("Mock provider: simulated connection") + self.connected = True + return True + + def disconnect(self) -> bool: + """Mock disconnection.""" + self.logger.info("Mock provider: simulated disconnection") + self.connected = False + return True + + def fetch_emails( + self, + limit: Optional[int] = None, + filters: Optional[Dict[str, Any]] = None + ) -> List[Email]: + """Return mock emails.""" + if not self.connected: + self.logger.warning("Mock provider: not connected, returning empty list") + return [] + + result = self.mock_emails[:limit] if limit else self.mock_emails + self.logger.info(f"Mock provider: returning {len(result)} mock emails") + return result + + def update_labels(self, email_id: str, labels: List[str]) -> bool: + """Mock label update.""" + self.logger.debug(f"Mock provider: label update for {email_id}") + return True + + def batch_update(self, updates: List[Dict[str, Any]]) -> bool: + """Mock batch update.""" + self.logger.info(f"Mock provider: batch update for {len(updates)} emails") + return True + + def is_connected(self) -> bool: + """Check mock connection.""" + return self.connected + + def add_mock_email(self, email: Email) -> None: + """Add a mock email for testing.""" + self.mock_emails.append(email) diff --git a/src/email_providers/gmail.py b/src/email_providers/gmail.py new file mode 100644 index 0000000..a99f141 --- /dev/null +++ b/src/email_providers/gmail.py @@ -0,0 +1,276 @@ +"""Gmail API provider implementation. + +IMPORTANT: This is a STUB implementation. +- Requires valid Gmail OAuth credentials +- Credentials file should be provided in config or via command line +- When credentials are not available, this provider will raise clear errors +- Mock provider is available for testing without credentials +""" +import base64 +import logging +from typing import List, Dict, Optional, Any +from datetime import datetime +from email.utils import parsedate_to_datetime + +from .base import BaseProvider, Email, Attachment + +logger = logging.getLogger(__name__) + + +class GmailProvider(BaseProvider): + """ + Gmail API email provider. 
+ + STUB STATUS: Requires Gmail OAuth credentials setup + - Credentials file: credentials.json + - Scopes: gmail.readonly, gmail.modify + - When credentials missing: Provider will fail gracefully with clear error + """ + + def __init__(self): + """Initialize Gmail provider.""" + super().__init__(name="gmail") + self.service = None + self.user_id = 'me' + self._credentials_configured = False + + def connect(self, credentials: Dict[str, Any]) -> bool: + """ + Connect to Gmail API using OAuth credentials. + + STUB: This requires credentials setup. When unavailable: + - Returns False + - Logs clear error message + - Does not attempt connection + """ + try: + credentials_path = credentials.get('credentials_path') + if not credentials_path: + logger.error( + "GMAIL OAUTH NOT CONFIGURED: " + "credentials_path required in config. " + "Set up Gmail OAuth at: " + "https://developers.google.com/gmail/api/quickstart/python" + ) + return False + + # TRY IMPORT - will fail if google-auth not installed properly + try: + from google.oauth2.credentials import Credentials + from google_auth_oauthlib.flow import InstalledAppFlow + from googleapiclient.discovery import build + except ImportError as e: + logger.error(f"GMAIL DEPENDENCIES MISSING: {e}") + logger.error("Install with: pip install google-api-python-client google-auth-oauthlib") + return False + + # TRY CONNECTION - will fail if credentials file invalid + logger.info(f"Attempting Gmail OAuth with credentials from: {credentials_path}") + + SCOPES = [ + 'https://www.googleapis.com/auth/gmail.readonly', + 'https://www.googleapis.com/auth/gmail.modify' + ] + + try: + flow = InstalledAppFlow.from_client_secrets_file( + credentials_path, SCOPES + ) + creds = flow.run_local_server(port=0) + self.service = build('gmail', 'v1', credentials=creds) + self._credentials_configured = True + logger.info("Successfully connected to Gmail API") + return True + + except FileNotFoundError: + logger.error(f"CREDENTIALS FILE NOT FOUND: {credentials_path}") + logger.error("Set up Gmail OAuth and download credentials.json") + return False + + except Exception as e: + logger.error(f"GMAIL CONNECTION FAILED: {e}") + return False + + def disconnect(self) -> bool: + """Close Gmail connection.""" + self.service = None + self._credentials_configured = False + logger.info("Disconnected from Gmail") + return True + + def fetch_emails( + self, + limit: Optional[int] = None, + filters: Optional[Dict[str, Any]] = None + ) -> List[Email]: + """ + Fetch emails from Gmail. 
+ + STUB: Returns empty list if not connected + """ + if not self._credentials_configured or not self.service: + logger.error("GMAIL NOT CONFIGURED: Cannot fetch emails without OAuth setup") + return [] + + emails = [] + try: + query = filters.get('query', '') if filters else '' + + results = self.service.users().messages().list( + userId=self.user_id, + q=query, + maxResults=min(limit or 500, 500) if limit else 500 + ).execute() + + messages = results.get('messages', []) + + for msg_info in messages: + email = self._fetch_message(msg_info['id']) + if email: + emails.append(email) + if limit and len(emails) >= limit: + break + + logger.info(f"Fetched {len(emails)} emails from Gmail") + return emails + + except Exception as e: + logger.error(f"GMAIL FETCH ERROR: {e}") + return emails + + def _fetch_message(self, msg_id: str) -> Optional[Email]: + """Fetch and parse a single message.""" + try: + msg = self.service.users().messages().get( + userId=self.user_id, + id=msg_id, + format='full' + ).execute() + return self._parse_message(msg) + except Exception as e: + logger.error(f"Error fetching message {msg_id}: {e}") + return None + + def _parse_message(self, msg: Dict) -> Email: + """Parse Gmail message into Email object.""" + headers = {h['name']: h['value'] for h in msg['payload'].get('headers', [])} + + body = self._get_body(msg['payload']) + date = self._parse_date(headers.get('Date')) + + # Check attachments + attachments = self._parse_attachments(msg['payload']) + + return Email( + id=msg['id'], + subject=headers.get('Subject', 'No Subject'), + sender=headers.get('From', ''), + date=date, + body=body, + has_attachments=len(attachments) > 0, + attachments=attachments, + headers=headers, + labels=msg.get('labelIds', []), + is_read='UNREAD' not in msg.get('labelIds', []), + provider='gmail' + ) + + def _get_body(self, payload: Dict) -> str: + """Extract email body from payload.""" + body = "" + + if 'body' in payload and 'data' in payload['body']: + try: + body = base64.urlsafe_b64decode(payload['body']['data']).decode('utf-8', errors='ignore') + except Exception as e: + logger.debug(f"Error decoding body: {e}") + + elif 'parts' in payload: + for part in payload['parts']: + if part.get('mimeType') == 'text/plain' and 'data' in part.get('body', {}): + try: + body = base64.urlsafe_b64decode(part['body']['data']).decode('utf-8', errors='ignore') + break + except Exception as e: + logger.debug(f"Error decoding part: {e}") + + return body + + def _parse_date(self, date_str: Optional[str]) -> Optional[datetime]: + """Parse email date.""" + if not date_str: + return None + try: + return parsedate_to_datetime(date_str) + except Exception: + return None + + def _parse_attachments(self, payload: Dict) -> List[Attachment]: + """Extract attachment metadata.""" + attachments = [] + + if 'parts' not in payload: + return attachments + + for part in payload['parts']: + if part.get('filename'): + attachments.append(Attachment( + filename=part['filename'], + mime_type=part.get('mimeType', 'application/octet-stream'), + size=part.get('body', {}).get('size', 0), + attachment_id=part.get('body', {}).get('attachmentId') + )) + + return attachments + + def update_labels(self, email_id: str, labels: List[str]) -> bool: + """Update labels for a single email.""" + if not self._credentials_configured or not self.service: + logger.error("GMAIL NOT CONFIGURED: Cannot update labels") + return False + + try: + self.service.users().messages().modify( + userId=self.user_id, + id=email_id, + body={'addLabelIds': labels} + 
).execute() + return True + except Exception as e: + logger.error(f"Error updating labels: {e}") + return False + + def batch_update(self, updates: List[Dict[str, Any]]) -> bool: + """Batch update multiple emails.""" + if not self._credentials_configured or not self.service: + logger.error("GMAIL NOT CONFIGURED: Cannot batch update") + return False + + try: + batch_size = 100 + successful = 0 + + for i in range(0, len(updates), batch_size): + batch = updates[i:i+batch_size] + email_ids = [u['email_id'] for u in batch] + labels = list(set([l for u in batch for l in u.get('labels', [])])) + + self.service.users().messages().batchModify( + userId=self.user_id, + body={ + 'ids': email_ids, + 'addLabelIds': labels + } + ).execute() + successful += len(batch) + + logger.info(f"Batch updated {successful} emails") + return True + + except Exception as e: + logger.error(f"Batch update error: {e}") + return False + + def is_connected(self) -> bool: + """Check if connected.""" + return self._credentials_configured and self.service is not None diff --git a/src/email_providers/imap.py b/src/email_providers/imap.py new file mode 100644 index 0000000..68dd850 --- /dev/null +++ b/src/email_providers/imap.py @@ -0,0 +1,274 @@ +"""IMAP email provider implementation. + +STUB STATUS: Requires IMAP server credentials +- Supports any IMAP server (Gmail, Outlook, custom, etc.) +- Credentials: host, username, password, port +- When credentials missing: Provider will fail gracefully +""" +import logging +import email +from typing import List, Dict, Optional, Any +from datetime import datetime +from email.utils import parsedate_to_datetime + +from .base import BaseProvider, Email, Attachment + +logger = logging.getLogger(__name__) + + +class IMAPProvider(BaseProvider): + """ + IMAP email provider for generic IMAP servers. + + STUB STATUS: Requires IMAP server configuration + - Can use with Gmail, Outlook, or any IMAP server + - Credentials required: host, username, password, port (optional) + - When credentials missing: Returns clear error + """ + + def __init__(self): + """Initialize IMAP provider.""" + super().__init__(name="imap") + self.client = None + self._credentials_configured = False + self.host = None + self.username = None + + def connect(self, credentials: Dict[str, Any]) -> bool: + """ + Connect to IMAP server. + + STUB: Requires credentials. 
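+        Expected keys: host, username, password, and optional port
+        (defaults to 993, IMAP over SSL).
+
+        Example credentials dict (values are placeholders):
+            {'host': 'imap.example.com',
+             'username': 'user@example.com',
+             'password': 'app-password'}
+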
When unavailable: + - Returns False with clear error + """ + try: + self.host = credentials.get('host') + self.username = credentials.get('username') + password = credentials.get('password') + port = credentials.get('port', 993) + + if not all([self.host, self.username, password]): + logger.error( + "IMAP NOT CONFIGURED: " + "Required: host, username, password" + ) + return False + + try: + import imapclient + except ImportError: + logger.error("IMAP DEPENDENCIES MISSING: pip install imapclient") + return False + + logger.info(f"Attempting IMAP connection to {self.host}") + + try: + self.client = imapclient.IMAPClient(self.host, port=port, use_uid=True) + self.client.login(self.username, password) + self._credentials_configured = True + logger.info(f"Successfully connected to IMAP server: {self.host}") + return True + + except Exception as e: + logger.error(f"IMAP LOGIN FAILED: {e}") + logger.error("Check credentials and IMAP server configuration") + return False + + except Exception as e: + logger.error(f"IMAP CONNECTION ERROR: {e}") + return False + + def disconnect(self) -> bool: + """Close IMAP connection.""" + if self.client: + try: + self.client.logout() + except Exception as e: + logger.warning(f"Error during logout: {e}") + self.client = None + self._credentials_configured = False + logger.info("Disconnected from IMAP server") + return True + + def fetch_emails( + self, + limit: Optional[int] = None, + filters: Optional[Dict[str, Any]] = None + ) -> List[Email]: + """ + Fetch emails from IMAP server. + + STUB: Returns empty if not connected + """ + if not self._credentials_configured or not self.client: + logger.error("IMAP NOT CONFIGURED: Cannot fetch emails") + return [] + + emails = [] + try: + # Select INBOX + self.client.select_folder('INBOX') + + # Search for messages + search_criteria = filters.get('search_criteria', 'ALL') if filters else 'ALL' + msg_ids = self.client.search(search_criteria) + + # Limit results + if limit: + msg_ids = msg_ids[:limit] + + logger.info(f"Found {len(msg_ids)} messages in IMAP, fetching...") + + # Fetch messages + response = self.client.fetch(msg_ids, ['RFC822']) + + for msg_id, msg_data in response.items(): + try: + email_msg = email.message_from_bytes(msg_data[b'RFC822']) + parsed_email = self._parse_message(email_msg, msg_id) + if parsed_email: + emails.append(parsed_email) + except Exception as e: + logger.debug(f"Error parsing message {msg_id}: {e}") + + logger.info(f"Fetched {len(emails)} emails from IMAP") + return emails + + except Exception as e: + logger.error(f"IMAP FETCH ERROR: {e}") + return emails + + def _parse_message(self, msg: email.message.Message, msg_id: int) -> Optional[Email]: + """Parse email.message.Message into Email object.""" + try: + subject = msg.get('subject', 'No Subject') + sender = msg.get('from', '') + date_str = msg.get('date') + body = self._get_body(msg) + + # Parse date + date = None + if date_str: + try: + date = parsedate_to_datetime(date_str) + except Exception: + pass + + # Get attachments + attachments = self._parse_attachments(msg) + + return Email( + id=str(msg_id), + subject=subject, + sender=sender, + date=date, + body=body, + has_attachments=len(attachments) > 0, + attachments=attachments, + headers=dict(msg.items()), + provider='imap' + ) + + except Exception as e: + logger.debug(f"Error parsing message: {e}") + return None + + def _get_body(self, msg: email.message.Message) -> str: + """Extract email body.""" + body = "" + + # Try text/plain first + if msg.is_multipart(): + for part in 
msg.walk(): + if part.get_content_type() == 'text/plain': + try: + body = part.get_payload(decode=True).decode('utf-8', errors='ignore') + break + except Exception: + pass + else: + try: + body = msg.get_payload(decode=True).decode('utf-8', errors='ignore') + except Exception: + body = msg.get_payload(decode=False) + + return body if isinstance(body, str) else str(body) + + def _parse_attachments(self, msg: email.message.Message) -> List[Attachment]: + """Extract attachment metadata.""" + attachments = [] + + if not msg.is_multipart(): + return attachments + + for part in msg.iter_attachments(): + filename = part.get_filename() + if filename: + try: + payload = part.get_payload(decode=True) + size = len(payload) if payload else 0 + except Exception: + size = 0 + + attachments.append(Attachment( + filename=filename, + mime_type=part.get_content_type(), + size=size + )) + + return attachments + + def update_labels(self, email_id: str, labels: List[str]) -> bool: + """IMAP doesn't support labels like Gmail, but supports flags.""" + if not self._credentials_configured or not self.client: + logger.error("IMAP NOT CONFIGURED: Cannot update flags") + return False + + try: + # Convert labels to IMAP flags + imap_flags = self._labels_to_flags(labels) + self.client.set_flags([int(email_id)], imap_flags) + return True + except Exception as e: + logger.error(f"Error setting IMAP flags: {e}") + return False + + def batch_update(self, updates: List[Dict[str, Any]]) -> bool: + """Batch update IMAP flags.""" + if not self._credentials_configured or not self.client: + logger.error("IMAP NOT CONFIGURED: Cannot batch update") + return False + + try: + for update in updates: + self.update_labels(update['email_id'], update.get('labels', [])) + logger.info(f"Batch updated {len(updates)} emails") + return True + except Exception as e: + logger.error(f"Batch update error: {e}") + return False + + def _labels_to_flags(self, labels: List[str]) -> List[str]: + """Convert label list to IMAP flags.""" + # Map common labels to IMAP flags + flag_map = { + 'junk': '\\Junk', + 'spam': '\\Junk', + 'archive': '\\All', + 'trash': '\\Trash', + 'starred': '\\Flagged', + } + + flags = [] + for label in labels: + if label.lower() in flag_map: + flags.append(flag_map[label.lower()]) + else: + # IMAP allows custom keywords + flags.append(label) + + return flags + + def is_connected(self) -> bool: + """Check if connected.""" + return self._credentials_configured and self.client is not None diff --git a/src/export/__init__.py b/src/export/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/llm/__init__.py b/src/llm/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/llm/base.py b/src/llm/base.py new file mode 100644 index 0000000..fbf01eb --- /dev/null +++ b/src/llm/base.py @@ -0,0 +1,42 @@ +"""Abstract LLM provider interface.""" +from abc import ABC, abstractmethod +from typing import Optional, Dict, Any +import logging + +logger = logging.getLogger(__name__) + + +class BaseLLMProvider(ABC): + """Abstract base class for LLM providers.""" + + def __init__(self, name: str = "base"): + """Initialize LLM provider.""" + self.name = name + self.logger = logging.getLogger(f"{__name__}.{self.__class__.__name__}") + + @abstractmethod + def complete(self, prompt: str, **kwargs) -> str: + """ + Get completion from LLM. + + Args: + prompt: Input prompt + **kwargs: Model-specific parameters (temperature, max_tokens, etc.) 
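+
+        Minimal subclass sketch (``EchoProvider`` is hypothetical, e.g. for
+        tests; the real implementations live in ``ollama.py`` and
+        ``openai_compat.py``)::
+
+            class EchoProvider(BaseLLMProvider):
+                def complete(self, prompt: str, **kwargs) -> str:
+                    return prompt
+
+                def test_connection(self) -> bool:
+                    return True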
+ + Returns: + LLM response text + """ + pass + + @abstractmethod + def test_connection(self) -> bool: + """Test if LLM is available and working.""" + pass + + def is_available(self) -> bool: + """Check if provider is available.""" + try: + return self.test_connection() + except Exception as e: + self.logger.error(f"Provider check failed: {e}") + return False diff --git a/src/llm/ollama.py b/src/llm/ollama.py new file mode 100644 index 0000000..1d5bdfa --- /dev/null +++ b/src/llm/ollama.py @@ -0,0 +1,140 @@ +"""Ollama LLM provider for local model inference.""" +import logging +import time +from typing import Optional, Dict, Any + +from .base import BaseLLMProvider + +logger = logging.getLogger(__name__) + + +class OllamaProvider(BaseLLMProvider): + """ + Local LLM provider using Ollama. + + Status: Requires Ollama running locally + - Default: http://localhost:11434 + - Models: qwen3:4b (calibration), qwen3:1.7b (classification) + - If Ollama unavailable: Returns graceful error + """ + + def __init__( + self, + base_url: str = "http://localhost:11434", + model: str = "qwen3:1.7b", + temperature: float = 0.1, + max_tokens: int = 500, + timeout: int = 30, + retry_attempts: int = 3 + ): + """Initialize Ollama provider.""" + super().__init__(name="ollama") + self.base_url = base_url + self.model = model + self.temperature = temperature + self.max_tokens = max_tokens + self.timeout = timeout + self.retry_attempts = retry_attempts + self.client = None + self._available = False + + self._initialize() + + def _initialize(self) -> None: + """Initialize Ollama client.""" + try: + import ollama + self.client = ollama.Client(host=self.base_url) + self.logger.info(f"Ollama provider initialized: {self.base_url}") + + # Test connection + if self.test_connection(): + self._available = True + self.logger.info(f"Ollama connected, model: {self.model}") + else: + self.logger.warning("Ollama connection test failed") + self._available = False + + except ImportError: + self.logger.error("ollama package not installed: pip install ollama") + self._available = False + except Exception as e: + self.logger.error(f"Ollama initialization failed: {e}") + self._available = False + + def complete(self, prompt: str, **kwargs) -> str: + """ + Get completion from Ollama. 
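+
+        Makes up to ``retry_attempts`` attempts, sleeping with exponential
+        backoff (2s, 4s, ...) between failures before re-raising the last error.
+
+        Example (sketch; assumes Ollama is running and the model is pulled):
+            >>> provider = OllamaProvider(model="qwen3:1.7b")
+            >>> provider.complete("Reply with one word: OK")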
+ + Args: + prompt: Input prompt + **kwargs: Override temperature, max_tokens, timeout + + Returns: + LLM response + """ + if not self._available or not self.client: + self.logger.error("Ollama not available") + raise RuntimeError("Ollama provider not initialized") + + temperature = kwargs.get('temperature', self.temperature) + max_tokens = kwargs.get('max_tokens', self.max_tokens) + timeout = kwargs.get('timeout', self.timeout) + + attempt = 0 + while attempt < self.retry_attempts: + try: + self.logger.debug(f"Ollama request: model={self.model}, tokens={max_tokens}") + + response = self.client.generate( + model=self.model, + prompt=prompt, + options={ + 'temperature': temperature, + 'num_predict': max_tokens, + 'top_k': 40, + 'top_p': 0.9, + } + ) + + text = response.get('response', '') + self.logger.debug(f"Ollama response: {len(text)} chars") + return text + + except Exception as e: + attempt += 1 + if attempt < self.retry_attempts: + wait_time = 2 ** attempt # Exponential backoff + self.logger.warning(f"Ollama request failed ({attempt}/{self.retry_attempts}), retrying in {wait_time}s: {e}") + time.sleep(wait_time) + else: + self.logger.error(f"Ollama request failed after {self.retry_attempts} attempts: {e}") + raise + + def test_connection(self) -> bool: + """Test if Ollama is running and accessible.""" + if not self.client: + self.logger.warning("Ollama client not initialized") + return False + + try: + # Try to list available models + models = self.client.list() + available_models = [m.get('name', '') for m in models.get('models', [])] + + # Check if requested model is available + if any(self.model in m for m in available_models): + self.logger.info(f"Ollama test passed, model available: {self.model}") + return True + else: + self.logger.warning(f"Ollama running but model not found: {self.model}") + self.logger.warning(f"Available models: {available_models}") + return False + + except Exception as e: + self.logger.error(f"Ollama connection test failed: {e}") + return False + + def is_available(self) -> bool: + """Check if provider is available.""" + return self._available diff --git a/src/llm/openai_compat.py b/src/llm/openai_compat.py new file mode 100644 index 0000000..69faa74 --- /dev/null +++ b/src/llm/openai_compat.py @@ -0,0 +1,144 @@ +"""OpenAI-compatible LLM provider.""" +import logging +import os +from typing import Optional, Dict, Any + +from .base import BaseLLMProvider + +logger = logging.getLogger(__name__) + + +class OpenAIProvider(BaseLLMProvider): + """ + OpenAI-compatible LLM provider. 
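+
+    Example (sketch; assumes OPENAI_API_KEY is set in the environment):
+        >>> provider = OpenAIProvider(model="gpt-4o-mini")
+        >>> if provider.is_available():
+        ...     print(provider.complete("Say hello"))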
+ + Status: Requires OpenAI API key + - Can use OpenAI API or any OpenAI-compatible endpoint + - Requires: OPENAI_API_KEY environment variable or config + - If API unavailable: Returns graceful error + """ + + def __init__( + self, + api_key: Optional[str] = None, + base_url: str = "https://api.openai.com/v1", + model: str = "gpt-4o-mini", + temperature: float = 0.1, + max_tokens: int = 500, + timeout: int = 30, + retry_attempts: int = 3 + ): + """Initialize OpenAI provider.""" + super().__init__(name="openai") + self.api_key = api_key or os.getenv('OPENAI_API_KEY') + self.base_url = base_url + self.model = model + self.temperature = temperature + self.max_tokens = max_tokens + self.timeout = timeout + self.retry_attempts = retry_attempts + self.client = None + self._available = False + + self._initialize() + + def _initialize(self) -> None: + """Initialize OpenAI client.""" + try: + from openai import OpenAI + + if not self.api_key: + self.logger.error("OpenAI API key not configured") + self.logger.error("Set OPENAI_API_KEY environment variable or pass api_key parameter") + self._available = False + return + + self.client = OpenAI( + api_key=self.api_key, + base_url=self.base_url if self.base_url != "https://api.openai.com/v1" else None, + timeout=self.timeout + ) + + self.logger.info(f"OpenAI provider initialized: {self.base_url}") + + # Test connection + if self.test_connection(): + self._available = True + self.logger.info(f"OpenAI connected, model: {self.model}") + else: + self.logger.warning("OpenAI connection test failed") + self._available = False + + except ImportError: + self.logger.error("openai package not installed: pip install openai") + self._available = False + except Exception as e: + self.logger.error(f"OpenAI initialization failed: {e}") + self._available = False + + def complete(self, prompt: str, **kwargs) -> str: + """ + Get completion from OpenAI API. 
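+
+        Retries are immediate (no backoff delay, unlike the Ollama provider).
+        Raises RuntimeError if the provider failed to initialize.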
+ + Args: + prompt: Input prompt + **kwargs: Override temperature, max_tokens, timeout + + Returns: + LLM response + """ + if not self._available or not self.client: + self.logger.error("OpenAI not available") + raise RuntimeError("OpenAI provider not initialized") + + temperature = kwargs.get('temperature', self.temperature) + max_tokens = kwargs.get('max_tokens', self.max_tokens) + + attempt = 0 + while attempt < self.retry_attempts: + try: + self.logger.debug(f"OpenAI request: model={self.model}, tokens={max_tokens}") + + response = self.client.chat.completions.create( + model=self.model, + messages=[{"role": "user", "content": prompt}], + temperature=temperature, + max_tokens=max_tokens, + timeout=self.timeout + ) + + text = response.choices[0].message.content + self.logger.debug(f"OpenAI response: {len(text)} chars") + return text + + except Exception as e: + attempt += 1 + if attempt < self.retry_attempts: + self.logger.warning(f"OpenAI request failed ({attempt}/{self.retry_attempts}), retrying: {e}") + else: + self.logger.error(f"OpenAI request failed after {self.retry_attempts} attempts: {e}") + raise + + def test_connection(self) -> bool: + """Test if OpenAI API is accessible.""" + if not self.client or not self.api_key: + self.logger.warning("OpenAI client not initialized") + return False + + try: + # Try a minimal request + response = self.client.chat.completions.create( + model=self.model, + messages=[{"role": "user", "content": "test"}], + max_tokens=10 + ) + self.logger.info(f"OpenAI test passed") + return True + + except Exception as e: + self.logger.error(f"OpenAI connection test failed: {e}") + return False + + def is_available(self) -> bool: + """Check if provider is available.""" + return self._available diff --git a/src/models/__init__.py b/src/models/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/processing/__init__.py b/src/processing/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/utils/__init__.py b/src/utils/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/src/utils/config.py b/src/utils/config.py new file mode 100644 index 0000000..c3c5d4c --- /dev/null +++ b/src/utils/config.py @@ -0,0 +1,191 @@ +"""Configuration management system for email-sorter.""" +import os +import yaml +import logging +from pathlib import Path +from typing import Dict, Any, Optional +from pydantic import BaseModel, Field + +logger = logging.getLogger(__name__) + + +class CalibrationConfig(BaseModel): + """Calibration phase configuration.""" + sample_size: int = 1500 + sample_strategy: str = "stratified" + validation_size: int = 300 + min_confidence: float = 0.6 + + +class ProcessingConfig(BaseModel): + """Processing pipeline configuration.""" + batch_size: int = 100 + llm_queue_size: int = 100 + parallel_workers: int = 4 + checkpoint_interval: int = 1000 + checkpoint_dir: str = "checkpoints" + + +class ClassificationConfig(BaseModel): + """Classification configuration.""" + default_threshold: float = 0.75 + min_threshold: float = 0.60 + max_threshold: float = 0.90 + adjustment_step: float = 0.05 + adjustment_frequency: int = 1000 + category_thresholds: Dict[str, float] = Field(default_factory=dict) + + +class OllamaConfig(BaseModel): + """Ollama LLM provider configuration.""" + base_url: str = "http://localhost:11434" + calibration_model: str = "qwen3:4b" + classification_model: str = "qwen3:1.7b" + temperature: float = 0.1 + max_tokens: int = 500 + timeout: int = 30 + retry_attempts: int = 3 + + +class 
OpenAIConfig(BaseModel): + """OpenAI API configuration.""" + base_url: str = "https://api.openai.com/v1" + api_key: Optional[str] = None + calibration_model: str = "gpt-4o-mini" + classification_model: str = "gpt-4o-mini" + temperature: float = 0.1 + max_tokens: int = 500 + + +class LLMConfig(BaseModel): + """LLM provider configuration.""" + provider: str = "ollama" # ollama or openai + ollama: OllamaConfig = Field(default_factory=OllamaConfig) + openai: OpenAIConfig = Field(default_factory=OpenAIConfig) + fallback_enabled: bool = True + + +class EmailProvidersConfig(BaseModel): + """Email provider configurations.""" + gmail: Dict[str, Any] = Field(default_factory=lambda: {"batch_size": 100}) + microsoft: Dict[str, Any] = Field(default_factory=lambda: {"batch_size": 100}) + imap: Dict[str, Any] = Field(default_factory=lambda: {"timeout": 30, "batch_size": 50}) + + +class FeaturesConfig(BaseModel): + """Feature extraction configuration.""" + text_features: Dict[str, Any] = Field( + default_factory=lambda: { + "max_vocab_size": 10000, + "ngram_range": [1, 2], + "min_df": 2, + "max_df": 0.95, + } + ) + embedding_model: str = "all-MiniLM-L6-v2" + embedding_batch_size: int = 32 + + +class ExportConfig(BaseModel): + """Export configuration.""" + format: str = "json" + include_confidence: bool = True + create_report: bool = True + output_dir: str = "results" + + +class LoggingConfig(BaseModel): + """Logging configuration.""" + level: str = "INFO" + file: str = "logs/email-sorter.log" + format: str = "%(asctime)s - %(name)s - %(levelname)s - %(message)s" + + +class CleanupConfig(BaseModel): + """Cleanup configuration.""" + delete_temp_files: bool = True + delete_repo_after: bool = False + temp_dir: str = ".email-sorter-tmp" + + +class Config(BaseModel): + """Main configuration model.""" + version: str = "1.0.0" + calibration: CalibrationConfig = Field(default_factory=CalibrationConfig) + processing: ProcessingConfig = Field(default_factory=ProcessingConfig) + classification: ClassificationConfig = Field(default_factory=ClassificationConfig) + llm: LLMConfig = Field(default_factory=LLMConfig) + email_providers: EmailProvidersConfig = Field(default_factory=EmailProvidersConfig) + features: FeaturesConfig = Field(default_factory=FeaturesConfig) + export: ExportConfig = Field(default_factory=ExportConfig) + logging: LoggingConfig = Field(default_factory=LoggingConfig) + cleanup: CleanupConfig = Field(default_factory=CleanupConfig) + + class Config: + extra = "allow" + + @classmethod + def from_yaml(cls, config_path: str) -> "Config": + """Load configuration from YAML file.""" + if not os.path.exists(config_path): + logger.warning(f"Config file not found: {config_path}, using defaults") + return cls() + + try: + with open(config_path, 'r') as f: + config_dict = yaml.safe_load(f) or {} + return cls(**config_dict) + except Exception as e: + logger.error(f"Error loading config from {config_path}: {e}") + return cls() + + def to_yaml(self, output_path: str) -> None: + """Save configuration to YAML file.""" + Path(output_path).parent.mkdir(parents=True, exist_ok=True) + with open(output_path, 'w') as f: + yaml.dump(self.dict(), f, default_flow_style=False) + + +def load_config(config_path: Optional[str] = None) -> Config: + """Load configuration from file or use defaults.""" + if config_path is None: + # Try common locations + for path in ["config/default_config.yaml", "config/config.yaml", ".env"]: + if os.path.exists(path): + config_path = path + break + + if config_path: + return 
Config.from_yaml(config_path) + else: + logger.info("No config file found, using default configuration") + return Config() + + +def load_categories(categories_path: str = "config/categories.yaml") -> Dict[str, Dict]: + """Load category definitions from YAML.""" + if not os.path.exists(categories_path): + logger.warning(f"Categories file not found: {categories_path}") + return {} + + try: + with open(categories_path, 'r') as f: + data = yaml.safe_load(f) or {} + return data.get('categories', {}) + except Exception as e: + logger.error(f"Error loading categories: {e}") + return {} + + +def load_features(features_path: str = "config/features.yaml") -> Dict[str, Any]: + """Load feature configuration from YAML.""" + if not os.path.exists(features_path): + logger.warning(f"Features file not found: {features_path}") + return {} + + try: + with open(features_path, 'r') as f: + return yaml.safe_load(f) or {} + except Exception as e: + logger.error(f"Error loading features: {e}") + return {} diff --git a/src/utils/logging.py b/src/utils/logging.py new file mode 100644 index 0000000..8496768 --- /dev/null +++ b/src/utils/logging.py @@ -0,0 +1,74 @@ +"""Logging configuration and management.""" +import logging +import sys +from pathlib import Path +from typing import Optional + +try: + from rich.logging import RichHandler + HAS_RICH = True +except ImportError: + HAS_RICH = False + + +def setup_logging( + level: str = "INFO", + log_file: Optional[str] = None, + use_rich: bool = True +) -> logging.Logger: + """ + Setup logging with console and optional file handlers. + + Args: + level: Logging level (DEBUG, INFO, WARNING, ERROR, CRITICAL) + log_file: Optional file path for log output + use_rich: Use rich formatting if available + + Returns: + Configured logger instance + """ + # Create logs directory if needed + if log_file: + Path(log_file).parent.mkdir(parents=True, exist_ok=True) + + # Get root logger + logger = logging.getLogger() + logger.setLevel(level) + + # Remove existing handlers + logger.handlers = [] + + # Console handler with optional rich formatting + if use_rich and HAS_RICH: + console_handler = RichHandler( + rich_tracebacks=True, + markup=True, + show_time=True, + show_path=False + ) + else: + console_handler = logging.StreamHandler(sys.stdout) + + console_handler.setLevel(level) + console_formatter = logging.Formatter( + '%(asctime)s - %(name)s - %(levelname)s - %(message)s' + ) + console_handler.setFormatter(console_formatter) + logger.addHandler(console_handler) + + # File handler if specified + if log_file: + file_handler = logging.FileHandler(log_file) + file_handler.setLevel(level) + file_formatter = logging.Formatter( + '%(asctime)s - %(name)s - %(levelname)s - %(message)s' + ) + file_handler.setFormatter(file_formatter) + logger.addHandler(file_handler) + + return logger + + +def get_logger(name: str) -> logging.Logger: + """Get a logger instance for a module.""" + return logging.getLogger(name) diff --git a/tests/__init__.py b/tests/__init__.py new file mode 100644 index 0000000..e69de29 diff --git a/tests/conftest.py b/tests/conftest.py new file mode 100644 index 0000000..1462079 --- /dev/null +++ b/tests/conftest.py @@ -0,0 +1,112 @@ +"""Pytest configuration and fixtures.""" +import pytest +from datetime import datetime +from src.email_providers.base import Email, Attachment +from src.utils.config import load_config, load_categories + + +@pytest.fixture +def config(): + """Load test configuration.""" + return load_config() + + +@pytest.fixture +def categories(): + """Load test 
categories.""" + return load_categories() + + +@pytest.fixture +def sample_email(): + """Create a sample email for testing.""" + return Email( + id='test-1', + subject='Meeting at 3pm today', + sender='john@company.com', + sender_name='John Doe', + date=datetime.now(), + body='Let\'s discuss the Q4 project. Attached is the proposal.', + body_snippet='Let\'s discuss the Q4 project.', + has_attachments=True, + attachments=[ + Attachment( + filename='proposal.pdf', + mime_type='application/pdf', + size=102400 + ) + ], + headers={'Subject': 'Meeting at 3pm today'}, + labels=[], + is_read=False, + provider='gmail' + ) + + +@pytest.fixture +def sample_emails(): + """Create multiple sample emails.""" + emails = [] + + # Auth email + emails.append(Email( + id='auth-1', + subject='Verify your account', + sender='noreply@bank.com', + body='Your verification code is 123456', + body_snippet='Your verification code is 123456', + date=datetime.now(), + provider='gmail' + )) + + # Invoice email + emails.append(Email( + id='invoice-1', + subject='Invoice #INV-2024-001', + sender='billing@vendor.com', + body='Please find attached invoice for October services.', + body_snippet='Please find attached invoice', + has_attachments=True, + attachments=[ + Attachment('invoice.pdf', 'application/pdf', 50000) + ], + date=datetime.now(), + provider='gmail' + )) + + # Newsletter + emails.append(Email( + id='newsletter-1', + subject='Weekly Digest - Oct 21', + sender='newsletter@blog.com', + body='This week in tech... Click here to read more.', + body_snippet='This week in tech', + date=datetime.now(), + provider='gmail' + )) + + # Work email + emails.append(Email( + id='work-1', + subject='Project deadline extended', + sender='manager@company.com', + sender_name='Jane Manager', + body='Team, the Q4 project deadline has been extended to Nov 15.', + body_snippet='Project deadline has been extended', + date=datetime.now(), + provider='gmail' + )) + + # Personal email + emails.append(Email( + id='personal-1', + subject='Dinner this weekend?', + sender='friend@gmail.com', + sender_name='Alex', + body='Hey! 
Want to grab dinner this weekend?', + body_snippet='Want to grab dinner', + date=datetime.now(), + provider='gmail' + )) + + return emails diff --git a/tests/test_classifiers.py b/tests/test_classifiers.py new file mode 100644 index 0000000..9205b3c --- /dev/null +++ b/tests/test_classifiers.py @@ -0,0 +1,138 @@ +"""Tests for classifier modules.""" +import pytest +from src.classification.ml_classifier import MLClassifier +from src.classification.adaptive_classifier import AdaptiveClassifier +from src.classification.feature_extractor import FeatureExtractor +from src.classification.llm_classifier import LLMClassifier +from src.llm.ollama import OllamaProvider +from src.utils.config import load_config, load_categories +import numpy as np + + +def test_ml_classifier_init(): + """Test ML classifier initialization.""" + classifier = MLClassifier() + assert classifier is not None + assert classifier.is_mock is True # Should be mock for testing + assert len(classifier.categories) > 0 + + +def test_ml_classifier_info(): + """Test ML classifier info.""" + classifier = MLClassifier() + info = classifier.get_info() + + assert 'is_loaded' in info + assert 'is_mock' in info + assert 'categories' in info + assert len(info['categories']) == 12 + + +def test_ml_classifier_predict(): + """Test ML classifier prediction.""" + classifier = MLClassifier() + + # Create dummy feature vector + features = np.random.rand(50) + + result = classifier.predict(features) + + assert 'category' in result + assert 'confidence' in result + assert 'probabilities' in result + assert 0 <= result['confidence'] <= 1 + + +def test_adaptive_classifier_init(config, categories): + """Test adaptive classifier initialization.""" + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + llm_classifier = None + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + llm_classifier, + categories, + config.dict() + ) + + assert classifier is not None + assert classifier.feature_extractor is not None + assert classifier.ml_classifier is not None + + +def test_adaptive_classifier_hard_rules(sample_email, config, categories): + """Test hard rule matching in adaptive classifier.""" + from src.email_providers.base import Email + + # Create auth email + auth_email = Email( + id='auth-test', + subject='Verify your account', + sender='noreply@bank.com', + body='Your verification code is 123456' + ) + + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + None, + categories, + config.dict() + ) + + result = classifier._try_hard_rules(auth_email) + + assert result is not None + assert result.category == 'auth' + assert result.method == 'rule' + assert result.confidence == 0.99 + + +def test_adaptive_classifier_stats(config, categories): + """Test adaptive classifier statistics.""" + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + None, + categories, + config.dict() + ) + + stats = classifier.get_stats() + + assert stats.total_emails == 0 + assert stats.rule_matched == 0 + assert stats.ml_classified == 0 + + +def test_llm_classifier_init(config, categories): + """Test LLM classifier initialization.""" + # Create mock LLM provider + llm = OllamaProvider() + + classifier = LLMClassifier(llm, categories, config.dict()) + + assert classifier is not None + assert classifier.provider is not None + assert 
len(classifier.categories) > 0 + + +def test_llm_classifier_status(config, categories): + """Test LLM classifier status.""" + llm = OllamaProvider() + classifier = LLMClassifier(llm, categories, config.dict()) + + status = classifier.get_status() + + assert 'llm_available' in status + assert 'provider' in status + assert 'categories' in status + assert status['provider'] == 'ollama' diff --git a/tests/test_feature_extraction.py b/tests/test_feature_extraction.py new file mode 100644 index 0000000..521d791 --- /dev/null +++ b/tests/test_feature_extraction.py @@ -0,0 +1,141 @@ +"""Tests for feature extraction module.""" +import pytest +import numpy as np +from src.classification.feature_extractor import FeatureExtractor +from src.email_providers.base import Email, Attachment +from datetime import datetime + + +def test_feature_extractor_init(): + """Test feature extractor initialization.""" + extractor = FeatureExtractor() + assert extractor is not None + assert extractor.embedder is not None or extractor.embedder is None # OK if embedder fails + + +def test_extract_structural_features(sample_email): + """Test structural feature extraction.""" + extractor = FeatureExtractor() + features = extractor._extract_structural(sample_email) + + assert 'has_attachments' in features + assert 'attachment_count' in features + assert 'body_length' in features + assert 'subject_length' in features + assert 'time_of_day' in features + assert features['has_attachments'] is True + assert features['attachment_count'] == 1 + + +def test_extract_sender_features(sample_email): + """Test sender feature extraction.""" + extractor = FeatureExtractor() + features = extractor._extract_sender(sample_email) + + assert 'sender_domain' in features + assert 'sender_domain_type' in features + assert 'is_noreply' in features + assert features['sender_domain'] == 'company.com' + assert features['sender_domain_type'] in ['freemail', 'corporate', 'noreply', 'unknown'] + + +def test_extract_patterns(sample_email): + """Test pattern extraction.""" + extractor = FeatureExtractor() + features = extractor._extract_patterns(sample_email) + + assert 'has_otp_pattern' in features + assert 'has_invoice_pattern' in features + assert 'has_meeting' in features + assert all(isinstance(v, bool) or isinstance(v, int) for v in features.values()) + + +def test_pattern_detection_otp(): + """Test OTP pattern detection.""" + email = Email( + id='otp-test', + subject='Verify your identity', + sender='bank@example.com', + body='Your OTP is 456789' + ) + + extractor = FeatureExtractor() + features = extractor._extract_patterns(email) + + assert features.get('has_otp_pattern') is True + + +def test_pattern_detection_invoice(): + """Test invoice pattern detection.""" + email = Email( + id='invoice-test', + subject='Invoice #INV-2024-12345', + sender='billing@vendor.com', + body='Please pay for invoice #INV-2024-12345' + ) + + extractor = FeatureExtractor() + features = extractor._extract_patterns(email) + + assert features.get('has_invoice_pattern') is True + + +def test_full_extraction(sample_email): + """Test full feature extraction.""" + extractor = FeatureExtractor() + features = extractor.extract(sample_email) + + assert features is not None + assert 'embedding' in features + assert 'subject' in features + assert 'body_snippet' in features + + # Check embedding is array + embedding = features['embedding'] + if hasattr(embedding, 'shape'): + assert len(embedding.shape) == 1 + + +def test_batch_extraction(sample_emails): + """Test batch feature 
extraction.""" + extractor = FeatureExtractor() + + # Only test if pandas available + try: + df = extractor.extract_batch(sample_emails) + if df is not None: + assert len(df) == len(sample_emails) + assert df.shape[0] == len(sample_emails) + except ImportError: + pytest.skip("pandas not available") + + +def test_freemail_detection(): + """Test freemail domain detection.""" + email = Email( + id='freemail-test', + subject='Hello', + sender='user@gmail.com', + body='Test' + ) + + extractor = FeatureExtractor() + features = extractor._extract_sender(email) + + assert features.get('sender_domain_type') == 'freemail' + + +def test_noreply_detection(): + """Test noreply sender detection.""" + email = Email( + id='noreply-test', + subject='Alert', + sender='noreply@system.com', + body='Automated alert' + ) + + extractor = FeatureExtractor() + features = extractor._extract_sender(email) + + assert features.get('is_noreply') is True + assert features.get('sender_domain_type') == 'noreply' diff --git a/tests/test_integration.py b/tests/test_integration.py new file mode 100644 index 0000000..15ca27b --- /dev/null +++ b/tests/test_integration.py @@ -0,0 +1,158 @@ +"""Integration tests for email-sorter.""" +import pytest +from src.email_providers.base import MockProvider, Email +from src.classification.feature_extractor import FeatureExtractor +from src.classification.ml_classifier import MLClassifier +from src.classification.adaptive_classifier import AdaptiveClassifier +from src.utils.config import load_config, load_categories +from datetime import datetime + + +def test_end_to_end_mock_classification(sample_emails, config, categories): + """Test end-to-end classification with mock provider.""" + + # Setup mock provider + provider = MockProvider() + provider.connect({}) + + # Add sample emails + for email in sample_emails: + provider.add_mock_email(email) + + # Fetch emails + emails = provider.fetch_emails() + assert len(emails) == len(sample_emails) + + # Setup classifiers + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + None, + categories, + config.dict() + ) + + # Classify + results = classifier.classify_batch(emails) + + assert len(results) == len(emails) + assert all(r.email_id is not None for r in results) + assert all(r.category in categories for r in results) + + # Check stats + stats = classifier.get_stats() + assert stats.total_emails == len(emails) + assert stats.rule_matched + stats.ml_classified + stats.needs_review > 0 + + +def test_mock_provider_integration(): + """Test mock provider""" + provider = MockProvider() + + assert not provider.is_connected() + + provider.connect({}) + assert provider.is_connected() + + email = Email( + id='test-1', + subject='Test email', + sender='test@example.com', + body='Test body' + ) + + provider.add_mock_email(email) + emails = provider.fetch_emails() + + assert len(emails) == 1 + assert emails[0].id == 'test-1' + + provider.disconnect() + assert not provider.is_connected() + + +def test_classification_pipeline_with_auth_email(config, categories): + """Test full classification of authentication email.""" + from src.email_providers.base import Email + + auth_email = Email( + id='auth-1', + subject='Verify your account - Action Required', + sender='noreply@service.com', + body='Your verification code is 654321. 
Do not share this code.', + body_snippet='Your verification code is 654321' + ) + + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + None, + categories, + config.dict() + ) + + result = classifier.classify(auth_email) + + assert result.email_id == 'auth-1' + assert result.category == 'auth' + assert result.method == 'rule' # Should match hard rule + + +def test_classification_pipeline_with_invoice_email(config, categories): + """Test full classification of invoice email.""" + from src.email_providers.base import Email, Attachment + + invoice_email = Email( + id='invoice-1', + subject='Invoice #INV-2024-9999 - October Services', + sender='billing@vendor.com', + body='Please see attached invoice for services rendered.', + body_snippet='See attached invoice', + has_attachments=True, + attachments=[ + Attachment('invoice.pdf', 'application/pdf', 100000) + ] + ) + + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + None, + categories, + config.dict() + ) + + result = classifier.classify(invoice_email) + + assert result.email_id == 'invoice-1' + assert result.category == 'transactional' + + +def test_batch_classification(sample_emails, config, categories): + """Test batch classification.""" + feature_extractor = FeatureExtractor() + ml_classifier = MLClassifier() + + classifier = AdaptiveClassifier( + feature_extractor, + ml_classifier, + None, + categories, + config.dict() + ) + + results = classifier.classify_batch(sample_emails) + + assert len(results) == len(sample_emails) + for result in results: + assert result.category in list(categories.keys()) + ['unknown'] + assert 0 <= result.confidence <= 1
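+
+
+def test_config_yaml_roundtrip(tmp_path):
+    """Round-trip sketch: defaults written by to_yaml reload via from_yaml.
+
+    tmp_path is pytest's built-in fixture; Config is defined in
+    src/utils/config.py.
+    """
+    from src.utils.config import Config
+
+    cfg = Config()
+    path = tmp_path / "config.yaml"
+    cfg.to_yaml(str(path))
+
+    loaded = Config.from_yaml(str(path))
+    assert loaded.version == cfg.version
+    assert loaded.classification.default_threshold == cfg.classification.default_threshold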