whitehackr · whitehackr · Sep 26, 2025 · Sep 26, 2025 · Sep 27, 2025 · Sep 27, 2025
diff --git a/.claude/settings.local.json b/.claude/settings.local.json
@@ -0,0 +1,9 @@
+{
+  "permissions": {
+    "allow": [
+      "Bash(git add:*)"
+    ],
+    "deny": [],
+    "ask": []
+  }
+}
diff --git a/.env.production.template b/.env.production.template
@@ -0,0 +1,43 @@
+# Production Environment Configuration Template for Railway Deployment
+# These environment variables should be set in Railway's environment settings
+
+# Redis Configuration (automatically set by Railway Redis service)
+# REDIS_URL=redis://...  # Railway sets this automatically
+
+# ML Prediction Storage Configuration
+ML_PREDICTION_TTL=2592000
+ML_STORAGE_VERBOSE=false
+
+# MLflow Configuration (local development - ephemeral in Railway)
+MLFLOW_TRACKING_URI=sqlite:///mlflow.db
+MLFLOW_EXPERIMENT_NAME=bnpl_shadow_mode_production
+
+# API Configuration (Railway injects PORT at runtime; 8000 is only the local default)
+PORT=8000
+
+# Application Environment
+ENVIRONMENT=production
+
+# Logging Configuration
+LOG_LEVEL=INFO
+
+# Performance Tuning
+UVICORN_WORKERS=1
+UVICORN_MAX_REQUESTS=1000
+UVICORN_TIMEOUT_KEEP_ALIVE=5
+
+# Shadow Mode Configuration
+SHADOW_MODE_ENABLED=true
+DEFAULT_DECISION_POLICY=balanced
+
+# Notes for Railway Deployment:
+# 1. Railway automatically sets REDIS_URL when Redis service is added
+# 2. PORT is automatically set by Railway
+# 3. All other variables should be set in Railway's environment settings
+# 4. MLflow data will be stored in the container filesystem (ephemeral)
+# 5. For persistent MLflow storage, configure external MLflow server
+#
+# Known Limitations (to be addressed in future PR):
+# - MLflow data is ephemeral and disappears on container restart
+# - The MLflow UI is not accessible to the team; it is only available in local development
+# - Consider hosted MLflow server for production team collaboration
diff --git a/.env.redis.template b/.env.redis.template
@@ -0,0 +1,21 @@
+# Redis Configuration for ML Prediction Caching - Flit Project
+#
+# INSTRUCTIONS:
+# 1. Copy this file to .env.redis
+# 2. Replace YOUR_REDIS_URL_HERE with the actual Redis URL from Railway
+# 3. Never commit .env.redis to git
+#
+# Get Redis URL from Railway:
+# 1. Go to railway.app -> flit project -> Redis service -> Variables tab
+# 2. Copy REDIS_URL value
+# 3. Paste below
+
+REDIS_URL=YOUR_REDIS_URL_HERE
+REDIS_DB_TRANSACTIONS=0
+REDIS_DB_PREDICTIONS=1
+REDIS_TTL_SECONDS=604800
+RAILWAY_PROJECT=flit
+
+# BigQuery Configuration (replace the placeholder path below with the path to your own GCP credentials JSON)
+BIGQUERY_PROJECT=flit-data-platform
+GOOGLE_APPLICATION_CREDENTIALS=/../../../../.gcp/your-gcp-credentials.json
diff --git a/.gitignore b/.gitignore
@@ -1,2 +1,12 @@
 __pycache__/
 logs/
+
+# Environment files (contain sensitive credentials)
+.env
+.env.*
+!.env.*.template
+
+# MLflow artifacts (local development only)
+mlflow.db
+mlruns/
+mlflow-artifacts/
diff --git a/CLAUDE.md b/CLAUDE.md
@@ -0,0 +1,104 @@
+# Claude Code Assistant Configuration
+
+## Documentation Standards
+
+### PR Comment Technical Depth Requirements
+
+All PR comments documenting technical decisions must meet **Sr Principal Engineer** standards:
+
+#### Content Depth
+- **Educational First**: Write to teach junior, mid, and senior engineers simultaneously
+- **Technical Rigor**: Explain not just what was built, but why design decisions were made
+- **Trade-off Analysis**: Document alternatives considered and rejection rationale
+- **Context Setting**: Establish problem space before presenting solutions
+- **Probabilistic Thinking**: When applicable, explain statistical/ML reasoning in depth
+
+#### Writing Style
+- **Prose Over Bullets**: Use solid prose for complex explanations; bullets only for simple lists
+- **Human Voice**: Sound like an experienced engineer teaching, not AI-generated content
+- **No Attribution**: Never reference "Sr Principal" titles or experience levels, and avoid self-promotion. Do not attribute content to Claude Code.
+- **Depth Without Repetition**: Be comprehensive but never redundant
+
+#### Technical Documentation Pattern
+```markdown
+## Problem Context
+[Establish the technical challenge and why it matters]
+
+### Design Decision: [Clear title]
+[Explain the chosen approach with code examples]
+
+### Alternative Approaches Considered
+[Detail what was rejected and why]
+
+### Technical Deep Dive
+[Explain the underlying principles, statistics, algorithms]
+
+### Trade-offs & Future Considerations
+[Long-term implications and improvement paths]
+```
+
+#### Code Quality Standards
+- Always show working code examples
+- Include performance metrics and benchmarks
+- Document edge cases and error handling
+- Explain statistical/mathematical foundations when relevant
+
+### Development Commands
+
+Standard commands for this repository:
+
+#### Testing
+```bash
+# Run all tests (organized)
+python run_tests.py
+
+# Run specific test categories
+poetry run pytest tests/unit/ -v          # Unit tests only
+poetry run pytest tests/integration/ -v   # Integration tests only
+
+# Run individual test modules
+python tests/unit/features/test_feature_engineering.py
+python tests/unit/models/test_multi_model_predictor.py
+python tests/integration/test_api_endpoints.py
+```
+
+#### Linting & Type Checking
+```bash
+# Run before committing
+poetry run ruff check .
+poetry run mypy .
+```
+
+#### Model Development
+```bash
+# Activate environment
+poetry shell
+
+# Production artifact validation
+poetry run pytest tests/integration/ -v
+```
+
+### Commit Message Standards
+
+- **Concise but complete**: Summarize the change and key technical points
+- **No excessive detail**: Technical depth belongs in PR comments, not commit messages
+- **Imperative mood**: "Implement X" not "Implemented X"
+- **Reference documentation**: When complex decisions are made, reference PR comments
+
+### Known Issues Management
+
+Maintain `docs/models/domain_monthyr_known_issues.md` with:
+- **Clear prioritization**: 🔴 Blocking, 🟡 Important, 🟢 Enhancement
+- **Technical solutions**: Specific code examples for fixes
+- **Business impact**: How issues affect production deployment
+- **Timeline guidance**: When to address each issue
+
+### Educational Philosophy
+
+Every technical document should enable a junior, mid-level, or senior engineer to:
+1. **Understand the problem** being solved
+2. **Learn the reasoning** behind design decisions
+3. **Implement similar solutions** in different contexts
+4. **Recognize trade-offs** in their own work
+
+This documentation serves as both project record and engineering education resource.
diff --git a/DEPLOYMENT.md b/DEPLOYMENT.md
@@ -0,0 +1,35 @@
+# BNPL Production Deployment v0.1.0
+
+## Phase 2: Core Pipeline Development
+
+Production deployment of BNPL ML models with shadow mode capabilities.
+
+### Current Implementation Status
+
+- [x] Production branch setup
+- [x] Artifact validation (6/6 models ready)
+- [ ] Single-transaction feature engineering
+- [ ] Multi-model predictor
+- [ ] API endpoints
+- [ ] Shadow mode controller
+- [ ] Docker + Railway deployment
+
+### Target Architecture
+
+```
+API Request → Feature Engineering → Multi-Model Prediction → Shadow Logging → Business Decision
+```
+
+### Performance Goals
+
+- <100ms transaction processing (research baseline: 2ms)
+- 36 features exactly matching training pipeline
+- Support for 4 model deployment modes
+
+## Next Steps
+
+1. Implement `engineer_single_transaction()` method
+2. Create flexible `BNPLPredictor` class
+3. Build REST API endpoints
+4. Add MLflow integration
+5. Docker containerization for Railway
diff --git a/Dockerfile b/Dockerfile
@@ -0,0 +1,48 @@
+# Production image for the BNPL ML API, deployed on Railway
+FROM python:3.11-slim
+
+# Python: unbuffered output, no .pyc files. pip: no download cache, no version-check notice.
+ENV PIP_DISABLE_PIP_VERSION_CHECK=1 \
+    PIP_NO_CACHE_DIR=1 \
+    PYTHONDONTWRITEBYTECODE=1 \
+    PYTHONUNBUFFERED=1
+
+# Every following instruction, and the running app, operates from /app
+WORKDIR /app
+
+# System packages: build-essential compiles ML wheels, curl backs the HEALTHCHECK (no recommended extras)
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    curl \
+    && rm -rf /var/lib/apt/lists/*
+
+# Poetry configuration (commented out due to Railway build issues)
+# RUN pip install poetry==1.6.1
+# ENV POETRY_NO_INTERACTION=1 \
+#     POETRY_VENV_IN_PROJECT=1 \
+#     POETRY_CACHE_DIR=/tmp/poetry_cache
+# COPY pyproject.toml poetry.lock ./
+# RUN poetry install --only=main && rm -rf $POETRY_CACHE_DIR
+
+# Dependencies come from requirements.txt on Railway (workaround for Poetry connection issues)
+COPY requirements.txt ./
+RUN python -m pip install --no-cache-dir --requirement requirements.txt
+
+# Create the non-root user first and hand it /app, so the app can write there at runtime
+RUN useradd --create-home --shell /bin/bash app \
+    && chown app:app /app
+
+# Copy application code already owned by `app` (avoids a second layer from a recursive chown)
+COPY --chown=app:app . .
+USER app
+
+# Documents the default listening port; at runtime Railway supplies PORT and the server binds to it
+EXPOSE 8000/tcp
+
+# Health check for Railway; falls back to port 8000 when PORT is unset, matching the CMD default
+HEALTHCHECK --interval=30s --timeout=30s --start-period=5s --retries=3 \
+    CMD curl -f http://localhost:${PORT:-8000}/v1/bnpl/health || exit 1
+
+# Start command for Railway (pip-based install); shell form expands PORT, `exec` lets uvicorn receive SIGTERM directly
+# CMD poetry run uvicorn flit_ml.api.main:app --host 0.0.0.0 --port $PORT
+CMD exec python -m uvicorn flit_ml.api.main:app --host 0.0.0.0 --port ${PORT:-8000}