hubmapconsortium
diff --git a/‎src/app.py‎
Lines changed: 4 additions & 0 deletions b/‎src/app.py‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎src/setup_lifecycle_hooks.py‎
Lines changed: 127 additions & 0 deletions b/‎src/setup_lifecycle_hooks.py‎
Lines changed: 127 additions & 0 deletions
diff --git a/‎test/README.md‎
Lines changed: 177 additions & 0 deletions b/‎test/README.md‎
Lines changed: 177 additions & 0 deletions
@@ -38,6 +38,7 @@
 from schema.schema_constants import TriggerTypeEnum
 from metadata_constraints import get_constraints, constraints_json_is_valid
 # from lib.ontology import initialize_ubkg, init_ontology, Ontology, UbkgSDK
+from setup_lifecycle_hooks import setup_flask_lifecycle_hooks
 
 # HuBMAP commons
 from hubmap_commons import string_helper
@@ -64,6 +65,9 @@
 # will be inherited by the sub-module loggers
 logger = logging.getLogger()
 
+# Add in Flask lifecycle hooks which rely on the logger being instantiated
+setup_flask_lifecycle_hooks(app)
+
 # Remove trailing slash / from URL base to avoid "//" caused by config with trailing slash
 app.config['UUID_API_URL'] = app.config['UUID_API_URL'].strip('/')
 app.config['INGEST_API_URL'] = app.config['INGEST_API_URL'].strip('/')
 
@@ -0,0 +1,127 @@
+"""
+Flask lifecycle hooks for API request/response logging.  Uses the existing global logger configured in app.py.
+
+Provides before_request and after_request hooks that log API usage in a
+Common Log Format style, as previously used for the API Gateway custom access log format on AWS.
+https://en.wikipedia.org/wiki/Common_Log_Format#Combined_Log_Format
+
+Log format:
+    $sourceIp $caller $user [$requestTime] "$method $resourcePath $protocol" $status $responseLength $requestId
+replacement for AWS API Gateway custom access log format:
+    $context.identity.sourceIp $context.identity.caller $context.identity.user [$context.requestTime]
+    "$context.httpMethod $context.resourcePath $context.protocol"
+    $context.status $context.responseLength $context.requestId
+
+Example log output:
+    [2026-03-07 10:30:45] DEBUG in setup_lifecycle_hooks: Request started: GET /entities/abc123 from 172.19.0.1 [ID: req-1709809845-1234]
+    [2026-03-07 10:30:45] INFO in setup_lifecycle_hooks: 172.19.0.1 - user@example.com [07/Mar/2026:10:30:45 +0000] "GET /entities/abc123 HTTP/1.1" 200 1234 req-1709809845-1234
+"""
+
+import logging
+import secrets
+import time
+from datetime import datetime, timezone
+
+from flask import request, g
+
+# Use the same logger configuration as app.py
+logger = logging.getLogger(__name__)
+
+def setup_flask_lifecycle_hooks(app):
+    """
+    Register Flask lifecycle hooks for request/response logging.
+
+    Sets up before_request and after_request handlers that log all API calls
+    through this module's logger (logging.getLogger(__name__)).
+
+    Args:
+        app: Flask application instance
+
+    Usage:
+        from setup_lifecycle_hooks import setup_flask_lifecycle_hooks
+
+        app = Flask(__name__)
+        # ... existing logger configuration ...
+        setup_flask_lifecycle_hooks(app)
+    """
+
+    @app.before_request
+    def log_endpoint_request():
+        """
+        Log basic request information at DEBUG level when request starts.
+
+        Runs BEFORE any route function executes.
+        Stores the request start time and a request ID on flask.g so the
+        after_request hook can report them.
+        """
+        # Read the clock once so the stored start time and the ID agree
+        started_at = time.time()
+        g.request_start_time = started_at
+
+        # Request ID: millisecond timestamp plus a random suffix. The suffix
+        # must not be derived from the client address, otherwise two requests
+        # from the same client in the same millisecond share an ID.
+        g.request_id = f"req-{int(started_at * 1000)}-{secrets.token_hex(4)}"
+
+        # Lazy %-formatting: the message is only built when DEBUG is enabled
+        logger.debug(
+            "Request started: %s %s from %s [ID: %s]",
+            request.method, request.path, request.remote_addr, g.request_id
+        )
+
+    @app.after_request
+    def log_endpoint_response(response):
+        """
+        Log complete API usage in AWS API Gateway format at INFO level.
+
+        Runs AFTER route function executes (or after error handler if route failed).
+        Has access to both request and response data.
+
+        Format matches AWS API Gateway custom access logs:
+            $sourceIp $caller $user [$requestTime] "$method $resourcePath $protocol" $status $responseLength $requestId
+
+        Args:
+            response: Flask response object
+
+        Returns:
+            response: The same response object, unchanged
+        """
+        source_ip = request.remote_addr or '-'
+
+        # Caller - not available without AWS IAM, use '-'
+        caller = '-'
+
+        # User from X-Hubmap-User header (set by hubmap-auth after authorization)
+        # Falls back to '-' if not authenticated
+        user = request.headers.get('X-Hubmap-User', '-')
+
+        # Request time in AWS/Apache format: [DD/MMM/YYYY:HH:MM:SS +0000].
+        # Prefer the start time captured in before_request so the value is the
+        # request time rather than the response time; fall back to "now" when
+        # that hook did not run for this request.
+        started_at = getattr(g, 'request_start_time', None)
+        if started_at is None:
+            request_moment = datetime.now(timezone.utc)
+        else:
+            request_moment = datetime.fromtimestamp(started_at, tz=timezone.utc)
+        request_time = request_moment.strftime('%d/%b/%Y:%H:%M:%S +0000')
+
+        # Response length (content length in bytes)
+        response_length = response.content_length
+        if response_length is None:
+            if response.direct_passthrough or response.is_streamed:
+                # Never read the body of a streamed/passthrough response just
+                # to log its size: that would buffer the whole stream or raise
+                # RuntimeError, turning a logging hook into a request failure.
+                response_length = '-'
+            else:
+                response_length = len(response.data)
+
+        # Request ID (generated in before_request, or '-' if not available)
+        request_id = getattr(g, 'request_id', '-')
+
+        # $sourceIp $caller $user [$requestTime] "$method $resourcePath $protocol" $status $responseLength $requestId
+        logger.info(
+            '%s %s %s [%s] "%s %s %s" %s %s %s',
+            source_ip, caller, user,
+            request_time,
+            request.method, request.path,
+            request.environ.get('SERVER_PROTOCOL', 'HTTP/1.1'),
+            response.status_code, response_length, request_id
+        )
+
+        # Must return response unchanged for Flask
+        return response
@@ -0,0 +1,177 @@
+# Entity-API Test Suite
+
+This directory contains all tests for the entity-api service, organized by test type and deployment environment.
+
+## Directory Structure
+
+```
+test/
+├── README.md                    # This file - test suite overview
+├── localhost/                   # Tests for localhost Docker deployment
+│   ├── integration/            # Integration tests with hubmap-auth
+│   └── performance/            # Performance benchmarks (future)
+└── [existing test files]       # Other test types
+```
+
+## Test Categories
+
+### Localhost Tests (`localhost/`)
+
+Tests for entity-api running in Docker Desktop for local development and proof-of-concept deployments.
+
+**When to run:** Before pushing changes that affect localhost deployment, Docker configuration, or hubmap-auth integration.
+
+**See:** [localhost/README.md](localhost/README.md)
+
+### Integration Tests (`localhost/integration/`)
+
+End-to-end tests verifying entity-api integrates correctly with hubmap-auth for authorization over the `gateway_hubmap` Docker network.
+
+**See:** [localhost/integration/README.md](localhost/integration/README.md)
+
+### Performance Tests (`localhost/performance/`) - Future
+
+Load testing and performance benchmarks for localhost deployment.
+
+## Quick Start
+
+### Run All Tests
+
+```bash
+# Activate virtual environment
+source .venv/bin/activate
+
+# Run all tests
+python -m unittest discover -s test -v
+```
+
+### Run Localhost Integration Tests Only
+
+```bash
+source .venv/bin/activate
+python -m unittest discover -s test/localhost/integration -v
+```
+
+### Prerequisites
+
+1. **Docker containers running:**
+   ```bash
+   # Start hubmap-auth first
+   cd gateway
+   ./docker-localhost.sh start
+   
+   # Then start entity-api (from the gateway directory; assumes both repos are cloned side by side)
+   cd ../entity-api/docker
+   ./docker-localhost.sh start
+   
+   # Verify both are healthy
+   docker ps | grep -E "hubmap-auth|entity-api"
+   ```
+
+2. **Python virtual environment:**
+
+   Tests use the same dependencies as the main application:
+   
+   ```bash
+   # Create virtual environment (first time only)
+   python3 -m venv .venv
+   
+   # Activate virtual environment
+   source .venv/bin/activate
+   
+   # Install application dependencies (includes requests)
+   pip install -r src/requirements.txt
+   ```
+
+## CI/CD Integration
+
+These tests are designed to run in GitHub Actions or similar CI/CD systems. Example workflow:
+
+```yaml
+name: Entity-API Localhost Integration Tests
+
+on: [push, pull_request]
+
+jobs:
+  test:
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v3
+      
+      - name: Checkout gateway repo
+        uses: actions/checkout@v3
+        with:
+          repository: hubmapconsortium/gateway
+          path: gateway
+      
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.13'
+      
+      - name: Create Docker network
+        run: docker network create gateway_hubmap
+      
+      - name: Start hubmap-auth
+        run: |
+          cd gateway
+          ./docker-localhost.sh build
+          ./docker-localhost.sh start
+      
+      - name: Wait for hubmap-auth healthy
+        run: timeout 60 bash -c 'until docker ps | grep hubmap-auth | grep healthy; do sleep 2; done'
+      
+      - name: Start entity-api
+        run: |
+          cd docker
+          ./docker-localhost.sh build
+          ./docker-localhost.sh start
+      
+      - name: Wait for entity-api healthy
+        run: timeout 60 bash -c 'until docker ps | grep entity-api | grep healthy; do sleep 2; done'
+      
+      - name: Install test dependencies
+        run: |
+          python -m venv .venv
+          source .venv/bin/activate
+          pip install -r src/requirements.txt
+      
+      - name: Run integration tests
+        run: |
+          source .venv/bin/activate
+          python -m unittest discover -s test/localhost/integration -v
+```
+
+## Contributing
+
+When adding new tests:
+
+1. **Choose the right directory** - Place tests in the appropriate subdirectory based on type
+2. **Follow existing patterns** - Match the style and structure of existing tests
+3. **Add documentation** - Update relevant README files
+4. **Keep tests independent** - Each test should run in isolation
+5. **Use descriptive names** - Test names should clearly indicate what they verify
+6. **Handle errors gracefully** - Provide actionable error messages
+
+## Test Execution Order
+
+Tests are discovered and run alphabetically by default. If execution order matters:
+
+1. Use `setUpClass` and `tearDownClass` for class-level setup
+2. Use `setUp` and `tearDown` for test-level setup
+3. Name test files to control discovery order if needed
+
+## Getting Help
+
+- **Test failures:** Check container logs with `docker logs entity-api`
+- **Connection errors:** Verify containers are running with `docker ps`
+- **Import errors:** Ensure virtual environment is activated
+- **Docker issues:** Check Docker Desktop is running
+- **Auth failures:** Verify hubmap-auth is running and healthy
+
+## Related Documentation
+
+- [Entity-API Deployment Guide](../README.md)
+- [Gateway API Endpoints Configuration](../../gateway/api_endpoints.localhost.json)
+- [Docker Compose Configuration](../docker/docker-compose.localhost.yml)
+- [Gateway Test Suite](../../gateway/test/README.md)