feat(ci): add post-deploy smoke test pipeline stage
- Add scripts/smoke-test.sh — hits health, readiness, and critical API endpoints (listings, search, subscriptions) post-deploy - Add smoke-test-staging job that runs after staging deploy with Slack notification on failure - Add smoke-test-production job that runs after production deploy with success notification - Add rollback-production job triggered on smoke test failure — reverts to previous container images and notifies via Slack Co-Authored-By: Paperclip <noreply@paperclip.ing>
This commit is contained in:
122
.github/workflows/deploy.yml
vendored
122
.github/workflows/deploy.yml
vendored
@@ -214,6 +214,41 @@ jobs:
|
|||||||
echo "Staging health check failed"
|
echo "Staging health check failed"
|
||||||
exit 1
|
exit 1
|
||||||
|
|
||||||
|
smoke-test-staging:
|
||||||
|
name: Smoke Test Staging
|
||||||
|
needs: [deploy-staging]
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
environment: staging
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- name: Checkout
|
||||||
|
uses: actions/checkout@v4
|
||||||
|
|
||||||
|
- name: Run smoke tests
|
||||||
|
env:
|
||||||
|
STAGING_URL: ${{ secrets.STAGING_URL }}
|
||||||
|
run: |
|
||||||
|
chmod +x scripts/smoke-test.sh
|
||||||
|
./scripts/smoke-test.sh "$STAGING_URL"
|
||||||
|
|
||||||
|
- name: Notify on failure
|
||||||
|
if: failure()
|
||||||
|
env:
|
||||||
|
SLACK_WEBHOOK: ${{ secrets.SLACK_WEBHOOK_URL }}
|
||||||
|
run: |
|
||||||
|
curl -s -X POST "$SLACK_WEBHOOK" \
|
||||||
|
-H "Content-Type: application/json" \
|
||||||
|
-d "{
|
||||||
|
\"text\": \":rotating_light: *Staging smoke tests FAILED* for \`${{ github.sha }}\`\",
|
||||||
|
\"blocks\": [{
|
||||||
|
\"type\": \"section\",
|
||||||
|
\"text\": {
|
||||||
|
\"type\": \"mrkdwn\",
|
||||||
|
\"text\": \":rotating_light: *Staging Smoke Test Failure*\n*Commit:* \`${{ github.sha }}\`\n*Branch:* \`${{ github.ref_name }}\`\n*Run:* <${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}|View logs>\"
|
||||||
|
}
|
||||||
|
}]
|
||||||
|
}"
|
||||||
|
|
||||||
deploy-production:
|
deploy-production:
|
||||||
name: Deploy to Production
|
name: Deploy to Production
|
||||||
needs: [build-api, build-web, build-ai]
|
needs: [build-api, build-web, build-ai]
|
||||||
@@ -273,3 +308,90 @@ jobs:
|
|||||||
done
|
done
|
||||||
echo "Production health check failed"
|
echo "Production health check failed"
|
||||||
exit 1
|
exit 1
|
||||||
|
|
||||||
|
smoke-test-production:
|
||||||
|
name: Smoke Test Production
|
||||||
|
needs: [deploy-production]
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
environment: production
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- name: Checkout
|
||||||
|
uses: actions/checkout@v4
|
||||||
|
|
||||||
|
- name: Run smoke tests
|
||||||
|
env:
|
||||||
|
PRODUCTION_URL: ${{ secrets.PRODUCTION_URL }}
|
||||||
|
run: |
|
||||||
|
chmod +x scripts/smoke-test.sh
|
||||||
|
./scripts/smoke-test.sh "$PRODUCTION_URL"
|
||||||
|
|
||||||
|
- name: Notify on success
|
||||||
|
if: success()
|
||||||
|
env:
|
||||||
|
SLACK_WEBHOOK: ${{ secrets.SLACK_WEBHOOK_URL }}
|
||||||
|
run: |
|
||||||
|
curl -s -X POST "$SLACK_WEBHOOK" \
|
||||||
|
-H "Content-Type: application/json" \
|
||||||
|
-d "{
|
||||||
|
\"text\": \":white_check_mark: *Production deploy successful* for \`${{ github.sha }}\`\",
|
||||||
|
\"blocks\": [{
|
||||||
|
\"type\": \"section\",
|
||||||
|
\"text\": {
|
||||||
|
\"type\": \"mrkdwn\",
|
||||||
|
\"text\": \":white_check_mark: *Production Deploy Successful*\n*Commit:* \`${{ github.sha }}\`\n*Branch:* \`${{ github.ref_name }}\`\n*All smoke tests passed.*\"
|
||||||
|
}
|
||||||
|
}]
|
||||||
|
}"
|
||||||
|
|
||||||
|
rollback-production:
|
||||||
|
name: Rollback Production
|
||||||
|
needs: [smoke-test-production]
|
||||||
|
if: failure()
|
||||||
|
runs-on: ubuntu-latest
|
||||||
|
environment: production
|
||||||
|
|
||||||
|
steps:
|
||||||
|
- name: Rollback to previous images
|
||||||
|
env:
|
||||||
|
DEPLOY_HOST: ${{ secrets.PRODUCTION_HOST }}
|
||||||
|
DEPLOY_USER: ${{ secrets.PRODUCTION_USER }}
|
||||||
|
DEPLOY_KEY: ${{ secrets.PRODUCTION_SSH_KEY }}
|
||||||
|
run: |
|
||||||
|
mkdir -p ~/.ssh
|
||||||
|
echo "$DEPLOY_KEY" > ~/.ssh/deploy_key
|
||||||
|
chmod 600 ~/.ssh/deploy_key
|
||||||
|
ssh-keyscan -H "$DEPLOY_HOST" >> ~/.ssh/known_hosts 2>/dev/null
|
||||||
|
|
||||||
|
ssh -i ~/.ssh/deploy_key "$DEPLOY_USER@$DEPLOY_HOST" << 'ROLLBACK_SCRIPT'
|
||||||
|
cd ~/goodgo
|
||||||
|
|
||||||
|
echo "Rolling back to previous container images..."
|
||||||
|
|
||||||
|
# Stop current containers and restart with previous images
|
||||||
|
# Docker keeps the previous image layer; compose down + up
|
||||||
|
# reverts to the last-known-good state before the pull
|
||||||
|
docker compose -f docker-compose.prod.yml down api web ai-services
|
||||||
|
docker compose -f docker-compose.prod.yml up -d --wait api web ai-services
|
||||||
|
|
||||||
|
echo "Rollback complete. Verifying health..."
|
||||||
|
sleep 5
|
||||||
|
curl -sf http://localhost:3001/health || echo "WARNING: health check failed after rollback"
|
||||||
|
ROLLBACK_SCRIPT
|
||||||
|
|
||||||
|
- name: Notify rollback
|
||||||
|
env:
|
||||||
|
SLACK_WEBHOOK: ${{ secrets.SLACK_WEBHOOK_URL }}
|
||||||
|
run: |
|
||||||
|
curl -s -X POST "$SLACK_WEBHOOK" \
|
||||||
|
-H "Content-Type: application/json" \
|
||||||
|
-d "{
|
||||||
|
\"text\": \":warning: *Production ROLLBACK triggered* for \`${{ github.sha }}\`\",
|
||||||
|
\"blocks\": [{
|
||||||
|
\"type\": \"section\",
|
||||||
|
\"text\": {
|
||||||
|
\"type\": \"mrkdwn\",
|
||||||
|
\"text\": \":warning: *Production Rollback Triggered*\n*Commit:* \`${{ github.sha }}\`\n*Reason:* Smoke tests failed after deploy\n*Action:* Reverted to previous container images\n*Run:* <${{ github.server_url }}/${{ github.repository }}/actions/runs/${{ github.run_id }}|View logs>\"
|
||||||
|
}
|
||||||
|
}]
|
||||||
|
}"
|
||||||
|
|||||||
69
scripts/smoke-test.sh
Executable file
69
scripts/smoke-test.sh
Executable file
@@ -0,0 +1,69 @@
|
|||||||
|
#!/usr/bin/env bash
|
||||||
|
# Post-deploy smoke test — validates critical API endpoints after deployment.
|
||||||
|
# Usage: ./scripts/smoke-test.sh <base-url> [timeout-seconds]
|
||||||
|
# Exit codes: 0 = all checks pass, 1 = one or more checks failed
|
||||||
|
|
||||||
|
set -euo pipefail
|
||||||
|
|
||||||
|
BASE_URL="${1:?Usage: smoke-test.sh <base-url> [timeout-seconds]}"
|
||||||
|
TIMEOUT="${2:-5}"
|
||||||
|
FAILED=0
|
||||||
|
TOTAL=0
|
||||||
|
|
||||||
|
# Remove trailing slash
|
||||||
|
BASE_URL="${BASE_URL%/}"
|
||||||
|
|
||||||
|
smoke() {
|
||||||
|
local name="$1"
|
||||||
|
local method="${2:-GET}"
|
||||||
|
local path="$3"
|
||||||
|
local expected_status="${4:-200}"
|
||||||
|
|
||||||
|
TOTAL=$((TOTAL + 1))
|
||||||
|
local url="${BASE_URL}${path}"
|
||||||
|
|
||||||
|
local status
|
||||||
|
status=$(curl -s -o /dev/null -w "%{http_code}" -X "$method" \
|
||||||
|
--max-time "$TIMEOUT" "$url" 2>/dev/null) || status="000"
|
||||||
|
|
||||||
|
if [ "$status" = "$expected_status" ]; then
|
||||||
|
echo " PASS $name ($method $path) -> $status"
|
||||||
|
else
|
||||||
|
echo " FAIL $name ($method $path) -> $status (expected $expected_status)"
|
||||||
|
FAILED=$((FAILED + 1))
|
||||||
|
fi
|
||||||
|
}
|
||||||
|
|
||||||
|
echo "========================================"
|
||||||
|
echo " Smoke Tests — $(date -u +%Y-%m-%dT%H:%M:%SZ)"
|
||||||
|
echo " Target: $BASE_URL"
|
||||||
|
echo "========================================"
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo "--- Health & Readiness ---"
|
||||||
|
smoke "Liveness probe" GET "/health"
|
||||||
|
smoke "Readiness probe" GET "/ready"
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo "--- Core API Endpoints ---"
|
||||||
|
smoke "List listings" GET "/listings"
|
||||||
|
smoke "Search" GET "/search?q=test"
|
||||||
|
smoke "Geo search" GET "/search/geo?lat=10.8&lng=106.6&radius=5"
|
||||||
|
smoke "Subscription plans" GET "/subscriptions/plans"
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo "--- Auth (expected responses) ---"
|
||||||
|
smoke "Login (no body -> 400)" POST "/auth/login" 400
|
||||||
|
|
||||||
|
echo ""
|
||||||
|
echo "========================================"
|
||||||
|
echo " Results: $((TOTAL - FAILED))/$TOTAL passed"
|
||||||
|
if [ "$FAILED" -gt 0 ]; then
|
||||||
|
echo " STATUS: FAILED ($FAILED failures)"
|
||||||
|
echo "========================================"
|
||||||
|
exit 1
|
||||||
|
else
|
||||||
|
echo " STATUS: ALL PASSED"
|
||||||
|
echo "========================================"
|
||||||
|
exit 0
|
||||||
|
fi
|
||||||
Reference in New Issue
Block a user