# Upstream Stability Investigation Plan

## Observed Symptoms
- JetBrains MCP over SSE never surfaces tools, while stdio loads but drops connections; when this happens the dashboard freezes or the daemon hangs until forced termination (reported on Xubuntu 25.04 running as a user-scoped systemd service).
- Intermittent upstream instability is suspected to stem from SSE transport behaviour and OAuth refresh handling.

## Working Hypotheses (code references)
1. **SSE timeout ejects long-lived streams** – `internal/transport/http.go:225-279` hard-codes `http.Client{Timeout: 180 * time.Second}` for SSE. Go’s client timeout covers the entire request, so an otherwise healthy SSE stream is forcibly closed every three minutes, likely leaving the proxy in a bad state when the upstream cannot recover quickly (see the sketch after this list).
2. **Endpoint bootstrap deadline too aggressive** – the SSE transport waits only 30s for the `endpoint` event (`github.com/mark3labs/mcp-go@v0.38.0/client/transport/sse.go:176-187`). If JetBrains (or other) servers delay emitting the endpoint while doing OAuth/device checks, we fail before tools load.
3. **OAuth browser flow races with remote UX** – manual OAuth waits 30s for the callback (`internal/upstream/core/connection.go:1722-1759`). In a remote/systemd scenario the user may need more time (or use an out-of-band browser), causing repeated failures and triggering connection churn.
4. **Connection-loss handling gaps** – we never register `Client.OnConnectionLost(...)` on SSE transports, so HTTP/2 idle resets or GOAWAY frames (which JetBrains emits) go unnoticed until the next RPC, amplifying freeze perceptions. This also limits our ability to surface diagnostics in logs/UI.
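
A minimal sketch of the direction hypothesis 1 points at: bound connection setup via `http.Transport` deadlines instead of `http.Client.Timeout`, which covers the whole response and therefore kills healthy SSE streams. The constructor name and timeout values below are illustrative, not the current code in `internal/transport/http.go`.

```go
package transport

import (
	"net"
	"net/http"
	"time"
)

// newSSEHTTPClient is a sketch: bound the dial, TLS, and response-header
// phases, but leave the open SSE stream itself without an overall deadline.
func newSSEHTTPClient() *http.Client {
	return &http.Client{
		// No Client.Timeout: an SSE response is expected to stay open indefinitely.
		Transport: &http.Transport{
			DialContext: (&net.Dialer{
				Timeout:   10 * time.Second, // TCP connect deadline
				KeepAlive: 30 * time.Second, // detect dead peers on idle links
			}).DialContext,
			TLSHandshakeTimeout:   10 * time.Second,
			ResponseHeaderTimeout: 30 * time.Second, // server must start the stream promptly
			IdleConnTimeout:       90 * time.Second,
		},
	}
}
```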

## Phase 1 – Reproduce & Capture Baseline
- Configure two JetBrains upstreams (SSE and stdio) with `log.level=debug` and, if possible, `transport` trace logging.
- While exercising `scripts/run-web-smoke.sh` and manually navigating the UI, collect:
  - Upstream-specific logs under `~/.mcpproxy/logs/<server>.log`.
  - HTTP traces for `/events` (SSE) and `/api/v1` from the proxy (e.g. `MITM_PROXY=1 go run ./cmd/mcpproxy` or curl with `--trace-time`).
  - OAuth callback timing from `internal/oauth` logs to confirm how often the 30s deadline triggers.
- Inspect BoltDB (`bbolt` CLI or `scripts/db-dump.go`) for stored OAuth tokens to see whether refresh metadata is present and being updated (see the read-only dump sketch below).
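
Where `scripts/db-dump.go` is not handy, a read-only walk like the following shows whether token buckets exist and are being rewritten. The database path is an assumption; check the real store layout before trusting the output.

```go
package main

import (
	"fmt"
	"log"
	"os"

	bolt "go.etcd.io/bbolt"
)

func main() {
	// Path is an assumption; point this at the actual mcpproxy BoltDB file.
	db, err := bolt.Open(os.ExpandEnv("$HOME/.mcpproxy/data.db"), 0o600, &bolt.Options{ReadOnly: true})
	if err != nil {
		log.Fatalf("open bolt db: %v", err)
	}
	defer db.Close()

	// Print every bucket and key with the value size: enough to see whether
	// OAuth refresh metadata is being written at all, without decoding it.
	err = db.View(func(tx *bolt.Tx) error {
		return tx.ForEach(func(name []byte, b *bolt.Bucket) error {
			fmt.Printf("bucket %q\n", name)
			return b.ForEach(func(k, v []byte) error {
				fmt.Printf("  %s (%d bytes)\n", k, len(v))
				return nil
			})
		})
	})
	if err != nil {
		log.Fatalf("read bolt db: %v", err)
	}
}
```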

**Verification checklist**
- [ ] Baseline reproduction yields “timeout waiting for endpoint” or “context deadline exceeded” in the logs when SSE fails.
- [ ] Confirm whether OAuth callback timeout entries align with user interaction delays.
- [ ] Identify whether the SSE stream closes at almost exactly 180s of uptime.

## Phase 2 – SSE Transport Hardening
- Audit the full SSE pipeline:
  - Replace the global `http.Client.Timeout` with per-request contexts or keepalive idle deadlines; ensure this does not regress HTTP fallback.
  - Capture GOAWAY/NO_ERROR disconnects by wiring `client.OnConnectionLost` inside `core.connectSSE` and propagate them to the managed client (see the sketch after this list).
  - Revisit the 30s endpoint wait; consider a JetBrains-specific delay or signal logging (e.g. log the time between `Start` and the first `endpoint` frame).
- Develop instrumentation hooks:
  - Record SSE connection uptime, retry counters, and last-error state in `StateManager`.
  - Emit structured events (e.g., `EventTypeUpstreamTransport`) with transport diagnostics for `/events`.
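
A sketch of the `OnConnectionLost` wiring, assuming a zap-style logger and a callback into whoever owns reconnect/state handling; the function shape is simplified relative to the real method in `internal/upstream/core/connection.go`.

```go
package core

import (
	"context"
	"fmt"

	"github.com/mark3labs/mcp-go/client"
	"go.uber.org/zap"
)

// connectSSE (simplified): create the SSE client, register a connection-lost
// handler before starting, and hand disconnect errors to the caller.
func connectSSE(ctx context.Context, name, url string, logger *zap.Logger, onLost func(error)) (*client.Client, error) {
	c, err := client.NewSSEMCPClient(url)
	if err != nil {
		return nil, fmt.Errorf("create sse client: %w", err)
	}

	// Surface GOAWAY frames and idle resets immediately instead of at the next RPC.
	c.OnConnectionLost(func(err error) {
		logger.Warn("sse connection lost", zap.String("upstream", name), zap.Error(err))
		onLost(err) // propagate to the managed client / StateManager
	})

	if err := c.Start(ctx); err != nil {
		return nil, fmt.Errorf("start sse client: %w", err)
	}
	return c, nil
}
```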

**Verification checklist**
- [ ] Stress an SSE upstream for >10 minutes and confirm no forced disconnect occurs due to the client timeout.
- [ ] Simulate endpoint delay (e.g., a proxy that waits 90s before emitting) and confirm the new logic handles it or logs actionable warnings.
- [ ] Ensure managed state transitions (`ready` → `error` → `reconnecting`) align with injected connection-lost scenarios.

## Phase 3 – OAuth Token Lifecycle Review
- Trace the refresh flow end-to-end:
  - Instrument `PersistentTokenStore.SaveToken/GetToken` to log token expiry deltas, guarded by debug level (see the sketch after this list).
  - Validate `MarkOAuthCompletedWithDB` propagation by queuing fake events in BoltDB and ensuring `Manager.processOAuthEvents` consumes them without double-processing.
  - Explore extending the OAuth callback wait window and providing CLI guidance for headless setups (e.g., print the verification URL instead of failing immediately).
- Consider tooling to introspect OAuth state (`/api/v1/oauth/status` or a tray dialog) so users can identify expired/invalid tokens.
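
One way to add the expiry-delta logging without touching the store itself is a decorator. The `Token` and `TokenStore` shapes below are stand-ins for whatever `PersistentTokenStore` actually implements; only the logging shape (debug-level, expiry delta, refresh-token presence) is the point.

```go
package oauth

import (
	"time"

	"go.uber.org/zap"
)

// Token and TokenStore mirror, hypothetically, the interface the persistent
// store satisfies; adjust to the real types before use.
type Token struct {
	AccessToken  string
	RefreshToken string
	Expiry       time.Time
}

type TokenStore interface {
	SaveToken(*Token) error
	GetToken() (*Token, error)
}

type loggingTokenStore struct {
	inner  TokenStore
	logger *zap.Logger
}

// WithExpiryLogging wraps a store so every save/load reports how long the
// token has left, at debug level only.
func WithExpiryLogging(inner TokenStore, logger *zap.Logger) TokenStore {
	return &loggingTokenStore{inner: inner, logger: logger}
}

func (s *loggingTokenStore) SaveToken(t *Token) error {
	s.logger.Debug("saving oauth token",
		zap.Duration("expires_in", time.Until(t.Expiry)),
		zap.Bool("has_refresh_token", t.RefreshToken != ""))
	return s.inner.SaveToken(t)
}

func (s *loggingTokenStore) GetToken() (*Token, error) {
	t, err := s.inner.GetToken()
	if err == nil && t != nil {
		s.logger.Debug("loaded oauth token",
			zap.Duration("expires_in", time.Until(t.Expiry)))
	}
	return t, err
}
```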

**Verification checklist**
- [ ] Refreshing an OAuth token updates BoltDB and triggers a reconnect without manual intervention.
- [ ] Extending the callback timeout (experimentally) eliminates repeated “OAuth authorization timeout” messages in remote environments.
- [ ] Cross-process completion events always drive a reconnect within the expected polling window (≤5s by default).

## Phase 4 – Introspection & User-Facing Diagnostics
- Design lightweight diagnostics:
  - A CLI subcommand (e.g., `mcpproxy debug upstream <name>`) to dump current transport stats, token expiry, last error, and SSE uptime.
  - An optional `/api/v1/diagnostics/upstream` endpoint returning the same payload for UI integration (see the payload sketch after this list).
- Expand logging guidance in `MANUAL_TESTING.md` for capturing SSE issues (e.g., enabling trace on the `transport` logger, how to tail upstream logs).
- Evaluate adding Prometheus-style counters (connection retries, OAuth failures) to aid longer-term monitoring.
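
A sketch of the payload the proposed endpoint could return, shared by the CLI subcommand. Field names and the handler shape are illustrative, not the project's existing API surface; durations serialize as Go nanosecond counts unless custom marshalling is added.

```go
package httpapi

import (
	"encoding/json"
	"net/http"
	"time"
)

// UpstreamDiagnostics is a hypothetical response body covering the signals
// named in the plan: transport stats, state, last error, and token expiry.
type UpstreamDiagnostics struct {
	Name           string        `json:"name"`
	Transport      string        `json:"transport"`        // "sse", "http", or "stdio"
	State          string        `json:"state"`            // ready / error / reconnecting
	ConnectedFor   time.Duration `json:"connected_for"`    // SSE uptime
	RetryCount     int           `json:"retry_count"`
	LastError      string        `json:"last_error,omitempty"`
	TokenExpiresIn time.Duration `json:"token_expires_in"` // zero when no OAuth is configured
}

// diagnosticsHandler resolves an upstream by name and returns its snapshot;
// the lookup callback stands in for however the real server reaches state.
func diagnosticsHandler(lookup func(name string) (UpstreamDiagnostics, bool)) http.HandlerFunc {
	return func(w http.ResponseWriter, r *http.Request) {
		diag, ok := lookup(r.URL.Query().Get("name"))
		if !ok {
			http.Error(w, "unknown upstream", http.StatusNotFound)
			return
		}
		w.Header().Set("Content-Type", "application/json")
		_ = json.NewEncoder(w).Encode(diag)
	}
}
```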

**Verification checklist**
- [ ] Diagnostics output surfaces enough context for a user to determine whether the issue is OAuth, the SSE transport, or an upstream crash.
- [ ] UI/tray can surface a human-readable warning when SSE drops repeatedly (without freezing).
- [ ] A fresh install following the updated guide can reproduce the troubleshooting steps, validating the documentation changes.
