kvbm: sandbox scripts

ryanolson · ryanolson · commit 3ee364227f4d · 2025-12-05T20:07:13.000Z
Signed-off-by: Ryan Olson <rolson@nvidia.com>
diff --git a/.sandbox/launch_vllm_with_connector.sh b/.sandbox/launch_vllm_with_connector.sh
@@ -0,0 +1,155 @@
+#!/bin/bash
+# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+# Launch a vLLM OpenAI-compatible API server with the DynamoConnector for testing.
+#
+# Usage: launch_vllm_with_connector.sh [extra api_server arguments...]
+#
+# Environment overrides:
+#   MODEL     model passed to --model (default: gpt2)
+#   RUST_LOG  exported to the server process (default: debug)
+#   DYN_LOG   exported to the server process (default: debug)
+#
+# WARNING: before launching, this script kills every process whose command line
+# matches "vllm.entrypoints" or "EngineCore", and anything still using the port.
+
+set -e
+
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+REPO_ROOT="$(dirname "$SCRIPT_DIR")"
+
+# Address the API server listens on; shared by cleanup, banner and launch.
+SERVER_HOST="127.0.0.1"
+SERVER_PORT=8000
+
+# =============================================================================
+# Cleanup: Kill any previous vLLM processes
+# =============================================================================
+echo "🧹 Cleaning up previous processes..."
+# Send SIGTERM first so a previous server gets a chance to shut down cleanly,
+# then SIGKILL whatever is left. pkill exits non-zero when nothing matches,
+# which is the normal case here, hence the "|| true".
+pkill -TERM -f "vllm.entrypoints" 2>/dev/null || true
+pkill -TERM -f "EngineCore" 2>/dev/null || true
+sleep 2
+pkill -KILL -f "vllm.entrypoints" 2>/dev/null || true
+pkill -KILL -f "EngineCore" 2>/dev/null || true
+
+# Check if the server port is still in use
+if lsof -i ":$SERVER_PORT" >/dev/null 2>&1; then
+    echo "⚠️  Port $SERVER_PORT is still in use, killing processes..."
+    fuser -k "$SERVER_PORT/tcp" 2>/dev/null || true
+    sleep 1
+fi
+
+# =============================================================================
+# Environment Setup
+# =============================================================================
+
+# Find virtual environment
+# Priority: local venv > local .venv > symlinked .venv. This mirrors rebuild.sh so
+# the server runs from the same environment the bindings were built into.
+if [ -d "$SCRIPT_DIR/venv" ]; then
+    VENV_PATH="$SCRIPT_DIR/venv"
+elif [ -d "$SCRIPT_DIR/.venv" ] && [ ! -L "$SCRIPT_DIR/.venv" ]; then
+    VENV_PATH="$SCRIPT_DIR/.venv"
+elif [ -L "$SCRIPT_DIR/.venv" ] && [ -d "$(readlink -f "$SCRIPT_DIR/.venv")" ]; then
+    VENV_PATH="$(readlink -f "$SCRIPT_DIR/.venv")"
+else
+    echo "❌ No virtual environment found!" >&2
+    exit 1
+fi
+
+# Activate the virtual environment
+source "$VENV_PATH/bin/activate"
+
+# Ensure our kvbm package is in the path. The previous value is appended only
+# when it is non-empty: a trailing ":" would create an empty entry, which Python
+# resolves to the current working directory.
+export PYTHONPATH="$REPO_ROOT/lib/bindings/kvbm/python${PYTHONPATH:+:$PYTHONPATH}"
+
+# =============================================================================
+# Rust Logging Configuration
+# =============================================================================
+# Set RUST_LOG if not already set - enables tracing from Rust components
+# export RUST_LOG="${RUST_LOG:-dynamo_kvbm=debug,dynamo_nova=info,warn}"
+export RUST_LOG="${RUST_LOG:-debug}"
+export DYN_LOG="${DYN_LOG:-debug}"
+
+# =============================================================================
+# vLLM Configuration
+# =============================================================================
+
+# Default model - use gpt2 for quick testing
+MODEL="${MODEL:-gpt2}"
+
+# Configure KV transfer for DynamoConnector
+# The connector is at: kvbm.v2.vllm.schedulers.connector.DynamoConnector
+kv_transfer_config='{
+  "kv_connector": "DynamoConnector",
+  "kv_role": "kv_both",
+  "kv_connector_module_path": "kvbm.v2.vllm.schedulers.connector",
+  "kv_connector_extra_config": {
+    "leader": {
+      "cache": { "host": { "cache_size_gb": 1.0 } },
+      "tokio": { "worker_threads": 2 }
+    },
+    "worker": {
+      "nixl": { "backends": { "UCX": {}, "POSIX": {} } },
+      "tokio": { "worker_threads": 1 }
+    }
+  }
+}'
+
+# =============================================================================
+# Display Configuration
+# =============================================================================
+echo ""
+echo "🚀 Launching vLLM with DynamoConnector"
+echo "=============================================================================="
+echo ""
+echo "Environment:"
+echo "  SCRIPT_DIR:     $SCRIPT_DIR"
+echo "  REPO_ROOT:      $REPO_ROOT"
+echo "  VENV_PATH:      $VENV_PATH"
+echo "  Python:         $(command -v python)"
+echo "  vLLM version:   $(python -c 'import vllm; print(vllm.__version__)')"
+echo "  kvbm version:   $(python -c 'import kvbm; print(kvbm.__version__)' 2>/dev/null || echo 'N/A')"
+echo ""
+echo "PYTHONPATH:"
+# Show at most the first three entries, one per line, each indented
+echo "$PYTHONPATH" | tr ':' '\n' | head -3 | sed 's/^/  /'
+echo ""
+echo "Rust Logging:"
+echo "  RUST_LOG:       $RUST_LOG"
+echo "  DYN_LOG:        $DYN_LOG"
+echo ""
+echo "vLLM Configuration:"
+echo "  Model:          $MODEL"
+echo "  Host:           $SERVER_HOST"
+echo "  Port:           $SERVER_PORT"
+echo "  Enforce Eager:  true"
+echo ""
+echo "KV Transfer Config:"
+echo "$kv_transfer_config" | python -m json.tool 2>/dev/null || echo "$kv_transfer_config"
+echo ""
+echo "GPU Status:"
+nvidia-smi --query-gpu=index,name,memory.free,memory.total --format=csv,noheader 2>/dev/null || echo "  nvidia-smi not available"
+echo ""
+echo "=============================================================================="
+echo ""
+
+# =============================================================================
+# Launch vLLM
+# =============================================================================
+# Using --enforce-eager to avoid CUDA graph compilation overhead during testing.
+# exec replaces this shell, so the server keeps this script's PID; "$@" forwards
+# any extra command-line arguments to the API server.
+exec python -m vllm.entrypoints.openai.api_server \
+  --model "$MODEL" \
+  --kv-transfer-config "$kv_transfer_config" \
+  --enforce-eager \
+  --host "$SERVER_HOST" \
+  --port "$SERVER_PORT" \
+  "$@"
diff --git a/.sandbox/rebuild.sh b/.sandbox/rebuild.sh
@@ -0,0 +1,55 @@
+#!/bin/bash
+# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+# Rebuild the kvbm Python bindings with "maturin develop".
+# The build runs inside a virtual environment found next to this script.
+
+set -e
+
+printf '%s\n' "🔧 Rebuilding KVBM Python bindings..." "=================================="
+
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+REPO_ROOT="$(dirname "$SCRIPT_DIR")"
+KVBM_BINDINGS_DIR="$REPO_ROOT/lib/bindings/kvbm"
+
+# Candidate virtual environment locations, both relative to this script.
+plain_venv="$SCRIPT_DIR/venv"
+dot_venv="$SCRIPT_DIR/.venv"
+
+# Pick the environment to build in. Lookup order: venv/, then a real .venv/
+# directory, then a .venv symlink resolved to the directory it points at.
+if [[ -d "$plain_venv" ]]; then
+    VENV_PATH="$plain_venv"
+elif [[ -d "$dot_venv" && ! -L "$dot_venv" ]]; then
+    VENV_PATH="$dot_venv"
+elif [[ -L "$dot_venv" && -d "$(readlink -f "$dot_venv")" ]]; then
+    VENV_PATH="$(readlink -f "$dot_venv")"
+else
+    printf '%s\n' \
+        "❌ No virtual environment found!" \
+        "   Expected locations:" \
+        "     - $plain_venv" \
+        "     - $dot_venv" \
+        "" \
+        "   Create one with: python -m venv $plain_venv"
+    exit 1
+fi
+
+printf '%s\n' "📦 Using venv: $VENV_PATH"
+
+# Activate the chosen virtual environment
+. "$VENV_PATH/bin/activate"
+
+# maturin is run from the bindings directory
+cd "$KVBM_BINDINGS_DIR"
+
+printf '%s\n' "📦 Building with maturin..." "Build mode: dev (default)" ""
+
+# Run the development build
+maturin develop
+
+printf '%s\n' "" "✅ Build complete!" "Package: kvbm"
+
+# Smoke-test the build: import kvbm._core.v2 and list its public attributes
+python -c "from kvbm._core import v2; print(f'kvbm._core.v2 loaded: {[a for a in dir(v2) if not a.startswith(\"_\")]}')"
diff --git a/.sandbox/test_cmpl_1.sh b/.sandbox/test_cmpl_1.sh
@@ -0,0 +1,21 @@
+#!/bin/bash
+# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+# Send one completion request to a local vLLM server and print the response.
+# Endpoint: http://127.0.0.1:8000/v1/completions
+#
+# Environment overrides:
+#   MODEL  model name put in the request (default: gpt2); should match the
+#          MODEL used by launch_vllm_with_connector.sh
+
+# -sS hides the progress meter but still reports transfer errors, so a caller
+# that captures stdout and stderr gets the response body without meter noise.
+curl -sS -X POST http://127.0.0.1:8000/v1/completions \
+  -H "Content-Type: application/json" \
+  -d '{
+    "model": "'"${MODEL:-gpt2}"'",
+    "prompt": "what is a dynamo? and how did it signify the start of the industrial revolution?",
+    "max_tokens": 16,
+    "temperature": 0
+  }'
diff --git a/.sandbox/test_e2e.sh b/.sandbox/test_e2e.sh
@@ -0,0 +1,141 @@
+#!/bin/bash
+# SPDX-FileCopyrightText: Copyright (c) 2024-2025 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+# SPDX-License-Identifier: Apache-2.0
+
+# All-in-one test script that:
+# 1. Rebuilds Python bindings
+# 2. Launches vLLM with connector
+# 3. Waits for server to be ready
+# 4. Sends test completion request
+# 5. Captures all output
+#
+# Environment overrides:
+#   MAX_WAIT  seconds to wait for the server health check (default: 60)
+
+# pipefail matters here: several steps pipe into tee, and without it a failing
+# step would be masked by tee's successful exit status.
+set -eo pipefail
+
+SCRIPT_DIR="$(cd "$(dirname "$0")" && pwd)"
+LOG_FILE="$SCRIPT_DIR/test_e2e_$(date +%Y%m%d_%H%M%S).log"
+# PID of the background server; stays empty until step 2 has launched it
+VLLM_PID=""
+
+echo "===================================================================="
+echo "End-to-End KVBM Connector Test"
+echo "===================================================================="
+echo ""
+echo "Log file: $LOG_FILE"
+echo ""
+
+# Function to cleanup on exit
+# Runs on every exit path (see the EXIT trap below), pass or fail.
+cleanup() {
+    echo ""
+    echo "Cleaning up..."
+    # Ask the server we started to shut down, and give it a moment to do so
+    if [ -n "$VLLM_PID" ] && kill "$VLLM_PID" 2>/dev/null; then
+        sleep 2
+    fi
+    # Force-kill anything left over; "|| true" because no match is fine
+    pkill -9 -f "vllm.entrypoints" 2>/dev/null || true
+    pkill -9 -f "EngineCore" 2>/dev/null || true
+}
+
+trap cleanup EXIT
+
+# Step 1: Rebuild bindings
+echo "Step 1: Rebuilding Python bindings..."
+echo "---------------------------------------------------------------------"
+if ! "$SCRIPT_DIR/rebuild.sh" 2>&1 | tee -a "$LOG_FILE"; then
+    echo "❌ Rebuild failed!"
+    exit 1
+fi
+
+echo "✅ Rebuild complete"
+echo ""
+
+# Step 2: Launch vLLM in background
+echo "Step 2: Launching vLLM with DynamoConnector..."
+echo "---------------------------------------------------------------------"
+
+# Launch vLLM in background using the existing script.
+# Redirection order matters: stdout is pointed at the log first, then stderr is
+# duplicated onto it, so both streams end up in the log file.
+"$SCRIPT_DIR/launch_vllm_with_connector.sh" >> "$LOG_FILE" 2>&1 &
+VLLM_PID=$!
+
+echo "vLLM launched with PID: $VLLM_PID"
+echo ""
+
+# Step 3: Wait for server to be ready
+echo "Step 3: Waiting for vLLM server to be ready on port 8000..."
+echo "---------------------------------------------------------------------"
+
+MAX_WAIT="${MAX_WAIT:-60}"
+WAIT_COUNT=0
+
+# -f makes curl fail on HTTP error statuses, so only a successful health
+# response ends the wait.
+while ! curl -sf http://127.0.0.1:8000/health &>/dev/null; do
+    if [ "$WAIT_COUNT" -ge "$MAX_WAIT" ]; then
+        echo "❌ Timeout waiting for vLLM server (waited ${MAX_WAIT}s)"
+        exit 1
+    fi
+
+    # Check if process is still running
+    if ! kill -0 "$VLLM_PID" 2>/dev/null; then
+        echo "❌ vLLM process died during startup"
+        echo "Last log lines:"
+        tail -20 "$LOG_FILE" || true
+        exit 1
+    fi
+
+    echo -n "."
+    sleep 1
+    WAIT_COUNT=$((WAIT_COUNT + 1))
+done
+
+echo ""
+echo "✅ vLLM server is ready!"
+echo ""
+
+# Step 4: Send test request
+echo "Step 4: Sending test completion request..."
+echo "---------------------------------------------------------------------"
+
+# Capture the request's exit status instead of letting set -e abort silently
+REQUEST_STATUS=0
+RESPONSE=$("$SCRIPT_DIR/test_cmpl_1.sh" 2>&1 | tee -a "$LOG_FILE") || REQUEST_STATUS=$?
+
+echo "$RESPONSE"
+echo ""
+
+# The request passes only if it was delivered and the body looks like a
+# completion: it contains "choices" and no "error". An empty or truncated
+# response therefore counts as a failure.
+if [ "$REQUEST_STATUS" -ne 0 ] \
+    || grep -q '"error"' <<<"$RESPONSE" \
+    || ! grep -q '"choices"' <<<"$RESPONSE"; then
+    echo "❌ Request failed with error"
+
+    echo ""
+    echo "Recent logs from vLLM:"
+    echo "---------------------------------------------------------------------"
+    tail -50 "$LOG_FILE" | grep -A 10 -i "error\|exception\|traceback" || tail -50 "$LOG_FILE"
+
+    exit 1
+else
+    echo "✅ Request completed successfully"
+fi
+
+echo ""
+echo "===================================================================="
+echo "Test Summary"
+echo "===================================================================="
+echo "✅ Bindings rebuilt"
+echo "✅ vLLM launched and initialized"
+echo "✅ Completion request processed"
+echo ""
+echo "Full logs saved to: $LOG_FILE"
+echo ""