feat: Integrate CI workflow for tck mandatory tests (#164)

guglielmo-san · web-flow · commit 4b8f783f43e1 · 2025-11-05T15:04:56.000+01:00
# Description This PR introduces a new CI pipeline that will run automatically on every push and pull request on the main branch. The created pipeline is responsible for running the tck mandatory tests against the newly created sample agent in the tck folder. Thank you for opening a Pull Request! Before submitting your PR, there are a few things you can do to make sure it goes smoothly: - [x] Follow the [`CONTRIBUTING` Guide](https://github.com/google-a2a/a2a-js/blob/main/CONTRIBUTING.md). - [x] Make your Pull Request title in the <https://www.conventionalcommits.org/> specification. - Important Prefixes for [release-please](https://github.com/googleapis/release-please): - `fix:` which represents bug fixes, and correlates to a [SemVer](https://semver.org/) patch. - `feat:` represents a new feature, and correlates to a SemVer minor. - `feat!:`, or `fix!:`, `refactor!:`, etc., which represent a breaking change (indicated by the `!`) and will result in a SemVer major. - [x] Ensure the tests and linter pass - [x] Appropriate docs were updated (if necessary) Fixes #159 🦕
diff --git a/.github/workflows/run-tck.yaml b/.github/workflows/run-tck.yaml
@@ -0,0 +1,104 @@
+name: Run TCK
+
+on:
+  push:
+    branches: [ "main" ]
+  pull_request:
+    branches: [ "main" ]
+
+
+env:
+  # TODO once we have the TCK for 0.4.0 we will need to look at the branch to decide which TCK version to run.
+  # Tag of the TCK
+  TCK_VERSION: 0.3.0.beta3
+  # Tells uv to not need a venv, and instead use system
+  UV_SYSTEM_PYTHON: 1
+  # SUT_JSONRPC_URL to use for the TCK and the server agent
+  SUT_JSONRPC_URL: http://localhost:41241
+  # Slow system on CI
+  TCK_STREAMING_TIMEOUT: 5.0
+
+# Only run the latest job
+concurrency:
+  group: '${{ github.workflow }} @ ${{ github.head_ref || github.ref }}'
+  cancel-in-progress: true
+
+jobs:
+  tck-test:
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout a2a-js
+        uses: actions/checkout@v4
+      - name: Set up Node
+        uses: actions/setup-node@v4
+        with:
+          node-version: 18
+          registry-url: 'https://registry.npmjs.org'
+      - run: |
+          npm ci
+          npm run build
+      - name: Checkout a2a-tck
+        uses: actions/checkout@v4
+        with:
+          repository: a2aproject/a2a-tck
+          path: tck/a2a-tck
+          ref: ${{ env.TCK_VERSION }}
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version-file: "tck/a2a-tck/pyproject.toml"
+      - name: Install uv and Python dependencies
+        run: |
+          pip install uv
+          uv pip install -e .
+        working-directory: tck/a2a-tck
+      - name: Start SUT
+        run: |
+          cd tck
+          npm run tck:sut-agent &
+      - name: Wait for SUT to start
+        run: |
+          URL="${{ env.SUT_JSONRPC_URL }}/.well-known/agent-card.json"
+          EXPECTED_STATUS=200
+          TIMEOUT=120
+          RETRY_INTERVAL=2
+          START_TIME=$(date +%s)
+
+          while true; do
+            # Calculate elapsed time
+            CURRENT_TIME=$(date +%s)
+            ELAPSED_TIME=$((CURRENT_TIME - START_TIME))
+
+            # Check for timeout
+            if [ "$ELAPSED_TIME" -ge "$TIMEOUT" ]; then
+                echo "❌ Timeout: Server did not respond with status $EXPECTED_STATUS within $TIMEOUT seconds."
+                exit 1
+            fi
+
+            # Get the HTTP status code. "|| true" avoids reporting a failure to connect as an error
+            HTTP_STATUS=$(curl --output /dev/null --silent --write-out "%{http_code}" "$URL") || true
+            echo "STATUS: ${HTTP_STATUS}"
+
+            # Check if we got the correct status code
+            if [ "$HTTP_STATUS" -eq "$EXPECTED_STATUS" ]; then
+                echo "✅ Server is up! Received status $HTTP_STATUS after $ELAPSED_TIME seconds."
+                break;
+            fi
+
+            # Wait before retrying
+            echo "⏳ Server not ready (status: $HTTP_STATUS). Retrying in $RETRY_INTERVAL seconds..."
+            sleep "$RETRY_INTERVAL"
+          done
+          
+      - name: Run TCK
+        id: run-tck
+        timeout-minutes: 5
+        run: |
+          ./run_tck.py --sut-url ${{ env.SUT_JSONRPC_URL }} --category mandatory
+        working-directory: tck/a2a-tck
+      - name: Stop SUT
+        if: always()
+        run: |
+          # Find and kill the SUT process
+          pkill -f "npm run tck:sut-agent" || true
+          sleep 2
diff --git a/tck/agent/README.md b/tck/agent/README.md
@@ -0,0 +1,9 @@
+# SUT Agent
+
+This agent is a sample that emulates the task flow in a streaming scenario. It is the SUT (system under test) that the TCK tests run against in CI. To run it, execute the following from the `tck` directory:
+
+```bash
+npm run tck:sut-agent
+```
+
+The agent will start on `http://localhost:41241`.
diff --git a/tck/agent/index.ts b/tck/agent/index.ts
@@ -0,0 +1,221 @@
+import express from "express";
+import { v4 as uuidv4 } from 'uuid'; // For generating unique IDs
+
+import {
+  AgentCard,
+  Task,
+  TaskStatusUpdateEvent,
+  Message
+} from "../../src/index.js";
+import {
+  InMemoryTaskStore,
+  TaskStore,
+  AgentExecutor,
+  RequestContext,
+  ExecutionEventBus,
+  DefaultRequestHandler
+} from "../../src/server/index.js";
+import { A2AExpressApp } from "../../src/server/express/index.js";
+
+/**
+ * SUTAgentExecutor implements the agent's core logic.
+ *
+ * For each request, `execute` publishes in order:
+ *   1. the initial `submitted` task (only when the request has no existing task),
+ *   2. a `working` status update,
+ *   3. after a simulated processing delay, a final `input-required` status
+ *      update carrying the agent's reply.
+ *
+ * `cancelTask` publishes a final `canceled` status update and makes any
+ * in-flight `execute` call for that task return without publishing its reply.
+ */
+class SUTAgentExecutor implements AgentExecutor {
+  /** IDs of the tasks that have been started and not cancelled since. */
+  private runningTask: Set<string> = new Set();
+  /**
+   * Context ID seen for each task ID, so that a cancellation is reported
+   * under the context of the task being cancelled rather than the context of
+   * whichever request happened to arrive last.
+   */
+  private contextIdByTask: Map<string, string> = new Map();
+  /** Context ID of the most recent `execute` call; fallback for unknown task IDs. */
+  private lastContextId?: string;
+
+  /**
+   * Cancels a task and publishes the final `canceled` status update.
+   *
+   * @param taskId ID of the task to cancel.
+   * @param eventBus Bus on which the cancellation event is published.
+   */
+  public cancelTask = async (
+    taskId: string,
+    eventBus: ExecutionEventBus,
+  ): Promise<void> => {
+    this.runningTask.delete(taskId);
+    // Prefer the context recorded for this very task; fall back to the last
+    // seen context only when the task was never executed by this instance.
+    const contextId = this.contextIdByTask.get(taskId) ?? this.lastContextId;
+    this.contextIdByTask.delete(taskId);
+    const cancelledUpdate: TaskStatusUpdateEvent = {
+      kind: 'status-update',
+      taskId: taskId,
+      contextId: contextId,
+      status: {
+        state: 'canceled',
+        timestamp: new Date().toISOString(),
+      },
+      final: true, // Cancellation is a final state
+    };
+    eventBus.publish(cancelledUpdate);
+  };
+
+  /**
+   * Processes one user message and publishes the resulting task events.
+   *
+   * @param requestContext Carries the user message, the task/context IDs and
+   *   the existing task, if any.
+   * @param eventBus Bus on which task and status-update events are published.
+   */
+  async execute(
+    requestContext: RequestContext,
+    eventBus: ExecutionEventBus
+  ): Promise<void> {
+    const userMessage = requestContext.userMessage;
+    const existingTask = requestContext.task;
+
+    // Determine IDs for the task and context
+    const taskId = requestContext.taskId;
+    const contextId = requestContext.contextId;
+
+    this.lastContextId = contextId;
+    this.contextIdByTask.set(taskId, contextId);
+    this.runningTask.add(taskId);
+
+    console.log(
+      `[SUTAgentExecutor] Processing message ${userMessage.messageId} for task ${taskId} (context: ${contextId})`
+    );
+
+    // 1. Publish initial Task event if it's a new task
+    if (!existingTask) {
+      const initialTask: Task = {
+        kind: 'task',
+        id: taskId,
+        contextId: contextId,
+        status: {
+          state: 'submitted',
+          timestamp: new Date().toISOString(),
+        },
+        history: [userMessage], // Start history with the current user message
+        metadata: userMessage.metadata, // Carry over metadata from message if any
+      };
+      eventBus.publish(initialTask);
+    }
+
+    // 2. Publish "working" status update
+    const workingStatusUpdate: TaskStatusUpdateEvent = {
+      kind: 'status-update',
+      taskId: taskId,
+      contextId: contextId,
+      status: {
+        state: 'working',
+        message: {
+          kind: 'message',
+          role: 'agent',
+          messageId: uuidv4(),
+          parts: [{ kind: 'text', text: 'Processing your question' }],
+          taskId: taskId,
+          contextId: contextId,
+        },
+        timestamp: new Date().toISOString(),
+      },
+      final: false,
+    };
+    eventBus.publish(workingStatusUpdate);
+
+    // 3. Publish final task status update
+    const agentReplyText = this.parseInputMessage(userMessage);
+    await new Promise(resolve => setTimeout(resolve, 3000)); // Simulate processing delay
+    // cancelTask removes the ID from runningTask; if that happened during the
+    // delay, the cancellation event is already the task's final event.
+    if (!this.runningTask.has(taskId)) {
+      console.log(
+        `[SUTAgentExecutor] Task ${taskId} was cancelled before processing could complete.`
+      );
+      return;
+    }
+    console.info(`[SUTAgentExecutor] Prompt response: ${agentReplyText}`);
+
+    const agentMessage: Message = {
+      kind: 'message',
+      role: 'agent',
+      messageId: uuidv4(),
+      parts: [{ kind: 'text', text: agentReplyText }],
+      taskId: taskId,
+      contextId: contextId,
+    };
+
+    const finalUpdate: TaskStatusUpdateEvent = {
+      kind: 'status-update',
+      taskId: taskId,
+      contextId: contextId,
+      status: {
+        state: 'input-required',
+        message: agentMessage,
+        timestamp: new Date().toISOString(),
+      },
+      final: true,
+    };
+    eventBus.publish(finalUpdate);
+  }
+
+  /**
+   * Builds the agent's reply from the first text part of the user message.
+   *
+   * @param message The incoming user message.
+   * @returns A canned greeting, a "how are you" answer, an echo of the query,
+   *   or a prompt for input when the message has no (non-blank) text.
+   */
+  parseInputMessage(message: Message): string {
+    const textPart = message.parts.find(part => part.kind === 'text');
+    const query = textPart ? textPart.text.trim() : '';
+
+    if (!query) {
+      return "Hello! Please provide a message for me to respond to.";
+    }
+
+    // Simple responses based on input
+    const queryLower = query.toLowerCase();
+    // "hi" is matched as a whole word: a plain substring test would also fire
+    // on words such as "this" or "which" and hide the branches below.
+    if (queryLower.includes("hello") || /\bhi\b/.test(queryLower)) {
+      return "Hello World! How are you?";
+    } else if (queryLower.includes("how are you")) {
+      return "I'm doing great! Thanks for asking. How can I help you today?";
+    } else {
+      return `Hello World! You said: '${query}'. Please, send me a new message.`;
+    }
+  }
+}
+
+// --- Server Setup ---
+
+/**
+ * Port advertised in the agent card. Resolved with the same expression that
+ * `main()` uses for the listening port, so the card stays correct when the
+ * `PORT` environment variable overrides the default.
+ */
+const SUT_AGENT_PORT = process.env.PORT || 41241;
+/** Base URL (without trailing slash) advertised for the agent. */
+const SUT_AGENT_BASE_URL = `http://localhost:${SUT_AGENT_PORT}`;
+
+/** Agent card describing the SUT agent used for the TCK runs. */
+const SUTAgentCard: AgentCard = {
+  name: 'SUT Agent',
+  description: 'A sample agent to be used as SUT against tck tests.',
+  // Must point at the address the server actually listens on.
+  url: `${SUT_AGENT_BASE_URL}/`,
+  provider: {
+    organization: 'A2A Samples',
+    url: 'https://example.com/a2a-samples'
+  },
+  version: '1.0.0',
+  protocolVersion: '0.3.0',
+  capabilities: {
+    streaming: true,
+    pushNotifications: false, // Assuming not implemented for this agent yet
+    stateTransitionHistory: true, // Agent uses history
+  },
+  defaultInputModes: ['text'],
+  defaultOutputModes: ['text', 'task-status'], // task-status is a common output mode
+  skills: [
+    {
+      id: 'sut_agent',
+      name: 'SUT Agent',
+      description: 'Simulate the general flow of a streaming agent.',
+      tags: ['sut'],
+      examples: ["hi", "hello world", "how are you", "goodbye"],
+      inputModes: ['text'], // Explicitly defining for skill
+      outputModes: ['text', 'task-status'] // Explicitly defining for skill
+    },
+  ],
+  supportsAuthenticatedExtendedCard: false,
+  preferredTransport: 'JSONRPC',
+  additionalInterfaces: [{url: SUT_AGENT_BASE_URL, transport: 'JSONRPC'}],
+};
+
+/**
+ * Wires the SUT agent together and starts the HTTP server.
+ *
+ * The server listens on `process.env.PORT` when it is set, otherwise on 41241.
+ */
+async function main() {
+  // The request handler combines the agent card, an in-memory task store and
+  // the executor.
+  const store: TaskStore = new InMemoryTaskStore();
+  const executor: AgentExecutor = new SUTAgentExecutor();
+  const handler = new DefaultRequestHandler(SUTAgentCard, store, executor);
+
+  // Register the A2A routes on a fresh Express application.
+  const app = new A2AExpressApp(handler).setupRoutes(express());
+
+  // Start listening; an error handed to the callback is rethrown.
+  const PORT = process.env.PORT || 41241;
+  const baseUrl = `http://localhost:${PORT}`;
+  app.listen(PORT, (err) => {
+    if (err) {
+      throw err;
+    }
+    console.log(`[SUTAgent] Server using new framework started on ${baseUrl}`);
+    console.log(`[SUTAgent] Agent Card: ${baseUrl}/.well-known/agent-card.json`);
+    console.log('[SUTAgent] Press Ctrl+C to stop the server');
+  });
+}
+
+main().catch(console.error);
diff --git a/tck/package.json b/tck/package.json
@@ -0,0 +1,9 @@
+{
+  "name": "tck",
+  "version": "1.0.0",
+  "description": "SUT agent for tck tests CI",
+  "scripts": {
+    "tck:sut-agent": "tsx agent/index.ts"
+
+  }
+}