chore: refactor tests

dannykopping · dannykopping · commit c2f9c79c6a18 · 2026-03-11T09:57:41.000+02:00
Signed-off-by: Danny Kopping <danny@coder.com>
diff --git a/internal/integrationtest/bridge_test.go b/internal/integrationtest/bridge_test.go
@@ -126,72 +126,76 @@ func TestAnthropicMessages(t *testing.T) {
 func TestAnthropicMessagesModelThoughts(t *testing.T) {
 	t.Parallel()
 
-	t.Run("thinking captured with builtin tool", func(t *testing.T) {
-		t.Parallel()
-
-		cases := []struct {
-			name               string
-			streaming          bool
-			fixture            []byte
-			expectedToolCallID string
-			expectedThoughts   []string
-		}{
-			{
-				name:               "single thinking block/streaming",
-				streaming:          true,
-				fixture:            fixtures.AntSingleBuiltinTool,
-				expectedToolCallID: "toolu_01RX68weRSquLx6HUTj65iBo",
-				expectedThoughts:   []string{"The user wants me to read"},
-			},
-			{
-				name:               "single thinking block/blocking",
-				streaming:          false,
-				fixture:            fixtures.AntSingleBuiltinTool,
-				expectedToolCallID: "toolu_01AusGgY5aKFhzWrFBv9JfHq",
-				expectedThoughts:   []string{"The user wants me to read"},
-			},
-			{
-				name:               "multiple thinking blocks/streaming",
-				streaming:          true,
-				fixture:            fixtures.AntMultiThinkingBuiltinTool,
-				expectedToolCallID: "toolu_01RX68weRSquLx6HUTj65iBo",
-				expectedThoughts:   []string{"The user wants me to read", "I should use the Read tool"},
-			},
-			{
-				name:               "multiple thinking blocks/blocking",
-				streaming:          false,
-				fixture:            fixtures.AntMultiThinkingBuiltinTool,
-				expectedToolCallID: "toolu_01AusGgY5aKFhzWrFBv9JfHq",
-				expectedThoughts:   []string{"The user wants me to read", "I should use the Read tool"},
-			},
-		}
+	cases := []struct {
+		name               string
+		streaming          bool
+		fixture            []byte
+		expectedToolCallID string
+		expectedThoughts   []string // nil means no tool usages expected at all
+	}{
+		{
+			name:               "single thinking block/streaming",
+			streaming:          true,
+			fixture:            fixtures.AntSingleBuiltinTool,
+			expectedToolCallID: "toolu_01RX68weRSquLx6HUTj65iBo",
+			expectedThoughts:   []string{"The user wants me to read"},
+		},
+		{
+			name:               "single thinking block/blocking",
+			streaming:          false,
+			fixture:            fixtures.AntSingleBuiltinTool,
+			expectedToolCallID: "toolu_01AusGgY5aKFhzWrFBv9JfHq",
+			expectedThoughts:   []string{"The user wants me to read"},
+		},
+		{
+			name:               "multiple thinking blocks/streaming",
+			streaming:          true,
+			fixture:            fixtures.AntMultiThinkingBuiltinTool,
+			expectedToolCallID: "toolu_01RX68weRSquLx6HUTj65iBo",
+			expectedThoughts:   []string{"The user wants me to read", "I should use the Read tool"},
+		},
+		{
+			name:               "multiple thinking blocks/blocking",
+			streaming:          false,
+			fixture:            fixtures.AntMultiThinkingBuiltinTool,
+			expectedToolCallID: "toolu_01AusGgY5aKFhzWrFBv9JfHq",
+			expectedThoughts:   []string{"The user wants me to read", "I should use the Read tool"},
+		},
+		{
+			name:      "no thoughts without tool calls",
+			streaming: true,
+			fixture:   fixtures.AntSimple, // This fixture contains thoughts, but they're not associated with tool calls.
+		},
+	}
 
-		for _, tc := range cases {
-			t.Run(tc.name, func(t *testing.T) {
-				t.Parallel()
+	for _, tc := range cases {
+		t.Run(tc.name, func(t *testing.T) {
+			t.Parallel()
 
-				ctx, cancel := context.WithTimeout(t.Context(), time.Second*30)
-				t.Cleanup(cancel)
+			ctx, cancel := context.WithTimeout(t.Context(), time.Second*30)
+			t.Cleanup(cancel)
 
-				fix := fixtures.Parse(t, tc.fixture)
-				upstream := newMockUpstream(t, ctx, newFixtureResponse(fix))
+			fix := fixtures.Parse(t, tc.fixture)
+			upstream := newMockUpstream(t, ctx, newFixtureResponse(fix))
 
-				bridgeServer := newBridgeTestServer(t, ctx, upstream.URL)
+			bridgeServer := newBridgeTestServer(t, ctx, upstream.URL)
 
-				reqBody, err := sjson.SetBytes(fix.Request(), "stream", tc.streaming)
-				require.NoError(t, err)
-				resp := bridgeServer.makeRequest(t, http.MethodPost, pathAnthropicMessages, reqBody)
-				require.Equal(t, http.StatusOK, resp.StatusCode)
+			reqBody, err := sjson.SetBytes(fix.Request(), "stream", tc.streaming)
+			require.NoError(t, err)
+			resp := bridgeServer.makeRequest(t, http.MethodPost, pathAnthropicMessages, reqBody)
+			require.Equal(t, http.StatusOK, resp.StatusCode)
 
-				if tc.streaming {
-					sp := aibridge.NewSSEParser()
-					require.NoError(t, sp.Parse(resp.Body))
-					assert.Contains(t, sp.AllEvents(), "message_start")
-					assert.Contains(t, sp.AllEvents(), "message_stop")
-				}
+			if tc.streaming {
+				sp := aibridge.NewSSEParser()
+				require.NoError(t, sp.Parse(resp.Body))
+				assert.Contains(t, sp.AllEvents(), "message_start")
+				assert.Contains(t, sp.AllEvents(), "message_stop")
+			}
 
-				// Verify tool usage was recorded with associated model thoughts.
-				toolUsages := bridgeServer.Recorder.RecordedToolUsages()
+			toolUsages := bridgeServer.Recorder.RecordedToolUsages()
+			if tc.expectedThoughts == nil {
+				assert.Empty(t, toolUsages)
+			} else {
 				require.Len(t, toolUsages, 1)
 				assert.Equal(t, "Read", toolUsages[0].Tool)
 				assert.Equal(t, tc.expectedToolCallID, toolUsages[0].ToolCallID)
@@ -200,40 +204,11 @@ func TestAnthropicMessagesModelThoughts(t *testing.T) {
 				for i, expected := range tc.expectedThoughts {
 					assert.Contains(t, toolUsages[0].ModelThoughts[i].Content, expected)
 				}
+			}
 
-				bridgeServer.Recorder.VerifyAllInterceptionsEnded(t)
-			})
-		}
-	})
-
-	t.Run("no thoughts without tool calls", func(t *testing.T) {
-		t.Parallel()
-
-		ctx, cancel := context.WithTimeout(t.Context(), time.Second*30)
-		t.Cleanup(cancel)
-
-		// Use the simple fixture which has no tool calls — any thinking blocks
-		// should not be persisted since they can't be associated with a tool call.
-		fix := fixtures.Parse(t, fixtures.AntSimple)
-		upstream := newMockUpstream(t, ctx, newFixtureResponse(fix))
-
-		bridgeServer := newBridgeTestServer(t, ctx, upstream.URL)
-
-		reqBody, err := sjson.SetBytes(fix.Request(), "stream", true)
-		require.NoError(t, err)
-		resp := bridgeServer.makeRequest(t, http.MethodPost, pathAnthropicMessages, reqBody)
-		require.Equal(t, http.StatusOK, resp.StatusCode)
-
-		sp := aibridge.NewSSEParser()
-		require.NoError(t, sp.Parse(resp.Body))
-
-		// No tool usages (and therefore no thoughts) should be recorded
-		// when there are no tool calls.
-		toolUsages := bridgeServer.Recorder.RecordedToolUsages()
-		assert.Empty(t, toolUsages)
-
-		bridgeServer.Recorder.VerifyAllInterceptionsEnded(t)
-	})
+			bridgeServer.Recorder.VerifyAllInterceptionsEnded(t)
+		})
+	}
 }
 
 func TestAWSBedrockIntegration(t *testing.T) {
diff --git a/internal/integrationtest/responses_test.go b/internal/integrationtest/responses_test.go
@@ -919,61 +919,64 @@ func TestResponsesInjectedTool(t *testing.T) {
 func TestResponsesModelThoughts(t *testing.T) {
 	t.Parallel()
 
-	t.Run("reasoning captured with builtin tool", func(t *testing.T) {
-		t.Parallel()
-
-		cases := []struct {
-			name               string
-			fixture            []byte
-			expectedToolCallID string
-			expectedThoughts   []string
-		}{
-			{
-				name:               "single reasoning/blocking",
-				fixture:            fixtures.OaiResponsesBlockingSingleBuiltinTool,
-				expectedToolCallID: "call_CJSaa2u51JG996575oVljuNq",
-				expectedThoughts:   []string{"The user wants to add 3 and 5"},
-			},
-			{
-				name:               "single reasoning/streaming",
-				fixture:            fixtures.OaiResponsesStreamingBuiltinTool,
-				expectedToolCallID: "call_7VaiUXZYuuuwWwviCrckxq6t",
-				expectedThoughts:   []string{"The user wants to add 3 and 5"},
-			},
-			{
-				name:               "multiple reasoning items/blocking",
-				fixture:            fixtures.OaiResponsesBlockingMultiReasoningBuiltinTool,
-				expectedToolCallID: "call_CJSaa2u51JG996575oVljuNq",
-				expectedThoughts:   []string{"The user wants to add 3 and 5", "After adding, I will check if the result is prime"},
-			},
-			{
-				name:               "multiple reasoning items/streaming",
-				fixture:            fixtures.OaiResponsesStreamingMultiReasoningBuiltinTool,
-				expectedToolCallID: "call_7VaiUXZYuuuwWwviCrckxq6t",
-				expectedThoughts:   []string{"The user wants to add 3 and 5", "After adding, I will check if the result is prime"},
-			},
-		}
+	cases := []struct {
+		name               string
+		fixture            []byte
+		expectedToolCallID string
+		expectedThoughts   []string // nil means no tool usages expected at all
+	}{
+		{
+			name:               "single reasoning/blocking",
+			fixture:            fixtures.OaiResponsesBlockingSingleBuiltinTool,
+			expectedToolCallID: "call_CJSaa2u51JG996575oVljuNq",
+			expectedThoughts:   []string{"The user wants to add 3 and 5"},
+		},
+		{
+			name:               "single reasoning/streaming",
+			fixture:            fixtures.OaiResponsesStreamingBuiltinTool,
+			expectedToolCallID: "call_7VaiUXZYuuuwWwviCrckxq6t",
+			expectedThoughts:   []string{"The user wants to add 3 and 5"},
+		},
+		{
+			name:               "multiple reasoning items/blocking",
+			fixture:            fixtures.OaiResponsesBlockingMultiReasoningBuiltinTool,
+			expectedToolCallID: "call_CJSaa2u51JG996575oVljuNq",
+			expectedThoughts:   []string{"The user wants to add 3 and 5", "After adding, I will check if the result is prime"},
+		},
+		{
+			name:               "multiple reasoning items/streaming",
+			fixture:            fixtures.OaiResponsesStreamingMultiReasoningBuiltinTool,
+			expectedToolCallID: "call_7VaiUXZYuuuwWwviCrckxq6t",
+			expectedThoughts:   []string{"The user wants to add 3 and 5", "After adding, I will check if the result is prime"},
+		},
+		{
+			name:    "no thoughts without tool calls",
+			fixture: fixtures.OaiResponsesStreamingCodex, // This fixture contains reasoning, but it's not associated with tool calls.
+		},
+	}
 
-		for _, tc := range cases {
-			t.Run(tc.name, func(t *testing.T) {
-				t.Parallel()
+	for _, tc := range cases {
+		t.Run(tc.name, func(t *testing.T) {
+			t.Parallel()
 
-				ctx, cancel := context.WithTimeout(t.Context(), time.Second*30)
-				t.Cleanup(cancel)
+			ctx, cancel := context.WithTimeout(t.Context(), time.Second*30)
+			t.Cleanup(cancel)
 
-				fix := fixtures.Parse(t, tc.fixture)
-				upstream := newMockUpstream(t, ctx, newFixtureResponse(fix))
+			fix := fixtures.Parse(t, tc.fixture)
+			upstream := newMockUpstream(t, ctx, newFixtureResponse(fix))
 
-				bridgeServer := newBridgeTestServer(t, ctx, upstream.URL)
+			bridgeServer := newBridgeTestServer(t, ctx, upstream.URL)
 
-				resp := bridgeServer.makeRequest(t, http.MethodPost, pathOpenAIResponses, fix.Request())
-				require.Equal(t, http.StatusOK, resp.StatusCode)
+			resp := bridgeServer.makeRequest(t, http.MethodPost, pathOpenAIResponses, fix.Request())
+			require.Equal(t, http.StatusOK, resp.StatusCode)
 
-				_, err := io.ReadAll(resp.Body)
-				require.NoError(t, err)
+			_, err := io.ReadAll(resp.Body)
+			require.NoError(t, err)
 
-				// Verify tool usage was recorded with associated model thoughts.
-				toolUsages := bridgeServer.Recorder.RecordedToolUsages()
+			toolUsages := bridgeServer.Recorder.RecordedToolUsages()
+			if tc.expectedThoughts == nil {
+				require.Empty(t, toolUsages)
+			} else {
 				require.Len(t, toolUsages, 1)
 				require.Equal(t, "add", toolUsages[0].Tool)
 				require.Equal(t, tc.expectedToolCallID, toolUsages[0].ToolCallID)
@@ -982,34 +985,9 @@ func TestResponsesModelThoughts(t *testing.T) {
 				for i, expected := range tc.expectedThoughts {
 					require.Contains(t, toolUsages[0].ModelThoughts[i].Content, expected)
 				}
-			})
-		}
-	})
-
-	t.Run("no thoughts without tool calls", func(t *testing.T) {
-		t.Parallel()
-
-		ctx, cancel := context.WithTimeout(t.Context(), time.Second*30)
-		t.Cleanup(cancel)
-
-		// Use the simple fixture which has no tool calls — any reasoning
-		// should not be persisted since it can't be associated with a tool call.
-		fix := fixtures.Parse(t, fixtures.OaiResponsesStreamingCodex)
-		upstream := newMockUpstream(t, ctx, newFixtureResponse(fix))
-
-		bridgeServer := newBridgeTestServer(t, ctx, upstream.URL)
-
-		resp := bridgeServer.makeRequest(t, http.MethodPost, pathOpenAIResponses, fix.Request())
-		require.Equal(t, http.StatusOK, resp.StatusCode)
-
-		_, err := io.ReadAll(resp.Body)
-		require.NoError(t, err)
-
-		// No tool usages (and therefore no thoughts) should be recorded
-		// when there are no tool calls.
-		toolUsages := bridgeServer.Recorder.RecordedToolUsages()
-		require.Empty(t, toolUsages)
-	})
+			}
+		})
+	}
 }
 
 func requireResponsesError(t *testing.T, code int, message string, body []byte) {