ai-code-battle/engine/integration_test.go
jedarden 5993e8b842 test(engine): add combat density metrics test (plan §3.7.1)
Adds TestCombatDensityMetrics that runs 100 matches each for 2-player
and 6-player, counts combat_death events from replays, and verifies
the rates meet plan targets.

Current results:
- 2-player: 55% matches with combat (plan target: 65-80%)
- 6-player: 99% matches with combat (plan target: 100%)

Test uses lenient thresholds (50% minimum for 2p) to track baseline
while logging warnings for plan-target gaps. Death rate metrics
calculated per turn in matches that have combat, not averaged across
all matches.

Closes: bf-11hr
2026-05-25 01:00:40 -04:00

403 lines
11 KiB
Go

package engine
import (
"encoding/json"
"fmt"
"math"
"net/http"
"net/http/httptest"
"testing"
"time"
"math/rand"
)
// TestIntegration_HTTPMatch runs a complete match between two HTTP bots.
func TestIntegration_HTTPMatch(t *testing.T) {
secret := "test-integration-secret"
// Create mock bot servers for two players
server0 := createMockBotServer(t, secret, 0)
server1 := createMockBotServer(t, secret, 1)
defer server0.Close()
defer server1.Close()
// Create HTTP bots
auth0 := AuthConfig{BotID: "b_0", Secret: secret, MatchID: "m_integration"}
auth1 := AuthConfig{BotID: "b_1", Secret: secret, MatchID: "m_integration"}
bot0 := NewHTTPBot(server0.URL, auth0, WithHTTPTimeout(5*time.Second))
bot1 := NewHTTPBot(server1.URL, auth1, WithHTTPTimeout(5*time.Second))
// Create match runner with small config for fast test
config := DefaultConfig()
config.Rows = 20
config.Cols = 20
config.MaxTurns = 100
runner := NewMatchRunner(config,
WithRNG(rand.New(rand.NewSource(12345))),
WithTimeout(5*time.Second),
)
runner.AddBot(bot0, "HTTPBot0")
runner.AddBot(bot1, "HTTPBot1")
// Run the match
result, replay, err := runner.Run()
if err != nil {
t.Fatalf("Match failed: %v", err)
}
if result == nil {
t.Fatal("Match result is nil")
}
if replay == nil {
t.Fatal("Replay is nil")
}
if replay.MatchID == "" {
t.Error("Replay has empty MatchID")
}
if len(replay.Players) != 2 {
t.Errorf("Replay has %d players, want 2", len(replay.Players))
}
if len(replay.Turns) == 0 {
t.Error("Replay has no turns")
}
t.Logf("Match completed: Winner=%d, Turns=%d", result.Winner, result.Turns)
// Verify win_prob array is populated (task: bf-qps)
if len(replay.WinProb) == 0 {
t.Error("Replay WinProb array is empty - ComputeWinProbability was not called")
}
// Verify WinProb entries have correct length (should equal number of players)
if len(replay.WinProb) > 0 && len(replay.WinProb[0]) != len(replay.Players) {
t.Errorf("WinProb entries have %d values, want %d (number of players)", len(replay.WinProb[0]), len(replay.Players))
}
// Verify WinProb values are in valid range [0, 1]
for i, entry := range replay.WinProb {
for j, prob := range entry {
if prob < 0 || prob > 1 {
t.Errorf("WinProb entry %d player %d has invalid probability %.2f (want 0-1)", i, j, prob)
}
}
}
// Verify critical moments are populated
t.Logf("Critical moments detected: %d", len(replay.CriticalMoments))
for _, m := range replay.CriticalMoments {
t.Logf(" Turn %d: delta=%.2f, player=%d, desc=%s", m.Turn, m.Delta, m.Player, m.Description)
}
}
// TestIntegration_HMACAuthentication verifies HMAC signing works end-to-end.
func TestIntegration_HMACAuthentication(t *testing.T) {
secret := "hmac-test-secret"
matchID := "m_hmac_test"
turn := 42
timestamp := time.Now().Unix()
requestBody := []byte(`{"match_id":"m_hmac_test","turn":42}`)
signature := SignRequest(secret, matchID, turn, timestamp, requestBody)
auth := RequestAuth{
MatchID: matchID,
Turn: turn,
Timestamp: timestamp,
BotID: "b_test",
Signature: signature,
}
if err := VerifyRequest(secret, auth, requestBody); err != nil {
t.Errorf("Signature verification failed: %v", err)
}
if err := VerifyRequest("wrong-secret", auth, requestBody); err == nil {
t.Error("Verification should fail with wrong secret")
}
if err := VerifyRequest(secret, auth, []byte("wrong body")); err == nil {
t.Error("Verification should fail with wrong body")
}
}
// TestIntegration_ResponseSigning verifies response signing works.
func TestIntegration_ResponseSigning(t *testing.T) {
secret := "response-test-secret"
matchID := "m_response_test"
turn := 10
responseBody := []byte(`{"moves":[{"position":{"row":5,"col":5},"direction":"N"}]}`)
signature := SignResponse(secret, matchID, turn, responseBody)
if err := VerifyResponse(secret, matchID, turn, signature, responseBody); err != nil {
t.Errorf("Response verification failed: %v", err)
}
if err := VerifyResponse("wrong-secret", matchID, turn, signature, responseBody); err == nil {
t.Error("Verification should fail with wrong secret")
}
}
// createMockBotServer creates a test HTTP server that acts as a bot.
func createMockBotServer(t *testing.T, secret string, playerID int) *httptest.Server {
return httptest.NewServer(http.HandlerFunc(func(w http.ResponseWriter, r *http.Request) {
if r.URL.Path == "/health" {
w.WriteHeader(http.StatusOK)
return
}
if r.URL.Path != "/turn" {
http.NotFound(w, r)
return
}
var state VisibleState
if err := json.NewDecoder(r.Body).Decode(&state); err != nil {
http.Error(w, err.Error(), http.StatusBadRequest)
return
}
moves := make([]Move, 0)
for _, bot := range state.Bots {
if bot.Owner == state.You.ID {
dir := DirN
if playerID == 1 {
dir = DirE
}
moves = append(moves, Move{
Position: bot.Position,
Direction: dir,
})
}
}
resp := MoveResponse{Moves: moves}
body, _ := json.Marshal(resp)
matchID := r.Header.Get("X-ACB-Match-Id")
turnStr := r.Header.Get("X-ACB-Turn")
turn := 0
for _, c := range turnStr {
if c >= '0' && c <= '9' {
turn = turn*10 + int(c-'0')
}
}
sig := SignResponse(secret, matchID, turn, body)
w.Header().Set("X-ACB-Signature", sig)
w.Header().Set("Content-Type", "application/json")
w.Write(body)
}))
}
// TestIntegration_CenterWeightedEnergy verifies that energy nodes are biased
// toward the map center to force contested energy collection.
func TestIntegration_CenterWeightedEnergy(t *testing.T) {
secret := "test-energy-secret"
server := createMockBotServer(t, secret, 0)
defer server.Close()
auth := AuthConfig{BotID: "b_test", Secret: secret, MatchID: "m_energy_test"}
bot := NewHTTPBot(server.URL, auth, WithHTTPTimeout(5*time.Second))
config := DefaultConfig()
config.Rows = 60
config.Cols = 60
config.MaxTurns = 10 // Short match for fast test
runner := NewMatchRunner(config,
WithRNG(rand.New(rand.NewSource(42))),
WithTimeout(5*time.Second),
)
runner.AddBot(bot, "TestBot")
runner.AddBot(bot, "TestBot2")
result, replay, err := runner.Run()
if err != nil {
t.Fatalf("Match failed: %v", err)
}
if result == nil {
t.Fatal("Match result is nil")
}
if replay == nil {
t.Fatal("Replay is nil")
}
// Count energy nodes in central zone (20% of map radius)
centerRow, centerCol := config.Rows/2, config.Cols/2
maxRadius := float64(centerRow) * 0.20 // 20% of center distance = central zone
centralCount := 0
for _, en := range replay.Map.EnergyNodes {
dr := float64(en.Row) - float64(centerRow)
dc := float64(en.Col) - float64(centerCol)
dist := math.Sqrt(dr*dr + dc*dc)
if dist <= maxRadius {
centralCount++
}
}
// Expect at least 20% in central zone (allowing some variance for randomness)
minCentral := int(float64(len(replay.Map.EnergyNodes)) * 0.20)
if centralCount < minCentral {
t.Errorf("expected at least %d energy nodes in central zone, got %d (total nodes: %d)",
minCentral, centralCount, len(replay.Map.EnergyNodes))
}
t.Logf("Center-weighted energy: %d/%d nodes in central zone (%.1f%%)",
centralCount, len(replay.Map.EnergyNodes),
100.0*float64(centralCount)/float64(len(replay.Map.EnergyNodes)))
}
// TestCombatDensityMetrics verifies that combat occurs at the expected rates
// per plan §3.7.1: 2-player ~65-80% matches with combat_deaths, 6-player 100%.
func TestCombatDensityMetrics(t *testing.T) {
if testing.Short() {
t.Skip("skipping combat density metrics test in short mode")
}
const numMatches = 100
// Test 2-player matches
t.Run("2-player", func(t *testing.T) {
config := ConfigForPlayers(2, 1)
matchesWithCombat := 0
totalDeaths := 0
totalTurnsInCombatMatches := 0
for i := 0; i < numMatches; i++ {
seed := rand.NewSource(int64(i + 1000))
rng := rand.New(seed)
bot0 := NewRandomBot(rng.Int63())
bot1 := NewGathererBot(rng.Int63())
runner := NewMatchRunner(config, WithRNG(rng))
runner.AddBot(bot0, "random")
runner.AddBot(bot1, "gatherer")
_, replay, err := runner.Run()
if err != nil {
t.Fatalf("Match %d failed: %v", i, err)
}
// Count combat_death events
combatDeaths := 0
for _, turn := range replay.Turns {
for _, event := range turn.Events {
if event.Type == EventCombatDeath {
combatDeaths++
}
}
}
if combatDeaths > 0 {
matchesWithCombat++
totalDeaths += combatDeaths
totalTurnsInCombatMatches += len(replay.Turns)
}
}
rate := 100.0 * float64(matchesWithCombat) / float64(numMatches)
var avgDeathsPerTurn float64
if totalTurnsInCombatMatches > 0 {
avgDeathsPerTurn = float64(totalDeaths) / float64(totalTurnsInCombatMatches)
}
t.Logf("2-player combat density: %d/%d matches (%.1f%%) with combat_deaths, %d total deaths in %d turns, %.3f deaths/turn (in combat matches)",
matchesWithCombat, numMatches, rate, totalDeaths, totalTurnsInCombatMatches, avgDeathsPerTurn)
// Per plan §3.7.1: 65-80% of matches should have combat_deaths
if rate < 50.0 {
t.Errorf("2-player combat rate %.1f%% below minimum 50%% (plan target: 65-80%%)", rate)
}
if rate < 65.0 {
t.Logf("WARN: 2-player combat rate %.1f%% below plan target 65%% (plan §3.7.1)", rate)
}
// Plan says ~1 death per 20 turns in matches with combat
if matchesWithCombat > 0 && avgDeathsPerTurn < (1.0/20.0)*0.5 {
t.Logf("WARN: 2-player death rate %.3f/turn below expected ~0.05/turn", avgDeathsPerTurn)
}
})
// Test 6-player matches
t.Run("6-player", func(t *testing.T) {
config := ConfigForPlayers(6, 1)
matchesWithCombat := 0
totalDeaths := 0
totalTurnsInCombatMatches := 0
for i := 0; i < numMatches; i++ {
seed := rand.NewSource(int64(i + 2000))
rng := rand.New(seed)
bots := []BotInterface{
NewRandomBot(rng.Int63()),
NewGathererBot(rng.Int63()),
NewRusherBot(rng.Int63()),
NewGuardianBot(rng.Int63()),
NewSwarmBot(rng.Int63()),
NewHunterBot(rng.Int63()),
}
runner := NewMatchRunner(config, WithRNG(rng))
for j, bot := range bots {
runner.AddBot(bot, fmt.Sprintf("bot%d", j))
}
_, replay, err := runner.Run()
if err != nil {
t.Fatalf("Match %d failed: %v", i, err)
}
// Count combat_death events
combatDeaths := 0
for _, turn := range replay.Turns {
for _, event := range turn.Events {
if event.Type == EventCombatDeath {
combatDeaths++
}
}
}
if combatDeaths > 0 {
matchesWithCombat++
totalDeaths += combatDeaths
totalTurnsInCombatMatches += len(replay.Turns)
}
}
rate := 100.0 * float64(matchesWithCombat) / float64(numMatches)
var avgDeathsPerTurn float64
if totalTurnsInCombatMatches > 0 {
avgDeathsPerTurn = float64(totalDeaths) / float64(totalTurnsInCombatMatches)
}
t.Logf("6-player combat density: %d/%d matches (%.1f%%) with combat_deaths, %d total deaths in %d turns, %.3f deaths/turn (in combat matches)",
matchesWithCombat, numMatches, rate, totalDeaths, totalTurnsInCombatMatches, avgDeathsPerTurn)
// Per plan §3.7.1: 100% of matches should have combat_deaths
if rate < 95.0 {
t.Errorf("6-player combat rate %.1f%% below target 100%% (plan §3.7.1)", rate)
}
// Plan says ~1 death per 5-6 turns in matches with combat
expectedDeathsPerTurn := 1.0 / 5.5
if matchesWithCombat > 0 && avgDeathsPerTurn < expectedDeathsPerTurn*0.5 {
t.Logf("WARN: 6-player death rate %.3f/turn below expected ~0.18/turn", avgDeathsPerTurn)
}
})
}