fleet/server/datastore/mysql/campaigns_test.go
Martin Angers 6c0e56ea73
Address multiple redis-related issues observed with live queries (#16855)
#16331 

Doc updates in a separate PR:
https://github.com/fleetdm/fleet/pull/17214

# Checklist for submitter

- [x] Changes file added for user-visible changes in `changes/` or
`orbit/changes/`.
See [Changes
files](https://fleetdm.com/docs/contributing/committing-changes#changes-files)
for more information.
- [x] Input data is properly validated, `SELECT *` is avoided, SQL
injection is prevented (using placeholders for values in statements)
- [x] Added/updated tests
- [x] Manual QA for all new/changed functionality (smoke-tested locally
with osquery-perf simulating 100 hosts, ran a live query, a saved live
query, stopped naturally and stopped before the end, and again via
fleetctl)

---------

Co-authored-by: Victor Lyuboslavsky <victor@fleetdm.com>
Co-authored-by: Victor Lyuboslavsky <victor.lyuboslavsky@gmail.com>
2024-02-27 19:35:27 -06:00

256 lines
8.8 KiB
Go

package mysql
import (
"context"
"math/rand"
"sort"
"testing"
"time"
"github.com/WatchBeam/clock"
"github.com/fleetdm/fleet/v4/server/fleet"
"github.com/fleetdm/fleet/v4/server/test"
"github.com/stretchr/testify/assert"
"github.com/stretchr/testify/require"
)
func TestCampaigns(t *testing.T) {
ds := CreateMySQLDS(t)
cases := []struct {
name string
fn func(t *testing.T, ds *Datastore)
}{
{"DistributedQuery", testCampaignsDistributedQuery},
{"CleanupDistributedQuery", testCampaignsCleanupDistributedQuery},
{"SaveDistributedQuery", testCampaignsSaveDistributedQuery},
{"CompletedCampaigns", testCompletedCampaigns},
}
for _, c := range cases {
t.Run(c.name, func(t *testing.T) {
defer TruncateTables(t, ds)
c.fn(t, ds)
})
}
}
func testCampaignsDistributedQuery(t *testing.T, ds *Datastore) {
user := test.NewUser(t, ds, "Zach", "zwass@fleet.co", true)
mockClock := clock.NewMockClock()
query := test.NewQuery(t, ds, nil, "test", "select * from time", user.ID, false)
campaign := test.NewCampaign(t, ds, query.ID, fleet.QueryRunning, mockClock.Now())
{
retrieved, err := ds.DistributedQueryCampaign(context.Background(), campaign.ID)
require.Nil(t, err)
assert.Equal(t, campaign.QueryID, retrieved.QueryID)
assert.Equal(t, campaign.Status, retrieved.Status)
}
h1 := test.NewHost(t, ds, "foo.local", "192.168.1.10", "1", "1", mockClock.Now())
h2 := test.NewHost(t, ds, "bar.local", "192.168.1.11", "2", "2", mockClock.Now().Add(-1*time.Hour))
h3 := test.NewHost(t, ds, "baz.local", "192.168.1.12", "3", "3", mockClock.Now().Add(-13*time.Minute))
l1 := fleet.LabelSpec{
ID: 1,
Name: "label foo",
Query: "query foo",
}
l2 := fleet.LabelSpec{
ID: 2,
Name: "label bar",
Query: "query bar",
}
err := ds.ApplyLabelSpecs(context.Background(), []*fleet.LabelSpec{&l1, &l2})
require.Nil(t, err)
checkTargets(t, ds, campaign.ID, fleet.HostTargets{})
test.AddHostToCampaign(t, ds, campaign.ID, h1.ID)
checkTargets(t, ds, campaign.ID, fleet.HostTargets{HostIDs: []uint{h1.ID}})
test.AddLabelToCampaign(t, ds, campaign.ID, l1.ID)
checkTargets(t, ds, campaign.ID, fleet.HostTargets{HostIDs: []uint{h1.ID}, LabelIDs: []uint{l1.ID}})
test.AddLabelToCampaign(t, ds, campaign.ID, l2.ID)
checkTargets(t, ds, campaign.ID, fleet.HostTargets{HostIDs: []uint{h1.ID}, LabelIDs: []uint{l1.ID, l2.ID}})
test.AddHostToCampaign(t, ds, campaign.ID, h2.ID)
test.AddHostToCampaign(t, ds, campaign.ID, h3.ID)
checkTargets(t, ds, campaign.ID, fleet.HostTargets{HostIDs: []uint{h1.ID, h2.ID, h3.ID}, LabelIDs: []uint{l1.ID, l2.ID}})
}
func testCampaignsCleanupDistributedQuery(t *testing.T, ds *Datastore) {
ctx := context.Background()
user := test.NewUser(t, ds, "Zach", "zwass@fleet.co", true)
mockClock := clock.NewMockClock()
query := test.NewQuery(t, ds, nil, "test", "select * from time", user.ID, false)
c1 := test.NewCampaign(t, ds, query.ID, fleet.QueryWaiting, mockClock.Now())
c2 := test.NewCampaign(t, ds, query.ID, fleet.QueryRunning, mockClock.Now())
// Cleanup and verify that nothing changed (because time has not
// advanced)
expired, err := ds.CleanupDistributedQueryCampaigns(ctx, mockClock.Now())
require.Nil(t, err)
assert.Equal(t, uint(0), expired)
{
retrieved, err := ds.DistributedQueryCampaign(ctx, c1.ID)
require.Nil(t, err)
assert.Equal(t, c1.QueryID, retrieved.QueryID)
assert.Equal(t, c1.Status, retrieved.Status)
}
{
retrieved, err := ds.DistributedQueryCampaign(ctx, c2.ID)
require.Nil(t, err)
assert.Equal(t, c2.QueryID, retrieved.QueryID)
assert.Equal(t, c2.Status, retrieved.Status)
}
// Add some executions
mockClock.AddTime(1*time.Minute + 1*time.Second)
// Cleanup and verify that the campaign was expired and executions
// deleted appropriately
expired, err = ds.CleanupDistributedQueryCampaigns(ctx, mockClock.Now())
require.Nil(t, err)
assert.Equal(t, uint(1), expired)
{
// c1 should now be complete
retrieved, err := ds.DistributedQueryCampaign(ctx, c1.ID)
require.Nil(t, err)
assert.Equal(t, c1.QueryID, retrieved.QueryID)
assert.Equal(t, fleet.QueryComplete, retrieved.Status)
}
{
retrieved, err := ds.DistributedQueryCampaign(ctx, c2.ID)
require.Nil(t, err)
assert.Equal(t, c2.QueryID, retrieved.QueryID)
assert.Equal(t, c2.Status, retrieved.Status)
}
mockClock.AddTime(24*time.Hour + 1*time.Second)
// Cleanup and verify that the campaign was expired and executions
// deleted appropriately
expired, err = ds.CleanupDistributedQueryCampaigns(ctx, mockClock.Now())
require.Nil(t, err)
assert.Equal(t, uint(1), expired)
{
retrieved, err := ds.DistributedQueryCampaign(ctx, c1.ID)
require.Nil(t, err)
assert.Equal(t, c1.QueryID, retrieved.QueryID)
assert.Equal(t, fleet.QueryComplete, retrieved.Status)
}
{
// c2 should now be complete
retrieved, err := ds.DistributedQueryCampaign(ctx, c2.ID)
require.Nil(t, err)
assert.Equal(t, c2.QueryID, retrieved.QueryID)
assert.Equal(t, fleet.QueryComplete, retrieved.Status)
}
// simulate another old campaign created > 7 days ago
c3 := test.NewCampaign(t, ds, query.ID, fleet.QueryWaiting, mockClock.Now().AddDate(0, 0, -8))
{
retrieved, err := ds.DistributedQueryCampaign(ctx, c3.ID)
require.Nil(t, err)
assert.Equal(t, c3.QueryID, retrieved.QueryID)
assert.Equal(t, fleet.QueryWaiting, retrieved.Status)
}
// cleanup will mark c3 as completed because it was waiting for > 1 minute,
// but it won't return it as recently inactive because it's too old a query.
expired, err = ds.CleanupDistributedQueryCampaigns(ctx, mockClock.Now())
require.Nil(t, err)
assert.Equal(t, uint(1), expired)
// cleanup again does not expire any new campaign and still returns the same
// recently inactive campaigns
expired, err = ds.CleanupDistributedQueryCampaigns(ctx, mockClock.Now())
require.Nil(t, err)
assert.Equal(t, uint(0), expired)
// move time forward 7 days and cleanup again, this time it returns no recent
// inactive campaigns
mockClock.AddTime(7*24*time.Hour + 1*time.Second)
expired, err = ds.CleanupDistributedQueryCampaigns(ctx, mockClock.Now())
require.Nil(t, err)
assert.Equal(t, uint(0), expired)
}
func testCampaignsSaveDistributedQuery(t *testing.T, ds *Datastore) {
user := test.NewUser(t, ds, t.Name(), t.Name()+"zwass@fleet.co", true)
mockClock := clock.NewMockClock()
query := test.NewQuery(t, ds, nil, t.Name()+"test", "select * from time", user.ID, false)
c1 := test.NewCampaign(t, ds, query.ID, fleet.QueryWaiting, mockClock.Now())
gotC, err := ds.DistributedQueryCampaign(context.Background(), c1.ID)
require.NoError(t, err)
require.Equal(t, fleet.QueryWaiting, gotC.Status)
c1.Status = fleet.QueryComplete
require.NoError(t, ds.SaveDistributedQueryCampaign(context.Background(), c1))
gotC, err = ds.DistributedQueryCampaign(context.Background(), c1.ID)
require.NoError(t, err)
require.Equal(t, fleet.QueryComplete, gotC.Status)
}
func checkTargets(t *testing.T, ds fleet.Datastore, campaignID uint, expectedTargets fleet.HostTargets) {
targets, err := ds.DistributedQueryCampaignTargetIDs(context.Background(), campaignID)
require.Nil(t, err)
assert.ElementsMatch(t, expectedTargets.HostIDs, targets.HostIDs)
assert.ElementsMatch(t, expectedTargets.LabelIDs, targets.LabelIDs)
assert.ElementsMatch(t, expectedTargets.TeamIDs, targets.TeamIDs)
}
func testCompletedCampaigns(t *testing.T, ds *Datastore) {
// Test nil result
result, err := ds.GetCompletedCampaigns(context.Background(), nil)
assert.NoError(t, err)
assert.Len(t, result, 0)
result, err = ds.GetCompletedCampaigns(context.Background(), []uint{234, 1, 1, 34455455453})
assert.NoError(t, err)
assert.Len(t, result, 0)
// Now test reasonable results
user := test.NewUser(t, ds, t.Name(), t.Name()+"zwass@fleet.co", true)
mockClock := clock.NewMockClock()
query := test.NewQuery(t, ds, nil, t.Name()+"test", "select * from time", user.ID, false)
numCampaigns := 5
totalFilterSize := 100000
filter := make([]uint, 0, totalFilterSize)
complete := make([]uint, 0, numCampaigns)
for i := 0; i < numCampaigns; i++ {
c1 := test.NewCampaign(t, ds, query.ID, fleet.QueryWaiting, mockClock.Now())
gotC, err := ds.DistributedQueryCampaign(context.Background(), c1.ID)
require.NoError(t, err)
require.Equal(t, fleet.QueryWaiting, gotC.Status)
if rand.Intn(10) < 7 { //nolint:gosec
c1.Status = fleet.QueryComplete
require.NoError(t, ds.SaveDistributedQueryCampaign(context.Background(), c1))
complete = append(complete, c1.ID)
}
filter = append(filter, c1.ID)
}
for j := filter[len(filter)-1] / 2; j < uint(totalFilterSize); j++ { // some IDs are duplicated
filter = append(filter, j)
}
rand.Shuffle(len(filter), func(i, j int) { filter[i], filter[j] = filter[j], filter[i] })
result, err = ds.GetCompletedCampaigns(context.Background(), filter)
assert.NoError(t, err)
sort.Slice(result, func(i, j int) bool { return result[i] < result[j] })
assert.Equal(t, complete, result)
}