Skip to content

Commit a851bb1

Browse files
authored
Delay hashing scrape targets (#3777)
* Fix duplicate targets in benchmark * Add more target counts to the benchmark * Delay hashing scrape targets Instead of hashing scrape targets when they're received from service discovery, wait until the allocator actually needs the hash. This lets us avoid calculating hashes for targets filtered out by relabeling.
1 parent 3a74faf commit a851bb1

15 files changed

+164
-110
lines changed

cmd/otel-allocator/benchmark_test.go

+49-41
Original file line numberDiff line numberDiff line change
@@ -28,65 +28,70 @@ import (
2828
"github.com/open-telemetry/opentelemetry-operator/cmd/otel-allocator/internal/target"
2929
)
3030

31+
var targetCounts = []int{1000, 10000, 100000, 800000}
32+
3133
// BenchmarkProcessTargets benchmarks the whole target allocation pipeline. It starts with data the prometheus
3234
// discovery manager would normally output, and pushes it all the way into the allocator. It notably does *not* check
3335
// the HTTP server afterward. Test data is chosen to be reasonably representative of what the Prometheus service discovery
3436
// outputs in the real world.
3537
func BenchmarkProcessTargets(b *testing.B) {
36-
numTargets := 800000
3738
targetsPerGroup := 5
3839
groupsPerJob := 20
39-
tsets := prepareBenchmarkData(numTargets, targetsPerGroup, groupsPerJob)
40-
for _, strategy := range allocation.GetRegisteredAllocatorNames() {
41-
b.Run(strategy, func(b *testing.B) {
42-
targetDiscoverer := createTestDiscoverer(strategy, map[string][]*relabel.Config{})
43-
targetDiscoverer.UpdateTsets(tsets)
44-
b.ResetTimer()
45-
for i := 0; i < b.N; i++ {
46-
targetDiscoverer.Reload()
47-
}
48-
})
40+
for _, numTargets := range targetCounts {
41+
tsets := prepareBenchmarkData(numTargets, targetsPerGroup, groupsPerJob)
42+
for _, strategy := range allocation.GetRegisteredAllocatorNames() {
43+
b.Run(fmt.Sprintf("%s/%d", strategy, numTargets), func(b *testing.B) {
44+
targetDiscoverer := createTestDiscoverer(strategy, map[string][]*relabel.Config{})
45+
targetDiscoverer.UpdateTsets(tsets)
46+
b.ResetTimer()
47+
for i := 0; i < b.N; i++ {
48+
targetDiscoverer.Reload()
49+
}
50+
})
51+
}
4952
}
5053
}
5154

5255
// BenchmarkProcessTargetsWithRelabelConfig is BenchmarkProcessTargets with a relabel config set. The relabel config
5356
// does not actually modify any records, but does force the prehook to perform any necessary conversions along the way.
5457
func BenchmarkProcessTargetsWithRelabelConfig(b *testing.B) {
55-
numTargets := 800000
5658
targetsPerGroup := 5
5759
groupsPerJob := 20
58-
tsets := prepareBenchmarkData(numTargets, targetsPerGroup, groupsPerJob)
59-
prehookConfig := make(map[string][]*relabel.Config, len(tsets))
60-
for jobName := range tsets {
61-
// keep all targets in half the jobs, drop the rest
62-
jobNrStr := strings.Split(jobName, "-")[1]
63-
jobNr, err := strconv.Atoi(jobNrStr)
64-
require.NoError(b, err)
65-
var action relabel.Action
66-
if jobNr%2 == 0 {
67-
action = "keep"
68-
} else {
69-
action = "drop"
60+
for _, numTargets := range targetCounts {
61+
tsets := prepareBenchmarkData(numTargets, targetsPerGroup, groupsPerJob)
62+
prehookConfig := make(map[string][]*relabel.Config, len(tsets))
63+
for jobName := range tsets {
64+
// keep all targets in half the jobs, drop the rest
65+
jobNrStr := strings.Split(jobName, "-")[1]
66+
jobNr, err := strconv.Atoi(jobNrStr)
67+
require.NoError(b, err)
68+
var action relabel.Action
69+
if jobNr%2 == 0 {
70+
action = "keep"
71+
} else {
72+
action = "drop"
73+
}
74+
prehookConfig[jobName] = []*relabel.Config{
75+
{
76+
Action: action,
77+
Regex: relabel.MustNewRegexp(".*"),
78+
SourceLabels: model.LabelNames{"__address__"},
79+
},
80+
}
7081
}
71-
prehookConfig[jobName] = []*relabel.Config{
72-
{
73-
Action: action,
74-
Regex: relabel.MustNewRegexp(".*"),
75-
SourceLabels: model.LabelNames{"__address__"},
76-
},
82+
83+
for _, strategy := range allocation.GetRegisteredAllocatorNames() {
84+
b.Run(fmt.Sprintf("%s/%d", strategy, numTargets), func(b *testing.B) {
85+
targetDiscoverer := createTestDiscoverer(strategy, prehookConfig)
86+
targetDiscoverer.UpdateTsets(tsets)
87+
b.ResetTimer()
88+
for i := 0; i < b.N; i++ {
89+
targetDiscoverer.Reload()
90+
}
91+
})
7792
}
7893
}
7994

80-
for _, strategy := range allocation.GetRegisteredAllocatorNames() {
81-
b.Run(strategy, func(b *testing.B) {
82-
targetDiscoverer := createTestDiscoverer(strategy, prehookConfig)
83-
targetDiscoverer.UpdateTsets(tsets)
84-
b.ResetTimer()
85-
for i := 0; i < b.N; i++ {
86-
targetDiscoverer.Reload()
87-
}
88-
})
89-
}
9095
}
9196

9297
func prepareBenchmarkData(numTargets, targetsPerGroup, groupsPerJob int) map[string][]*targetgroup.Group {
@@ -140,7 +145,10 @@ func prepareBenchmarkData(numTargets, targetsPerGroup, groupsPerJob int) map[str
140145
}
141146
targets := []model.LabelSet{}
142147
for i := 0; i < numTargets; i++ {
143-
targets = append(targets, exampleTarget.Clone())
148+
newTarget := exampleTarget.Clone()
149+
// ensure each target has a unique label to avoid deduplication
150+
newTarget["target_id"] = model.LabelValue(strconv.Itoa(i))
151+
targets = append(targets, newTarget)
144152
}
145153
groups := make([]*targetgroup.Group, numGroups)
146154
for i := 0; i < numGroups; i++ {

cmd/otel-allocator/internal/allocation/allocator.go

+33-2
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,8 @@ package allocation
55

66
import (
77
"errors"
8+
"runtime"
9+
"slices"
810
"sync"
911

1012
"github.com/go-logr/logr"
@@ -73,20 +75,22 @@ func (a *allocator) SetFallbackStrategy(strategy Strategy) {
7375
// SetTargets accepts a list of targets that will be used to make
7476
// load balancing decisions. This method should be called when there are
7577
// new targets discovered or existing targets are shutdown.
76-
func (a *allocator) SetTargets(targets map[string]*target.Item) {
78+
func (a *allocator) SetTargets(targets []*target.Item) {
7779
timer := prometheus.NewTimer(TimeToAssign.WithLabelValues("SetTargets", a.strategy.GetName()))
7880
defer timer.ObserveDuration()
7981

8082
if a.filter != nil {
8183
targets = a.filter.Apply(targets)
8284
}
8385
RecordTargetsKept(targets)
86+
concurrency := runtime.NumCPU() * 2 // determined experimentally
87+
targetMap := buildTargetMap(targets, concurrency)
8488

8589
a.m.Lock()
8690
defer a.m.Unlock()
8791

8892
// Check for target changes
89-
targetsDiff := diff.Maps(a.targetItems, targets)
93+
targetsDiff := diff.Maps(a.targetItems, targetMap)
9094
// If there are any additions or removals
9195
if len(targetsDiff.Additions()) != 0 || len(targetsDiff.Removals()) != 0 {
9296
a.handleTargets(targetsDiff)
@@ -302,3 +306,30 @@ func (a *allocator) handleCollectors(diff diff.Changes[*Collector]) {
302306
TargetsUnassigned.Set(float64(unassignedTargets))
303307
}
304308
}
309+
310+
const minChunkSize = 100 // for small target counts, it's not worth it to spawn a lot of goroutines
311+
312+
// buildTargetMap builds a map of targets, using their hashes as keys. It does this concurrently, and the concurrency
313+
// is configurable via the concurrency parameter. We do this in parallel because target hashing is surprisingly
314+
// expensive.
315+
func buildTargetMap(targets []*target.Item, concurrency int) map[string]*target.Item {
316+
// technically there may be duplicates, so this may overallocate, but in the majority of cases it will be exact
317+
result := make(map[string]*target.Item, len(targets))
318+
chunkSize := len(targets) / concurrency
319+
chunkSize = max(chunkSize, minChunkSize)
320+
wg := sync.WaitGroup{}
321+
for chunk := range slices.Chunk(targets, chunkSize) {
322+
wg.Add(1)
323+
go func(ch []*target.Item) {
324+
defer wg.Done()
325+
for _, item := range ch {
326+
item.Hash()
327+
}
328+
}(chunk)
329+
}
330+
wg.Wait()
331+
for _, item := range targets {
332+
result[item.Hash()] = item
333+
}
334+
return result
335+
}

cmd/otel-allocator/internal/allocation/allocator_test.go

+1-4
Original file line numberDiff line numberDiff line change
@@ -174,10 +174,7 @@ func TestAllocationCollision(t *testing.T) {
174174
firstTarget := target.NewItem("sample-name", "0.0.0.0:8000", firstLabels, "")
175175
secondTarget := target.NewItem("sample-name", "0.0.0.0:8000", secondLabels, "")
176176

177-
targetList := map[string]*target.Item{
178-
firstTarget.Hash(): firstTarget,
179-
secondTarget.Hash(): secondTarget,
180-
}
177+
targetList := []*target.Item{firstTarget, secondTarget}
181178

182179
// test that targets and collectors are added properly
183180
allocator.SetTargets(targetList)

cmd/otel-allocator/internal/allocation/least_weighted_test.go

+3-4
Original file line numberDiff line numberDiff line change
@@ -7,6 +7,7 @@ import (
77
"fmt"
88
"math"
99
"math/rand"
10+
"slices"
1011
"testing"
1112

1213
"github.com/stretchr/testify/assert"
@@ -128,7 +129,7 @@ func TestCollectorBalanceWhenAddingAndRemovingAtRandom(t *testing.T) {
128129
for index := range targets {
129130
shouldDelete := rand.Intn(toDelete) //nolint:gosec
130131
if counter < shouldDelete {
131-
delete(targets, index)
132+
targets = slices.Delete(targets, index, index)
132133
}
133134
counter++
134135
}
@@ -144,9 +145,7 @@ func TestCollectorBalanceWhenAddingAndRemovingAtRandom(t *testing.T) {
144145
assert.InDelta(t, i.NumTargets, count, math.Round(percent))
145146
}
146147
// adding targets at 'random'
147-
for _, item := range MakeNNewTargets(13, 3, 100) {
148-
targets[item.Hash()] = item
149-
}
148+
targets = append(targets, MakeNNewTargets(13, 3, 100)...)
150149
s.SetTargets(targets)
151150

152151
targetItemLen = len(s.TargetItems())

cmd/otel-allocator/internal/allocation/per_node_test.go

+16-16
Original file line numberDiff line numberDiff line change
@@ -56,11 +56,11 @@ func TestAllocationPerNode(t *testing.T) {
5656
thirdTarget := target.NewItem("sample-name", "0.0.0.0:8000", thirdLabels, "")
5757
fourthTarget := target.NewItem("sample-name", "0.0.0.0:8000", fourthLabels, "")
5858

59-
targetList := map[string]*target.Item{
60-
firstTarget.Hash(): firstTarget,
61-
secondTarget.Hash(): secondTarget,
62-
thirdTarget.Hash(): thirdTarget,
63-
fourthTarget.Hash(): fourthTarget,
59+
targetList := []*target.Item{
60+
firstTarget,
61+
secondTarget,
62+
thirdTarget,
63+
fourthTarget,
6464
}
6565

6666
// test that targets and collectors are added properly
@@ -74,16 +74,16 @@ func TestAllocationPerNode(t *testing.T) {
7474
assert.Len(t, actualItems, expectedTargetLen)
7575

7676
// verify allocation to nodes
77-
for targetHash, item := range targetList {
78-
actualItem, found := actualItems[targetHash]
77+
for _, item := range targetList {
78+
actualItem, found := actualItems[item.Hash()]
7979
// if third target, should be skipped
8080
assert.True(t, found, "target with hash %s not found", item.Hash())
8181

8282
// only the first two targets should be allocated
8383
itemsForCollector := s.GetTargetsForCollectorAndJob(actualItem.CollectorName, actualItem.JobName)
8484

8585
// first two should be assigned one to each collector; if third target, should not be assigned
86-
if targetHash == thirdTarget.Hash() {
86+
if item.Hash() == thirdTarget.Hash() {
8787
assert.Len(t, itemsForCollector, 0)
8888
continue
8989
}
@@ -123,11 +123,11 @@ func TestAllocationPerNodeUsingFallback(t *testing.T) {
123123
thirdTarget := target.NewItem("sample-name", "0.0.0.0:8000", thirdLabels, "")
124124
fourthTarget := target.NewItem("sample-name", "0.0.0.0:8000", fourthLabels, "")
125125

126-
targetList := map[string]*target.Item{
127-
firstTarget.Hash(): firstTarget,
128-
secondTarget.Hash(): secondTarget,
129-
thirdTarget.Hash(): thirdTarget,
130-
fourthTarget.Hash(): fourthTarget,
126+
targetList := []*target.Item{
127+
firstTarget,
128+
secondTarget,
129+
thirdTarget,
130+
fourthTarget,
131131
}
132132

133133
// test that targets and collectors are added properly
@@ -141,8 +141,8 @@ func TestAllocationPerNodeUsingFallback(t *testing.T) {
141141
assert.Len(t, actualItems, expectedTargetLen)
142142

143143
// verify allocation to nodes
144-
for targetHash, item := range targetList {
145-
actualItem, found := actualItems[targetHash]
144+
for _, item := range targetList {
145+
actualItem, found := actualItems[item.Hash()]
146146

147147
assert.True(t, found, "target with hash %s not found", item.Hash())
148148

@@ -151,7 +151,7 @@ func TestAllocationPerNodeUsingFallback(t *testing.T) {
151151
// first two should be assigned one to each collector; if third target, it should be assigned
152152
// according to the fallback strategy which may assign it to the otherwise empty collector or
153153
// one of the others, depending on the strategy and collector loop order
154-
if targetHash == thirdTarget.Hash() {
154+
if item.Hash() == thirdTarget.Hash() {
155155
assert.Empty(t, item.GetNodeName())
156156
assert.NotZero(t, len(itemsForCollector))
157157
continue

cmd/otel-allocator/internal/allocation/strategy.go

+3-3
Original file line numberDiff line numberDiff line change
@@ -50,7 +50,7 @@ var (
5050
type Option func(Allocator)
5151

5252
type Filter interface {
53-
Apply(map[string]*target.Item) map[string]*target.Item
53+
Apply([]*target.Item) []*target.Item
5454
}
5555

5656
func WithFilter(filter Filter) Option {
@@ -69,7 +69,7 @@ func WithFallbackStrategy(fallbackStrategy string) Option {
6969
}
7070
}
7171

72-
func RecordTargetsKept(targets map[string]*target.Item) {
72+
func RecordTargetsKept(targets []*target.Item) {
7373
TargetsRemaining.Set(float64(len(targets)))
7474
}
7575

@@ -90,7 +90,7 @@ func GetRegisteredAllocatorNames() []string {
9090

9191
type Allocator interface {
9292
SetCollectors(collectors map[string]*Collector)
93-
SetTargets(targets map[string]*target.Item)
93+
SetTargets(targets []*target.Item)
9494
TargetItems() map[string]*target.Item
9595
Collectors() map[string]*Collector
9696
GetTargetsForCollectorAndJob(collector string, job string) []*target.Item

cmd/otel-allocator/internal/allocation/testutils.go

+6-6
Original file line numberDiff line numberDiff line change
@@ -24,16 +24,16 @@ func colIndex(index, numCols int) int {
2424
return index % numCols
2525
}
2626

27-
func MakeNNewTargets(n int, numCollectors int, startingIndex int) map[string]*target.Item {
28-
toReturn := map[string]*target.Item{}
27+
func MakeNNewTargets(n int, numCollectors int, startingIndex int) []*target.Item {
28+
toReturn := []*target.Item{}
2929
for i := startingIndex; i < n+startingIndex; i++ {
3030
collector := fmt.Sprintf("collector-%d", colIndex(i, numCollectors))
3131
label := labels.Labels{
3232
{Name: "i", Value: strconv.Itoa(i)},
3333
{Name: "total", Value: strconv.Itoa(n + startingIndex)},
3434
}
3535
newTarget := target.NewItem(fmt.Sprintf("test-job-%d", i), fmt.Sprintf("test-url-%d", i), label, collector)
36-
toReturn[newTarget.Hash()] = newTarget
36+
toReturn = append(toReturn, newTarget)
3737
}
3838
return toReturn
3939
}
@@ -51,16 +51,16 @@ func MakeNCollectors(n int, startingIndex int) map[string]*Collector {
5151
return toReturn
5252
}
5353

54-
func MakeNNewTargetsWithEmptyCollectors(n int, startingIndex int) map[string]*target.Item {
55-
toReturn := map[string]*target.Item{}
54+
func MakeNNewTargetsWithEmptyCollectors(n int, startingIndex int) []*target.Item {
55+
toReturn := []*target.Item{}
5656
for i := startingIndex; i < n+startingIndex; i++ {
5757
label := labels.Labels{
5858
{Name: "i", Value: strconv.Itoa(i)},
5959
{Name: "total", Value: strconv.Itoa(n + startingIndex)},
6060
{Name: "__meta_kubernetes_pod_node_name", Value: "node-0"},
6161
}
6262
newTarget := target.NewItem(fmt.Sprintf("test-job-%d", i), fmt.Sprintf("test-url-%d", i), label, "")
63-
toReturn[newTarget.Hash()] = newTarget
63+
toReturn = append(toReturn, newTarget)
6464
}
6565
return toReturn
6666
}

cmd/otel-allocator/internal/prehook/prehook.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@ import (
1111
)
1212

1313
type Hook interface {
14-
Apply(map[string]*target.Item) map[string]*target.Item
14+
Apply([]*target.Item) []*target.Item
1515
SetConfig(map[string][]*relabel.Config)
1616
GetConfig() map[string][]*relabel.Config
1717
}

0 commit comments

Comments
 (0)