summaryrefslogtreecommitdiffstats
path: root/container-search
diff options
context:
space:
mode:
authorHenning Baldersheim <balder@yahoo-inc.com>2022-08-22 16:32:23 +0200
committerHenning Baldersheim <balder@yahoo-inc.com>2022-08-22 16:35:15 +0200
commit591909a0ceaf0de0d89f2aeb0d60d36dbe2a0a62 (patch)
tree29de1b4fa4b22190587df46e51f8379ea03db8c0 /container-search
parentedf069589668ffd93736f071bf5c81d1247083fb (diff)
- Refactor to allow for different decay method.
- Implement decay over constant time in addition to over requests. - Default is decay over 500 requests, and 5.0s if you choose to decay over time.
Diffstat (limited to 'container-search')
-rw-r--r--container-search/src/main/java/com/yahoo/search/dispatch/CloseableInvoker.java10
-rw-r--r--container-search/src/main/java/com/yahoo/search/dispatch/Dispatcher.java2
-rw-r--r--container-search/src/main/java/com/yahoo/search/dispatch/LoadBalancer.java93
-rw-r--r--container-search/src/main/java/com/yahoo/search/dispatch/RequestDuration.java41
-rw-r--r--container-search/src/test/java/com/yahoo/search/dispatch/LoadBalancerTest.java84
5 files changed, 183 insertions, 47 deletions
diff --git a/container-search/src/main/java/com/yahoo/search/dispatch/CloseableInvoker.java b/container-search/src/main/java/com/yahoo/search/dispatch/CloseableInvoker.java
index 9da89c6bfd8..77496114df1 100644
--- a/container-search/src/main/java/com/yahoo/search/dispatch/CloseableInvoker.java
+++ b/container-search/src/main/java/com/yahoo/search/dispatch/CloseableInvoker.java
@@ -16,13 +16,13 @@ public abstract class CloseableInvoker implements Closeable {
protected abstract void release();
- private BiConsumer<Boolean, Duration> teardown = null;
+ private BiConsumer<Boolean, RequestDuration> teardown = null;
private boolean success = false;
- private long startTime = 0;
+ private RequestDuration duration;
- public void teardown(BiConsumer<Boolean, Duration> teardown) {
+ public void teardown(BiConsumer<Boolean, RequestDuration> teardown) {
this.teardown = teardown;
- this.startTime = System.nanoTime();
+ this.duration = new RequestDuration();
}
protected void setFinalStatus(boolean success) {
@@ -32,7 +32,7 @@ public abstract class CloseableInvoker implements Closeable {
@Override
public final void close() {
if (teardown != null) {
- teardown.accept(success, Duration.ofNanos(System.nanoTime() - startTime));
+ teardown.accept(success, duration.complete());
teardown = null;
}
release();
diff --git a/container-search/src/main/java/com/yahoo/search/dispatch/Dispatcher.java b/container-search/src/main/java/com/yahoo/search/dispatch/Dispatcher.java
index 9ae97dabccd..345c621ae24 100644
--- a/container-search/src/main/java/com/yahoo/search/dispatch/Dispatcher.java
+++ b/container-search/src/main/java/com/yahoo/search/dispatch/Dispatcher.java
@@ -227,7 +227,7 @@ public class Dispatcher extends AbstractComponent {
invoker.get().teardown((success, time) -> loadBalancer.releaseGroup(group, success, time));
return invoker.get();
} else {
- loadBalancer.releaseGroup(group, false, Duration.ZERO);
+ loadBalancer.releaseGroup(group, false, RequestDuration.of(Duration.ZERO));
if (rejected == null) {
rejected = new HashSet<>();
}
diff --git a/container-search/src/main/java/com/yahoo/search/dispatch/LoadBalancer.java b/container-search/src/main/java/com/yahoo/search/dispatch/LoadBalancer.java
index 6d8bb1dce3d..99960be5d65 100644
--- a/container-search/src/main/java/com/yahoo/search/dispatch/LoadBalancer.java
+++ b/container-search/src/main/java/com/yahoo/search/dispatch/LoadBalancer.java
@@ -26,8 +26,9 @@ public class LoadBalancer {
private static final long DEFAULT_LATENCY_DECAY_RATE = 1000;
private static final long MIN_LATENCY_DECAY_RATE = 42;
- private static final double INITIAL_QUERY_TIME = 0.001;
- private static final double MIN_QUERY_TIME = 0.001;
+ private static final double LATENCY_DECAY_TIME = Duration.ofSeconds(5).toMillis()/1000.0;
+ private static final Duration INITIAL_QUERY_TIME = Duration.ofMillis(1);
+ private static final double MIN_QUERY_TIME = Duration.ofMillis(1).toMillis()/1000.0;
private final List<GroupStatus> scoreboard;
private final GroupScheduler scheduler;
@@ -45,8 +46,8 @@ public class LoadBalancer {
this.scheduler = switch (policy) {
case ROUNDROBIN: yield new RoundRobinScheduler(scoreboard);
case BEST_OF_RANDOM_2: yield new BestOfRandom2(new Random(), scoreboard);
- case LATENCY_AMORTIZED_OVER_REQUESTS: yield new AdaptiveScheduler(new Random(), scoreboard);
- case LATENCY_AMORTIZED_OVER_TIME: yield new AdaptiveScheduler(new Random(), scoreboard); // TODO Intentionally the same for now
+ case LATENCY_AMORTIZED_OVER_REQUESTS: yield new AdaptiveScheduler(AdaptiveScheduler.Type.REQUESTS, new Random(), scoreboard);
+ case LATENCY_AMORTIZED_OVER_TIME: yield new AdaptiveScheduler(AdaptiveScheduler.Type.TIME, new Random(), scoreboard);
};
}
@@ -80,7 +81,7 @@ public class LoadBalancer {
* @param success was the query successful
* @param searchTime query execution time, used for adaptive load balancing
*/
- public void releaseGroup(Group group, boolean success, Duration searchTime) {
+ public void releaseGroup(Group group, boolean success, RequestDuration searchTime) {
synchronized (this) {
for (GroupStatus sched : scoreboard) {
if (sched.group.id() == group.id()) {
@@ -93,50 +94,55 @@ public class LoadBalancer {
static class GroupStatus {
+ interface Decayer {
+ void decay(RequestDuration duration);
+ double averageSearchTime();
+ }
+
+ static class NoDecay implements Decayer {
+ public void decay(RequestDuration duration) {}
+ public double averageSearchTime() { return MIN_QUERY_TIME; }
+ }
+
private final Group group;
private int allocations = 0;
- private long queries = 0;
- private double averageSearchTime = INITIAL_QUERY_TIME;
+ private Decayer decayer;
GroupStatus(Group group) {
this.group = group;
+ this.decayer = new NoDecay();
+ }
+ void setDecayer(Decayer decayer) {
+ this.decayer = decayer;
}
void allocate() {
allocations++;
}
- void release(boolean success, Duration searchTime) {
- double searchSeconds = searchTime.toMillis()/1000.0;
+ void release(boolean success, RequestDuration searchTime) {
allocations--;
if (allocations < 0) {
log.warning("Double free of query target group detected");
allocations = 0;
}
if (success) {
- searchSeconds = Math.max(searchSeconds, MIN_QUERY_TIME);
- double decayRate = Math.min(queries + MIN_LATENCY_DECAY_RATE, DEFAULT_LATENCY_DECAY_RATE);
- averageSearchTime = (searchSeconds + (decayRate - 1) * averageSearchTime) / decayRate;
- queries++;
+ decayer.decay(searchTime);
}
}
Duration averageSearchTime() {
- return Duration.ofNanos((long)(averageSearchTime*1000000000));
+ return Duration.ofNanos((long)(decayer.averageSearchTime()*1_000_000_000));
}
double averageSearchTimeInverse() {
- return 1.0 / averageSearchTime;
+ return 1.0 / decayer.averageSearchTime();
}
int groupId() {
return group.id();
}
- void setQueryStatistics(long queries, Duration averageSearchTime) {
- this.queries = queries;
- this.averageSearchTime = averageSearchTime.toMillis()/1000.0;
- }
}
private interface GroupScheduler {
@@ -201,13 +207,58 @@ public class LoadBalancer {
}
static class AdaptiveScheduler implements GroupScheduler {
-
+ enum Type {TIME, REQUESTS}
private final Random random;
private final List<GroupStatus> scoreboard;
- public AdaptiveScheduler(Random random, List<GroupStatus> scoreboard) {
+ private static double toDouble(Duration duration) {
+ return duration.toNanos()/1_000_000_000.0;
+ }
+ static class DecayByRequests implements GroupStatus.Decayer {
+ private long queries;
+ private double averageSearchTime;
+ DecayByRequests() {
+ this(0, INITIAL_QUERY_TIME);
+ }
+ DecayByRequests(long initialQueries, Duration initialSearchTime) {
+ queries = initialQueries;
+ averageSearchTime = toDouble(initialSearchTime);
+ }
+ public void decay(RequestDuration duration) {
+ double searchTime = Math.max(toDouble(duration.duration()), MIN_QUERY_TIME);
+ double decayRate = Math.min(queries + MIN_LATENCY_DECAY_RATE, DEFAULT_LATENCY_DECAY_RATE);
+ queries++;
+ averageSearchTime = (searchTime + (decayRate - 1) * averageSearchTime) / decayRate;
+ }
+ public double averageSearchTime() { return averageSearchTime; }
+ }
+
+ static class DecayByTime implements GroupStatus.Decayer {
+ private double averageSearchTime;
+ private RequestDuration prev;
+ DecayByTime() {
+ this(INITIAL_QUERY_TIME, RequestDuration.of(Duration.ZERO));
+ }
+ DecayByTime(Duration initialSearchTime, RequestDuration start) {
+ averageSearchTime = toDouble(initialSearchTime);
+ prev = start;
+ }
+ public void decay(RequestDuration duration) {
+ double searchTime = Math.max(duration.duration().toMillis()/1000.0, MIN_QUERY_TIME);
+ double decayRate = LATENCY_DECAY_TIME;
+ double sampleWeight = toDouble(duration.timeSince(prev));
+ averageSearchTime = (sampleWeight*searchTime + (decayRate - sampleWeight) * averageSearchTime) / decayRate;
+ prev = duration;
+ }
+ public double averageSearchTime() { return averageSearchTime; }
+ }
+
+ public AdaptiveScheduler(Type type, Random random, List<GroupStatus> scoreboard) {
this.random = random;
this.scoreboard = scoreboard;
+ for (GroupStatus gs : scoreboard) {
+ gs.setDecayer(type == Type.REQUESTS ? new DecayByRequests() : new DecayByTime());
+ }
}
private Optional<GroupStatus> selectGroup(double needle, boolean requireCoverage, Set<Integer> rejected) {
diff --git a/container-search/src/main/java/com/yahoo/search/dispatch/RequestDuration.java b/container-search/src/main/java/com/yahoo/search/dispatch/RequestDuration.java
new file mode 100644
index 00000000000..ad6b7f4a40c
--- /dev/null
+++ b/container-search/src/main/java/com/yahoo/search/dispatch/RequestDuration.java
@@ -0,0 +1,41 @@
+// Copyright Yahoo. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
+package com.yahoo.search.dispatch;
+
+import java.time.Duration;
+import java.time.Instant;
+
+/**
+ *
+ * @author baldersheim
+ */
+class RequestDuration {
+ private final long startTime;
+ private long endTime;
+ RequestDuration() {
+ this(System.nanoTime());
+ }
+ private RequestDuration(long startTime) {
+ this.startTime = startTime;
+ }
+
+ RequestDuration complete() {
+ endTime = System.nanoTime();
+ return this;
+ }
+ private RequestDuration complete(long duration) {
+ endTime = startTime + duration;
+ return this;
+ }
+ Duration duration() {
+ return Duration.ofNanos(endTime - startTime);
+ }
+ Duration timeSince(RequestDuration prev) {
+ return Duration.ofNanos(Math.abs(endTime - prev.endTime));
+ }
+ static RequestDuration of(Duration duration) {
+ return new RequestDuration().complete(duration.toNanos());
+ }
+ static RequestDuration of(Instant sinceEpoch, Duration duration) {
+ return new RequestDuration(sinceEpoch.toEpochMilli()*1_000_000).complete(duration.toNanos());
+ }
+}
diff --git a/container-search/src/test/java/com/yahoo/search/dispatch/LoadBalancerTest.java b/container-search/src/test/java/com/yahoo/search/dispatch/LoadBalancerTest.java
index c9981b3598b..1499a4bb324 100644
--- a/container-search/src/test/java/com/yahoo/search/dispatch/LoadBalancerTest.java
+++ b/container-search/src/test/java/com/yahoo/search/dispatch/LoadBalancerTest.java
@@ -11,6 +11,7 @@ import org.junit.jupiter.api.Test;
import org.opentest4j.AssertionFailedError;
import java.time.Duration;
+import java.time.Instant;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
@@ -34,7 +35,7 @@ public class LoadBalancerTest {
LoadBalancer lb = new LoadBalancer(cluster, LoadBalancer.Policy.ROUNDROBIN);
Optional<Group> grp = lb.takeGroup(null);
- Group group = grp.orElseGet(() -> {
+ Group group = grp.orElseThrow(() -> {
throw new AssertionFailedError("Expected a SearchCluster.Group");
});
assertEquals(1, group.nodes().size());
@@ -48,7 +49,7 @@ public class LoadBalancerTest {
LoadBalancer lb = new LoadBalancer(cluster, LoadBalancer.Policy.ROUNDROBIN);
Optional<Group> grp = lb.takeGroup(null);
- Group group = grp.orElseGet(() -> {
+ Group group = grp.orElseThrow(() -> {
throw new AssertionFailedError("Expected a SearchCluster.Group");
});
assertEquals(1, group.nodes().size());
@@ -79,7 +80,7 @@ public class LoadBalancerTest {
Group group = grp.get();
int id1 = group.id();
// release allocation
- lb.releaseGroup(group, true, Duration.ofMillis(1));
+ lb.releaseGroup(group, true, RequestDuration.of(Duration.ofMillis(1)));
// get second group
grp = lb.takeGroup(null);
@@ -89,29 +90,27 @@ public class LoadBalancerTest {
@Test
void requireCorrectAverageSearchTimeDecay() {
- final double delta = 0.00001;
-
GroupStatus gs = newGroupStatus(1);
- gs.setQueryStatistics(0, Duration.ofSeconds(1));
- updateSearchTime(gs, Duration.ofSeconds(1));
+ gs.setDecayer(new AdaptiveScheduler.DecayByRequests(0, Duration.ofSeconds(1)));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofSeconds(1)));
assertEquals(Duration.ofSeconds(1), gs.averageSearchTime());
- updateSearchTime(gs, Duration.ofSeconds(2));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofSeconds(2)));
assertEquals(Duration.ofNanos(1023255813), gs.averageSearchTime());
- updateSearchTime(gs, Duration.ofSeconds(2));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofSeconds(2)));
assertEquals(Duration.ofNanos(1045454545), gs.averageSearchTime());
- updateSearchTime(gs, Duration.ofMillis(100));
- updateSearchTime(gs, Duration.ofMillis(100));
- updateSearchTime(gs, Duration.ofMillis(100));
- updateSearchTime(gs, Duration.ofMillis(100));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofMillis(100)));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofMillis(100)));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofMillis(100)));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofMillis(100)));
assertEquals(Duration.ofNanos(966666666), gs.averageSearchTime());
for (int i = 0; i < 10000; i++) {
- updateSearchTime(gs, Duration.ofSeconds(1));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofSeconds(1)));
}
assertEquals(Duration.ofNanos(999999812), gs.averageSearchTime());
- updateSearchTime(gs, Duration.ofMillis(100));
+ updateSearchTime(gs, RequestDuration.of(Duration.ofMillis(100)));
assertEquals(Duration.ofNanos(999099812), gs.averageSearchTime());
for (int i = 0; i < 10000; i++) {
- updateSearchTime(gs, Duration.ZERO);
+ updateSearchTime(gs, RequestDuration.of(Duration.ZERO));
}
assertEquals(Duration.ofNanos(1045087), gs.averageSearchTime());
}
@@ -123,7 +122,7 @@ public class LoadBalancerTest {
scoreboard.add(newGroupStatus(i));
}
Random seq = sequence(0.0, 0.1, 0.2, 0.39, 0.4, 0.6, 0.8, 0.99999);
- AdaptiveScheduler sched = new AdaptiveScheduler(seq, scoreboard);
+ AdaptiveScheduler sched = new AdaptiveScheduler(AdaptiveScheduler.Type.REQUESTS, seq, scoreboard);
assertEquals(0, sched.takeNextGroup(null).get().groupId());
assertEquals(0, sched.takeNextGroup(null).get().groupId());
@@ -140,11 +139,15 @@ public class LoadBalancerTest {
List<GroupStatus> scoreboard = new ArrayList<>();
for (int i = 0; i < 5; i++) {
GroupStatus gs = newGroupStatus(i);
- gs.setQueryStatistics(1, Duration.ofMillis((long)(0.1 * (i + 1)*1000.0)));
scoreboard.add(gs);
}
Random seq = sequence(0.0, 0.4379, 0.4380, 0.6569, 0.6570, 0.8029, 0.8030, 0.9124, 0.9125);
- AdaptiveScheduler sched = new AdaptiveScheduler(seq, scoreboard);
+ AdaptiveScheduler sched = new AdaptiveScheduler(AdaptiveScheduler.Type.REQUESTS, seq, scoreboard);
+ int i= 0;
+ for (GroupStatus gs : scoreboard) {
+ gs.setDecayer(new AdaptiveScheduler.DecayByRequests(1, Duration.ofMillis((long)(0.1 * (i + 1)*1000.0))));
+ i++;
+ }
assertEquals(0, sched.takeNextGroup(null).get().groupId());
assertEquals(0, sched.takeNextGroup(null).get().groupId());
@@ -190,7 +193,48 @@ public class LoadBalancerTest {
assertEquals(0, allocate(sched.takeNextGroup(null).get()).groupId());
}
- private static void updateSearchTime(GroupStatus gs, Duration time) {
+ private static Duration from_s(double seconds) {
+ return Duration.ofNanos((long)(seconds * 1_000_000_000));
+ }
+
+ private static int countRequestsToReach90p(Duration timeBetweenSample, Duration searchTime) {
+ double p90 = 0.9*searchTime.toMillis()/1000.0;
+ GroupStatus.Decayer decayer = new AdaptiveScheduler.DecayByTime(Duration.ofMillis(1), RequestDuration.of(Instant.EPOCH, Duration.ZERO));
+ int requests = 0;
+ Instant start = Instant.EPOCH;
+ for (; decayer.averageSearchTime() < p90;) {
+ decayer.decay(RequestDuration.of(start, searchTime));
+ start = start.plus(timeBetweenSample);
+ requests++;
+ }
+ return requests;
+ }
+
+ @Test
+ public void requireDecayByTimeToDependOnlyOnTime() {
+ double delta = 0.0000001;
+ GroupStatus.Decayer decayer = new AdaptiveScheduler.DecayByTime(Duration.ofMillis(2), RequestDuration.of(Instant.EPOCH, Duration.ZERO));
+ assertEquals(0.002, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(1000), Duration.ofMillis(10)));
+ assertEquals(0.003616, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(2000), Duration.ofMillis(10)));
+ assertEquals(0.0048928, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(3000), Duration.ofMillis(10)));
+ assertEquals(0.00591424, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(3100), Duration.ofMillis(10)));
+ assertEquals(0.0059959552, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(3100), Duration.ofMillis(10)));
+ assertEquals(0.0059959552, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(3000), Duration.ofMillis(10)));
+ assertEquals(0.006076036096, decayer.averageSearchTime(), delta);
+ decayer.decay(RequestDuration.of(Instant.ofEpochMilli(6000), Duration.ofMillis(10)));
+ assertEquals(0.0084304144384, decayer.averageSearchTime(), delta);
+ assertEquals(110, countRequestsToReach90p(Duration.ofMillis(100), Duration.ofMillis(10)));
+ assertEquals(55, countRequestsToReach90p(Duration.ofMillis(200), Duration.ofMillis(10)));
+ assertEquals(11, countRequestsToReach90p(Duration.ofMillis(1000), Duration.ofMillis(10)));
+ }
+
+ private static void updateSearchTime(GroupStatus gs, RequestDuration time) {
gs.allocate();
gs.release(true, time);
}