aboutsummaryrefslogtreecommitdiffstats
path: root/node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java
diff options
context:
space:
mode:
Diffstat (limited to 'node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java')
-rw-r--r--node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java117
1 files changed, 117 insertions, 0 deletions
diff --git a/node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java b/node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java
new file mode 100644
index 00000000000..434e6161a4c
--- /dev/null
+++ b/node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java
@@ -0,0 +1,117 @@
+package com.yahoo.vespa.hosted.provision.maintenance;
+
+import com.yahoo.component.annotation.Inject;
+import com.yahoo.concurrent.DaemonThreadFactory;
+import com.yahoo.concurrent.UncheckedTimeoutException;
+import com.yahoo.config.provision.ApplicationId;
+import com.yahoo.config.provision.Deployment;
+import com.yahoo.config.provision.InfraDeployer;
+import com.yahoo.config.provision.NodeType;
+import com.yahoo.transaction.Mutex;
+import com.yahoo.vespa.applicationmodel.InfrastructureApplication;
+import com.yahoo.vespa.hosted.provision.Node.State;
+import com.yahoo.vespa.hosted.provision.NodeList;
+import com.yahoo.vespa.hosted.provision.NodeRepository;
+
+import java.util.Optional;
+import java.util.Set;
+import java.util.concurrent.ConcurrentSkipListSet;
+import java.util.concurrent.ExecutorService;
+import java.util.concurrent.Executors;
+import java.util.concurrent.TimeUnit;
+import java.util.function.Function;
+import java.util.function.Supplier;
+import java.util.logging.Logger;
+
+import static java.util.logging.Level.FINE;
+import static java.util.logging.Level.INFO;
+import static java.util.logging.Level.WARNING;
+
+/**
+ * Performs on-demand redeployment of the {@link InfrastructureApplication}s, to minimise time between
+ * host provisioning for a deployment completing, and deployment of its application containers succeeding.
+ *
+ * @author jonmv
+ */
+public class InfraApplicationRedeployer implements AutoCloseable {
+
+ private static final Logger log = Logger.getLogger(InfraApplicationRedeployer.class.getName());
+
+ private final ExecutorService executor = Executors.newSingleThreadExecutor(new DaemonThreadFactory("infra-application-redeployer-"));
+ private final Set<InfrastructureApplication> readiedTypes = new ConcurrentSkipListSet<>();
+ private final InfraDeployer deployer;
+ private final Function<ApplicationId, Mutex> locks;
+ private final Supplier<NodeList> nodes;
+
+ @Inject
+ public InfraApplicationRedeployer(InfraDeployer deployer, NodeRepository nodes) {
+ this(deployer, nodes.applications()::lockMaintenance, nodes.nodes()::list);
+ }
+
+ InfraApplicationRedeployer(InfraDeployer deployer, Function<ApplicationId, Mutex> locks, Supplier<NodeList> nodes) {
+ this.deployer = deployer;
+ this.locks = locks;
+ this.nodes = nodes;
+ }
+
+ public void readied(NodeType type) {
+ applicationOf(type).ifPresent(this::readied);
+ }
+
+ private void readied(InfrastructureApplication application) {
+ if (application == null) return;
+ if (readiedTypes.add(application)) executor.execute(() -> checkAndRedeploy(application));
+ }
+
+ private void checkAndRedeploy(InfrastructureApplication application) {
+ if ( ! readiedTypes.remove(application)) return;
+ try (Mutex lock = locks.apply(application.id())) {
+ if (application.nodeType().isHost() && nodes.get().state(State.ready).nodeType(application.nodeType()).isEmpty()) return;
+ log.log(FINE, () -> "Redeploying " + application.id() + " after completing provisioning for " + application.name());
+ try {
+ deployer.getDeployment(application.id()).ifPresent(Deployment::activate);
+ childOf(application).ifPresent(this::readied);
+ }
+ catch (RuntimeException e) {
+ log.log(INFO, "Failed redeploying " + application.id() + ", will be retried by maintainer", e);
+ }
+ }
+ catch (UncheckedTimeoutException collision) {
+ readied(application);
+ }
+ }
+
+ private static Optional<InfrastructureApplication> applicationOf(NodeType type) {
+ return switch (type) {
+ case host -> Optional.of(InfrastructureApplication.TENANT_HOST);
+ case confighost -> Optional.of(InfrastructureApplication.CONFIG_SERVER_HOST);
+ case config -> Optional.of(InfrastructureApplication.CONFIG_SERVER);
+ case controllerhost -> Optional.of(InfrastructureApplication.CONTROLLER_HOST);
+ case controller -> Optional.of(InfrastructureApplication.CONTROLLER);
+ case proxyhost -> Optional.of(InfrastructureApplication.PROXY_HOST);
+ default -> Optional.empty();
+ };
+ }
+
+ private static Optional<InfrastructureApplication> childOf(InfrastructureApplication application) {
+ return switch (application) {
+ case CONFIG_SERVER_HOST -> Optional.of(InfrastructureApplication.CONFIG_SERVER);
+ case CONTROLLER_HOST -> Optional.of(InfrastructureApplication.CONTROLLER);
+ default -> Optional.empty();
+ };
+ }
+
+ @Override
+ public void close() {
+ executor.shutdown();
+ try {
+ if (executor.awaitTermination(10, TimeUnit.SECONDS)) return;
+ log.log(WARNING, "Redeployer did not shut down within 10 seconds");
+ }
+ catch (InterruptedException e) {
+ Thread.currentThread().interrupt();
+ }
+ executor.shutdownNow();
+ }
+
+}