aboutsummaryrefslogtreecommitdiffstats
path: root/node-repository/src/main/java/com/yahoo/vespa/hosted/provision/maintenance/InfraApplicationRedeployer.java
blob: 434e6161a4cd470d85970fc4d1499d56dc1ccac8 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
package com.yahoo.vespa.hosted.provision.maintenance;

import com.yahoo.component.annotation.Inject;
import com.yahoo.concurrent.DaemonThreadFactory;
import com.yahoo.concurrent.UncheckedTimeoutException;
import com.yahoo.config.provision.ApplicationId;
import com.yahoo.config.provision.Deployment;
import com.yahoo.config.provision.InfraDeployer;
import com.yahoo.config.provision.NodeType;
import com.yahoo.transaction.Mutex;
import com.yahoo.vespa.applicationmodel.InfrastructureApplication;
import com.yahoo.vespa.hosted.provision.Node.State;
import com.yahoo.vespa.hosted.provision.NodeList;
import com.yahoo.vespa.hosted.provision.NodeRepository;

import java.util.Optional;
import java.util.Set;
import java.util.concurrent.ConcurrentSkipListSet;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Executors;
import java.util.concurrent.TimeUnit;
import java.util.function.Function;
import java.util.function.Supplier;
import java.util.logging.Logger;

import static java.util.logging.Level.FINE;
import static java.util.logging.Level.INFO;
import static java.util.logging.Level.WARNING;

/**
 * Performs on-demand redeployment of the {@link InfrastructureApplication}s, to minimise time between
 * host provisioning for a deployment completing, and deployment of its application containers succeeding.
 *
 * @author jonmv
 */
public class InfraApplicationRedeployer implements AutoCloseable {

    private static final Logger log = Logger.getLogger(InfraApplicationRedeployer.class.getName());

    private final ExecutorService executor = Executors.newSingleThreadExecutor(new DaemonThreadFactory("infra-application-redeployer-"));
    private final Set<InfrastructureApplication> readiedTypes = new ConcurrentSkipListSet<>();
    private final InfraDeployer deployer;
    private final Function<ApplicationId, Mutex> locks;
    private final Supplier<NodeList> nodes;

    @Inject
    public InfraApplicationRedeployer(InfraDeployer deployer, NodeRepository nodes) {
        this(deployer, nodes.applications()::lockMaintenance, nodes.nodes()::list);
    }

    InfraApplicationRedeployer(InfraDeployer deployer, Function<ApplicationId, Mutex> locks, Supplier<NodeList> nodes) {
        this.deployer = deployer;
        this.locks = locks;
        this.nodes = nodes;
    }

    public void readied(NodeType type) {
        applicationOf(type).ifPresent(this::readied);
    }

    private void readied(InfrastructureApplication application) {
        if (application == null) return;
        if (readiedTypes.add(application)) executor.execute(() -> checkAndRedeploy(application));
    }

    private void checkAndRedeploy(InfrastructureApplication application) {
        if ( ! readiedTypes.remove(application)) return;
        try (Mutex lock = locks.apply(application.id())) {
            if (application.nodeType().isHost() && nodes.get().state(State.ready).nodeType(application.nodeType()).isEmpty()) return;
            log.log(FINE, () -> "Redeploying " + application.id() + " after completing provisioning for " + application.name());
            try {
                deployer.getDeployment(application.id()).ifPresent(Deployment::activate);
                childOf(application).ifPresent(this::readied);
            }
            catch (RuntimeException e) {
                log.log(INFO, "Failed redeploying " + application.id() + ", will be retried by maintainer", e);
            }
        }
        catch (UncheckedTimeoutException collision) {
            readied(application);
        }
    }

    private static Optional<InfrastructureApplication> applicationOf(NodeType type) {
        return switch (type) {
            case host -> Optional.of(InfrastructureApplication.TENANT_HOST);
            case confighost -> Optional.of(InfrastructureApplication.CONFIG_SERVER_HOST);
            case config -> Optional.of(InfrastructureApplication.CONFIG_SERVER);
            case controllerhost -> Optional.of(InfrastructureApplication.CONTROLLER_HOST);
            case controller -> Optional.of(InfrastructureApplication.CONTROLLER);
            case proxyhost -> Optional.of(InfrastructureApplication.PROXY_HOST);
            default -> Optional.empty();
        };
    }

    private static Optional<InfrastructureApplication> childOf(InfrastructureApplication application) {
        return switch (application) {
            case CONFIG_SERVER_HOST -> Optional.of(InfrastructureApplication.CONFIG_SERVER);
            case CONTROLLER_HOST -> Optional.of(InfrastructureApplication.CONTROLLER);
            default -> Optional.empty();
        };
    }

    @Override
    public void close() {
        executor.shutdown();
        try {
            if (executor.awaitTermination(10, TimeUnit.SECONDS)) return;
            log.log(WARNING, "Redeployer did not shut down within 10 seconds");
        }
        catch (InterruptedException e) {
            Thread.currentThread().interrupt();
        }
        executor.shutdownNow();
    }

}