summaryrefslogtreecommitdiffstats
path: root/node-repository/src/test/java/com/yahoo/vespa/hosted/provision/maintenance/FailedExpirerTest.java
blob: a1d9268ee33e0320a4c74a93ae07a3f18fabe678 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
// Copyright 2016 Yahoo Inc. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
package com.yahoo.vespa.hosted.provision.maintenance;

import com.yahoo.config.provision.ApplicationId;
import com.yahoo.config.provision.ApplicationName;
import com.yahoo.config.provision.Capacity;
import com.yahoo.config.provision.ClusterSpec;
import com.yahoo.config.provision.Environment;
import com.yahoo.config.provision.HostSpec;
import com.yahoo.config.provision.InstanceName;
import com.yahoo.config.provision.RegionName;
import com.yahoo.config.provision.TenantName;
import com.yahoo.config.provision.Zone;
import com.yahoo.test.ManualClock;
import com.yahoo.transaction.NestedTransaction;
import com.yahoo.vespa.curator.Curator;
import com.yahoo.vespa.curator.mock.MockCurator;
import com.yahoo.vespa.curator.transaction.CuratorTransaction;
import com.yahoo.vespa.hosted.provision.Node;
import com.yahoo.vespa.hosted.provision.NodeRepository;
import com.yahoo.vespa.hosted.provision.node.Configuration;
import com.yahoo.vespa.hosted.provision.node.NodeFlavors;
import com.yahoo.vespa.hosted.provision.provisioning.NodeRepositoryProvisioner;
import com.yahoo.vespa.hosted.provision.testutils.FlavorConfigBuilder;
import org.junit.Test;

import java.time.Duration;
import java.util.ArrayList;
import java.util.HashSet;
import java.util.List;
import java.util.Optional;
import java.util.Set;

import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertFalse;

/**
 * Tests {@link FailedExpirer}: after the configured expiry time has passed, the expirer is
 * run against a set of failed tenant nodes and the resulting node states are checked.
 * The expected outcome differs between the prod and dev environments.
 *
 * @author bratseth
 */
public class FailedExpirerTest {

    /** Name of the single dummy flavor used for every node in these tests */
    private static final String FLAVOR_NAME = "default";

    /** The number of earlier failures recorded on node1 before the scenario fails it again */
    private static final int PREVIOUS_FAILURES_OF_NODE1 = 4;

    private final Curator curator = new MockCurator();

    /**
     * In prod, only node3 (no recorded earlier failures, no hardware failure) is expected to be
     * moved to dirty; node1 and node2 are expected to remain failed.
     */
    @Test
    public void ensure_failed_nodes_are_deallocated_in_prod() {
        NodeRepository nodeRepository = failureScenarioIn(Environment.prod);

        assertEquals(2, nodeRepository.getNodes(Node.Type.tenant, Node.State.failed).size());
        assertEquals(1, nodeRepository.getNodes(Node.Type.tenant, Node.State.dirty).size());
        assertEquals("node3", nodeRepository.getNodes(Node.Type.tenant, Node.State.dirty).get(0).hostname());
    }

    /**
     * In dev, only node2 (flagged with a hardware failure) is expected to remain failed;
     * the two other nodes are expected to be moved to dirty.
     */
    @Test
    public void ensure_failed_nodes_are_deallocated_in_dev() {
        NodeRepository nodeRepository = failureScenarioIn(Environment.dev);

        assertEquals(1, nodeRepository.getNodes(Node.Type.tenant, Node.State.failed).size());
        assertEquals(2, nodeRepository.getNodes(Node.Type.tenant, Node.State.dirty).size());
        assertEquals("node2", nodeRepository.getNodes(Node.Type.tenant, Node.State.failed).get(0).hostname());
    }

    /**
     * Builds a node repository with three tenant nodes (node1-node3) and two host nodes,
     * allocates and activates the tenant nodes for one application, fails all three of them,
     * advances the clock by 5 days and then runs a {@link FailedExpirer} configured with a
     * 4 day expiry in a zone of the given environment.
     *
     * Before allocation node1 gets its fail count increased
     * {@value #PREVIOUS_FAILURES_OF_NODE1} times and node2 is flagged with a hardware failure;
     * node3 is left untouched.
     *
     * @param environment the environment of the zone the expirer is run in
     * @return the node repository as it looks after the expirer has run
     */
    private NodeRepository failureScenarioIn(Environment environment) {
        ManualClock clock = new ManualClock();
        NodeFlavors nodeFlavors = FlavorConfigBuilder.createDummies(FLAVOR_NAME);
        NodeRepository nodeRepository = new NodeRepository(nodeFlavors, curator, clock);
        NodeRepositoryProvisioner provisioner = new NodeRepositoryProvisioner(nodeRepository, nodeFlavors, Zone.defaultZone(), clock);

        List<Node> nodes = new ArrayList<>(3);
        nodes.add(createNode("node1", Node.Type.tenant, nodeRepository, nodeFlavors));
        nodes.add(createNode("node2", Node.Type.tenant, nodeRepository, nodeFlavors));
        nodes.add(createNode("node3", Node.Type.tenant, nodeRepository, nodeFlavors));
        nodeRepository.addNodes(nodes);

        List<Node> hostNodes = new ArrayList<>(2);
        hostNodes.add(createNode("parent1", Node.Type.host, nodeRepository, nodeFlavors));
        hostNodes.add(createNode("parent2", Node.Type.host, nodeRepository, nodeFlavors));
        nodeRepository.addNodes(hostNodes);

        // Set node1 to have failed 4 times before
        Node node1 = nodeRepository.getNode("node1").get();
        for (int i = 0; i < PREVIOUS_FAILURES_OF_NODE1; i++) {
            node1 = node1.setStatus(node1.status().increaseFailCount());
        }
        nodeRepository.write(node1);

        // Set node2 to have a detected hardware failure
        Node node2 = nodeRepository.getNode("node2").get();
        node2 = node2.setStatus(node2.status().setHardwareFailure(true));
        nodeRepository.write(node2);

        // Allocate the nodes
        nodeRepository.setReady(nodeRepository.getNodes(Node.Type.tenant, Node.State.provisioned));
        ApplicationId applicationId = ApplicationId.from(TenantName.from("foo"), ApplicationName.from("bar"), InstanceName.from("fuz"));
        ClusterSpec cluster = ClusterSpec.from(ClusterSpec.Type.content, ClusterSpec.Id.from("test"), Optional.empty());
        provisioner.prepare(applicationId, cluster, Capacity.fromNodeCount(3), 1, null);
        NestedTransaction transaction = new NestedTransaction().add(new CuratorTransaction(curator));
        // NOTE(review): the host specs are built from the node objects created above, i.e. from
        // before prepare() ran, not from the result of prepare() - confirm this is intended
        provisioner.activate(transaction, applicationId, asHosts(nodes));
        transaction.commit();
        assertEquals(3, nodeRepository.getNodes(Node.Type.tenant, Node.State.active).size());

        // Fail the nodes
        nodeRepository.fail("node1");
        nodeRepository.fail("node2");
        nodeRepository.fail("node3");
        assertEquals(3, nodeRepository.getNodes(Node.Type.tenant, Node.State.failed).size());

        // Failure times out: 5 days pass, which is more than the 4 days given to the expirer
        clock.advance(Duration.ofDays(5));
        new FailedExpirer(nodeRepository, new Zone(environment, RegionName.from("us-west-1")), clock, Duration.ofDays(4)).run();

        return nodeRepository;
    }

    /**
     * Creates (but does not add) a node of the dummy flavor. The given name is passed as both
     * the first and the second argument of {@code NodeRepository.createNode}.
     */
    private Node createNode(String name, Node.Type type, NodeRepository nodeRepository, NodeFlavors nodeFlavors) {
        return nodeRepository.createNode(name, name, Optional.empty(),
                                         new Configuration(nodeFlavors.getFlavorOrThrow(FLAVOR_NAME)), type);
    }

    /**
     * Converts nodes to host specs carrying the hostname of each node, and the membership
     * of its allocation if it has one (otherwise an empty membership).
     */
    private Set<HostSpec> asHosts(List<Node> nodes) {
        Set<HostSpec> hosts = new HashSet<>(nodes.size());
        for (Node node : nodes) {
            hosts.add(new HostSpec(node.hostname(),
                                   node.allocation().map(allocation -> allocation.membership())));
        }
        return hosts;
    }

}