1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
|
// Copyright 2020 Oath Inc. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
package com.yahoo.vespa.hosted.controller.maintenance;
import com.yahoo.config.provision.CloudName;
import com.yahoo.config.provision.zone.ZoneApi;
import com.yahoo.text.Text;
import com.yahoo.vespa.hosted.controller.Controller;
import com.yahoo.vespa.hosted.controller.api.integration.aws.AwsEventFetcher;
import com.yahoo.vespa.hosted.controller.api.integration.aws.CloudEvent;
import com.yahoo.vespa.hosted.controller.api.integration.configserver.Node;
import com.yahoo.vespa.hosted.controller.api.integration.configserver.NodeRepository;
import java.time.Duration;
import java.util.List;
import java.util.Map;
import java.util.logging.Logger;
import java.util.stream.Collectors;
/**
* Automatically fetches and handles scheduled events from AWS:
* 1. Deprovisions the affected hosts if applicable
* 2. Submits an issue detailing the event if some hosts are not processed by 1.
*
* @author mgimle
*/
public class CloudEventReporter extends ControllerMaintainer {
private static final Logger log = Logger.getLogger(CloudEventReporter.class.getName());
private final AwsEventFetcher eventFetcher;
private final Map<String, List<ZoneApi>> zonesByCloudNativeRegion;
private final NodeRepository nodeRepository;
CloudEventReporter(Controller controller, Duration interval) {
super(controller, interval);
this.eventFetcher = controller.serviceRegistry().eventFetcherService();
this.nodeRepository = controller.serviceRegistry().configServer().nodeRepository();
this.zonesByCloudNativeRegion = supportedZonesByRegion();
}
@Override
protected double maintain() {
for (var region : zonesByCloudNativeRegion.keySet()) {
List<CloudEvent> events = eventFetcher.getEvents(region);
for (var event : events) {
log.info(Text.format("Retrieved event %s, affecting the following instances: %s",
event.instanceEventId,
event.affectedInstances));
deprovisionAffectedHosts(region, event);
}
}
return 1.0;
}
/** Deprovision any host affected by given event */
private void deprovisionAffectedHosts(String region, CloudEvent event) {
for (var zone : zonesByCloudNativeRegion.get(region)) {
for (var node : nodeRepository.list(zone.getId(), false)) {
if (!affects(node, event)) continue;
log.info("Retiring and deprovisioning " + node.hostname().value() + " in " + zone.getId() +
": Affected by maintenance event " + event.instanceEventId);
nodeRepository.retire(zone.getId(), node.hostname().value(), true, true);
}
}
}
private static boolean affects(Node node, CloudEvent event) {
if (!node.type().isHost()) return false; // Non-hosts are never affected
return event.affectedInstances.stream()
.anyMatch(instance -> node.hostname().value().contains(instance));
}
/** Returns zones supported by this, grouped by their native region name */
private Map<String, List<ZoneApi>> supportedZonesByRegion() {
return controller().zoneRegistry().zones()
.ofCloud(CloudName.from("aws"))
.reachable()
.zones().stream()
.collect(Collectors.groupingBy(ZoneApi::getCloudNativeRegionName));
}
}
|