1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
|
// Copyright Verizon Media. Licensed under the terms of the Apache 2.0 license. See LICENSE in the project root.
#include "env.h"
#include "check-completion-handler.h"
#include "connectivity.h"
#include <vespa/defaults.h>
#include <vespa/log/log.h>
#include <vespa/config/common/exceptions.h>
#include <vespa/vespalib/util/exceptions.h>
#include <vespa/vespalib/util/signalhandler.h>
#include <vespa/vespalib/util/stringfmt.h>
#include <thread>
#include <chrono>
LOG_SETUP(".env");
using vespalib::make_string_short::fmt;
using namespace std::chrono_literals;
namespace config::sentinel {
namespace {
void maybeStopNow() {
if (vespalib::SignalHandler::INT.check() ||
vespalib::SignalHandler::TERM.check())
{
throw vespalib::FatalException("got signal during boot()");
}
}
constexpr std::chrono::milliseconds CONFIG_TIMEOUT_MS = 3min;
constexpr int maxConnectivityRetries = 100;
} // namespace <unnamed>
Env::Env()
: _cfgOwner(),
_rpcCommandQueue(),
_rpcServer(),
_stateApi(),
_startMetrics(),
_stateServer(),
_statePort(0)
{
_startMetrics.startedTime = vespalib::steady_clock::now();
_stateApi.myHealth.setFailed("initializing...");
}
Env::~Env() = default;
void Env::boot(const std::string &configId) {
LOG(debug, "Reading configuration for ID: %s", configId.c_str());
_cfgOwner.subscribe(configId, CONFIG_TIMEOUT_MS);
// subscribe() should throw if something is not OK
Connectivity checker;
for (int retry = 0; retry < maxConnectivityRetries; ++retry) {
bool changed = _cfgOwner.checkForConfigUpdate();
LOG_ASSERT(changed || retry > 0);
if (changed) {
LOG_ASSERT(_cfgOwner.hasConfig());
const auto & cfg = _cfgOwner.getConfig();
LOG(config, "Booting sentinel '%s' with [stateserver port %d] and [rpc port %d]",
configId.c_str(), cfg.port.telnet, cfg.port.rpc);
rpcPort(cfg.port.rpc);
statePort(cfg.port.telnet);
checker.configure(cfg.connectivity);
}
if (checker.checkConnectivity(*_rpcServer)) {
_stateApi.myHealth.setOk();
return;
} else {
_stateApi.myHealth.setFailed("FAILED connectivity check");
if ((retry % 10) == 0) {
LOG(warning, "Bad network connectivity (try %d)", 1+retry);
}
for (int i = 0; i < 5; ++i) {
respondAsEmpty();
maybeStopNow();
std::this_thread::sleep_for(600ms);
}
}
}
throw vespalib::FatalException("Giving up - too many connectivity check failures");
}
void Env::rpcPort(int port) {
if (port < 0 || port > 65535) {
throw vespalib::FatalException("Bad port " + std::to_string(port) + ", expected range [1, 65535]", VESPA_STRLOC);
}
if (port == 0) {
port = 19097; // default in config
}
if (_rpcServer && port == _rpcServer->getPort()) {
return; // ok already
}
_rpcServer = std::make_unique<RpcServer>(port, _rpcCommandQueue);
}
void Env::statePort(int port) {
if (port < 0 || port > 65535) {
throw vespalib::FatalException("Bad port " + std::to_string(port) + ", expected range [1, 65535]", VESPA_STRLOC);
}
if (port == 0) {
port = 19098; // default in config
}
if (_stateServer && port == _statePort) {
return; // ok already
}
LOG(debug, "Config-sentinel accepts state connections on port %d", port);
_stateServer = std::make_unique<vespalib::StateServer>(
port, _stateApi.myHealth, _startMetrics.producer, _stateApi.myComponents);
_statePort = port;
}
void Env::notifyConfigUpdated() {
vespalib::ComponentConfigProducer::Config current("sentinel", _cfgOwner.getGeneration(), "ok");
_stateApi.myComponents.addConfig(current);
}
void Env::respondAsEmpty() {
auto commands = _rpcCommandQueue.drain();
for (Cmd::UP &cmd : commands) {
cmd->retError("still booting, not ready for all RPC commands");
}
}
}
|