1
#include "source/common/upstream/cluster_manager_impl.h"
2

            
3
#include <chrono>
4
#include <cstdint>
5
#include <functional>
6
#include <memory>
7
#include <string>
8
#include <vector>
9

            
10
#include "envoy/admin/v3/config_dump.pb.h"
11
#include "envoy/config/bootstrap/v3/bootstrap.pb.h"
12
#include "envoy/config/cluster/v3/cluster.pb.h"
13
#include "envoy/config/core/v3/config_source.pb.h"
14
#include "envoy/config/core/v3/protocol.pb.h"
15
#include "envoy/event/dispatcher.h"
16
#include "envoy/grpc/async_client.h"
17
#include "envoy/network/dns.h"
18
#include "envoy/runtime/runtime.h"
19
#include "envoy/stats/scope.h"
20
#include "envoy/tcp/async_tcp_client.h"
21
#include "envoy/upstream/load_balancer.h"
22
#include "envoy/upstream/upstream.h"
23

            
24
#include "source/common/common/assert.h"
25
#include "source/common/common/enum_to_int.h"
26
#include "source/common/common/fmt.h"
27
#include "source/common/common/utility.h"
28
#include "source/common/config/null_grpc_mux_impl.h"
29
#include "source/common/config/utility.h"
30
#include "source/common/config/xds_resource.h"
31
#include "source/common/grpc/async_client_manager_impl.h"
32
#include "source/common/http/async_client_impl.h"
33
#include "source/common/http/http1/conn_pool.h"
34
#include "source/common/http/http2/conn_pool.h"
35
#include "source/common/http/mixed_conn_pool.h"
36
#include "source/common/network/utility.h"
37
#include "source/common/protobuf/utility.h"
38
#include "source/common/router/shadow_writer_impl.h"
39
#include "source/common/runtime/runtime_features.h"
40
#include "source/common/tcp/conn_pool.h"
41
#include "source/common/upstream/cds_api_impl.h"
42
#include "source/common/upstream/cluster_factory_impl.h"
43
#include "source/common/upstream/load_balancer_context_base.h"
44
#include "source/common/upstream/load_stats_reporter_impl.h"
45
#include "source/common/upstream/priority_conn_pool_map_impl.h"
46

            
47
#include "absl/hash/hash.h"
48
#include "absl/status/status.h"
49

            
50
#ifdef ENVOY_ENABLE_QUIC
51
#include "source/common/http/conn_pool_grid.h"
52
#include "source/common/http/http3/conn_pool.h"
53
#include "source/common/quic/client_connection_factory_impl.h"
54
#endif
55

            
56
namespace Envoy {
57
namespace Upstream {
58
namespace {
59

            
60
void addOptionsIfNotNull(Network::Socket::OptionsSharedPtr& options,
61
96150
                         const Network::Socket::OptionsSharedPtr& to_add) {
62
96150
  if (to_add != nullptr) {
63
43831
    Network::Socket::appendOptions(options, to_add);
64
43831
  }
65
96150
}
66

            
67
// Helper function to make sure each protocol in expected_protocols is present
68
// in protocols (only used for an ASSERT in debug builds)
69
bool contains(const std::vector<Http::Protocol>& protocols,
70
              const std::vector<Http::Protocol>& expected_protocols) {
71
  for (auto protocol : expected_protocols) {
72
    if (std::find(protocols.begin(), protocols.end(), protocol) == protocols.end()) {
73
      return false;
74
    }
75
  }
76
  return true;
77
}
78

            
79
// Derives the HTTPS origin (scheme, SNI, port) for `host`, preferring an explicit SNI
// override from the transport socket options over the socket factory's default.
// Returns nullopt when there is no usable SNI or the host has no IP address.
absl::optional<Http::HttpServerPropertiesCache::Origin>
getOrigin(const Network::TransportSocketOptionsConstSharedPtr& options, HostConstSharedPtr host) {
  std::string sni;
  if (options != nullptr && options->serverNameOverride().has_value()) {
    sni = options->serverNameOverride().value();
  } else {
    sni = std::string(host->transportSocketFactory().defaultServerNameIndication());
  }
  const auto& address = host->address();
  if (sni.empty() || address == nullptr || address->ip() == nullptr) {
    return absl::nullopt;
  }
  return {{"https", sni, address->ip()->port()}};
}
90

            
91
// Returns true if `cluster_name` backs the ADS config (primary, or failover when the
// xds_failover_support runtime feature is enabled), meaning ADS mux initialization must
// wait for this cluster to initialize first.
bool isBlockingAdsCluster(const envoy::config::bootstrap::v3::Bootstrap& bootstrap,
                          absl::string_view cluster_name) {
  if (!bootstrap.dynamic_resources().has_ads_config()) {
    return false;
  }
  const auto& ads_config_source = bootstrap.dynamic_resources().ads_config();
  // We only care about EnvoyGrpc, not GoogleGrpc, because we only need to delay ADS mux
  // initialization if it uses an Envoy cluster that needs to be initialized first. We don't
  // depend on the same cluster initialization when opening a gRPC stream for GoogleGrpc.
  const auto names_cluster_at = [&ads_config_source, cluster_name](int index) {
    return ads_config_source.grpc_services(index).has_envoy_grpc() &&
           ads_config_source.grpc_services(index).envoy_grpc().cluster_name() == cluster_name;
  };
  bool blocking_ads_cluster =
      ads_config_source.grpc_services_size() > 0 && names_cluster_at(0);
  if (Runtime::runtimeFeatureEnabled("envoy.restart_features.xds_failover_support")) {
    // Validate the failover server if there is one.
    blocking_ads_cluster =
        blocking_ads_cluster ||
        (ads_config_source.grpc_services_size() == 2 && names_cluster_at(1));
  }
  return blocking_ads_cluster;
}
113

            
114
} // namespace
115

            
116
16609
// Registers a cluster with the init helper, marks it as warming, and kicks off its
// initialization (immediately for primary clusters; for secondary clusters only once
// secondary initialization has started).
void ClusterManagerInitHelper::addCluster(ClusterManagerCluster& cm_cluster) {
  // See comments in ClusterManagerImpl::addOrUpdateCluster() for why this is only called during
  // server initialization.
  ASSERT(state_ != State::AllClustersInitialized);

  Cluster& cluster = cm_cluster.cluster();
  const auto on_initialized = [&cm_cluster, this] {
    RETURN_IF_NOT_OK(onClusterInit(cm_cluster));
    // Clear the warming gauge now that initialization has completed.
    cm_cluster.cluster().info()->configUpdateStats().warming_state_.set(0);
    return absl::OkStatus();
  };

  cluster.info()->configUpdateStats().warming_state_.set(1);
  const bool is_primary = cluster.initializePhase() == Cluster::InitializePhase::Primary;
  if (is_primary) {
    // Remove the previous cluster before the cluster object is destroyed.
    primary_init_clusters_.insert_or_assign(cluster.info()->name(), &cm_cluster);
    cluster.initialize(on_initialized);
  } else {
    ASSERT(cluster.initializePhase() == Cluster::InitializePhase::Secondary);
    // Remove the previous cluster before the cluster object is destroyed.
    secondary_init_clusters_.insert_or_assign(cluster.info()->name(), &cm_cluster);
    if (started_secondary_initialize_) {
      // This can happen if we get a second CDS update that adds new clusters after we have
      // already started secondary init. In this case, just immediately initialize.
      cluster.initialize(on_initialized);
    }
  }

  ENVOY_LOG(debug, "cm init: adding: cluster={} primary={} secondary={}", cluster.info()->name(),
            primary_init_clusters_.size(), secondary_init_clusters_.size());
}
147

            
148
16432
// Runs the per-cluster init hook for a finished cluster; only deregisters the cluster
// from the pending maps when the hook succeeds.
absl::Status ClusterManagerInitHelper::onClusterInit(ClusterManagerCluster& cluster) {
  ASSERT(state_ != State::AllClustersInitialized);
  const absl::Status callback_status = per_cluster_init_callback_(cluster);
  if (!callback_status.ok()) {
    return callback_status;
  }
  removeCluster(cluster);
  return absl::OkStatus();
}
154

            
155
17106
// Deregisters `cluster` from the appropriate pending-init map (if still present) and
// advances the init state machine.
void ClusterManagerInitHelper::removeCluster(ClusterManagerCluster& cluster) {
  if (state_ == State::AllClustersInitialized) {
    return;
  }

  // There is a remote edge case where we can remove a cluster via CDS that has not yet been
  // initialized. When called via the remove cluster API this code catches that case.
  const bool is_primary =
      cluster.cluster().initializePhase() == Cluster::InitializePhase::Primary;
  ASSERT(is_primary ||
         cluster.cluster().initializePhase() == Cluster::InitializePhase::Secondary);
  absl::flat_hash_map<std::string, ClusterManagerCluster*>& cluster_map =
      is_primary ? primary_init_clusters_ : secondary_init_clusters_;

  // It is possible that the cluster we are removing has already been initialized, and is not
  // present in the initializer map. If so, this is fine as a CDS update may happen for a
  // cluster with the same name. See the case "UpdateAlreadyInitialized" of the
  // target //test/common/upstream:cluster_manager_impl_test.
  const auto iter = cluster_map.find(cluster.cluster().info()->name());
  if (iter != cluster_map.end() && iter->second == &cluster) {
    cluster_map.erase(iter);
  }
  ENVOY_LOG(debug, "cm init: init complete: cluster={} primary={} secondary={}",
            cluster.cluster().info()->name(), primary_init_clusters_.size(),
            secondary_init_clusters_.size());
  maybeFinishInitialize();
}
183

            
184
311
void ClusterManagerInitHelper::initializeSecondaryClusters() {
185
311
  started_secondary_initialize_ = true;
186
  // Cluster::initialize() method can modify the map of secondary_init_clusters_ to remove
187
  // the item currently being initialized, so we eschew range-based-for and do this complicated
188
  // dance to increment the iterator before calling initialize.
189
646
  for (auto iter = secondary_init_clusters_.begin(); iter != secondary_init_clusters_.end();) {
190
335
    ClusterManagerCluster* cluster = iter->second;
191
335
    ENVOY_LOG(debug, "initializing secondary cluster {}", iter->first);
192
335
    ++iter;
193
335
    cluster->cluster().initialize([cluster, this] { return onClusterInit(*cluster); });
194
335
  }
195
311
}
196

            
197
38953
// Advances the cluster-manager init state machine. Called whenever a cluster finishes
// initializing or a state transition occurs; decides, in order, whether to: wait for
// primary clusters, fire the primary-clusters-ready callback, kick off secondary-cluster
// init, start CDS init, or declare all clusters initialized.
void ClusterManagerInitHelper::maybeFinishInitialize() {
  // Do not do anything if we are still doing the initial static load or if we are waiting for
  // CDS initialize.
  ENVOY_LOG(debug, "maybe finish initialize state: {}", enumToInt(state_));
  if (state_ == State::Loading || state_ == State::WaitingToStartCdsInitialization) {
    return;
  }

  ASSERT(state_ == State::WaitingToStartSecondaryInitialization ||
         state_ == State::CdsInitialized ||
         state_ == State::WaitingForPrimaryInitializationToComplete);
  ENVOY_LOG(debug, "maybe finish initialize primary init clusters empty: {}",
            primary_init_clusters_.empty());
  // If we are still waiting for primary clusters to initialize, do nothing.
  if (!primary_init_clusters_.empty()) {
    return;
  } else if (state_ == State::WaitingForPrimaryInitializationToComplete) {
    // All primary clusters are done: transition and notify (once) whoever registered
    // interest in primary-cluster readiness.
    state_ = State::WaitingToStartSecondaryInitialization;
    if (primary_clusters_initialized_callback_) {
      primary_clusters_initialized_callback_();
    }
    return;
  }

  // If we are still waiting for secondary clusters to initialize, see if we need to first call
  // initialize on them. This is only done once.
  ENVOY_LOG(debug, "maybe finish initialize secondary init clusters empty: {}",
            secondary_init_clusters_.empty());
  if (!secondary_init_clusters_.empty()) {
    if (!started_secondary_initialize_) {
      ENVOY_LOG(info, "cm init: initializing secondary clusters");
      // If the first CDS response doesn't have any primary cluster, ClusterLoadAssignment
      // should be already paused by CdsApiImpl::onConfigUpdate(). Need to check that to
      // avoid double pause ClusterLoadAssignment.
      const std::vector<std::string> paused_xds_types{
          Config::getTypeUrl<envoy::config::endpoint::v3::ClusterLoadAssignment>(),
          Config::getTypeUrl<envoy::config::endpoint::v3::LbEndpoint>(),
          Config::getTypeUrl<envoy::extensions::transport_sockets::tls::v3::Secret>()};
      // NOTE(review): the ScopedResume name suggests discovery for these types resumes when
      // this object goes out of scope after initializeSecondaryClusters() returns — confirm.
      Config::ScopedResume resume_eds_leds_sds = xds_manager_.pause(paused_xds_types);
      initializeSecondaryClusters();
    }
    return;
  }

  // At this point, if we are doing static init, and we have CDS, start CDS init. Otherwise, move
  // directly to initialized.
  started_secondary_initialize_ = false;
  ENVOY_LOG(debug, "maybe finish initialize cds api ready: {}", cds_ != nullptr);
  if (state_ == State::WaitingToStartSecondaryInitialization && cds_) {
    ENVOY_LOG(info, "cm init: initializing cds");
    state_ = State::WaitingToStartCdsInitialization;
    cds_->initialize();
  } else {
    ENVOY_LOG(info, "cm init: all clusters initialized");
    state_ = State::AllClustersInitialized;
    if (initialized_callback_) {
      initialized_callback_();
    }
  }
}
257

            
258
11000
// Called once all static bootstrap clusters have been added to the helper; moves the
// state machine from Loading to waiting on primary-cluster initialization, then checks
// whether it can advance further immediately (e.g. all clusters are static).
void ClusterManagerInitHelper::onStaticLoadComplete() {
  ASSERT(state_ == State::Loading);
  // After initialization of primary clusters has completed, transition to
  // waiting for signal to initialize secondary clusters and then CDS.
  state_ = State::WaitingForPrimaryInitializationToComplete;
  maybeFinishInitialize();
}
265

            
266
10822
// External signal that secondary-cluster initialization may proceed. Only valid once all
// primary clusters are done (WaitingToStartSecondaryInitialization); delegates the actual
// work to maybeFinishInitialize().
void ClusterManagerInitHelper::startInitializingSecondaryClusters() {
  ASSERT(state_ == State::WaitingToStartSecondaryInitialization);
  ENVOY_LOG(debug, "continue initializing secondary clusters");
  maybeFinishInitialize();
}
271

            
272
10992
// Records the CDS API handle (may be null when CDS is not configured) and, when present,
// wires its initialized callback into the init state machine.
void ClusterManagerInitHelper::setCds(CdsApi* cds) {
  ASSERT(state_ == State::Loading);
  cds_ = cds;
  if (cds_ == nullptr) {
    return;
  }
  cds_->setInitializedCb([this]() -> void {
    ASSERT(state_ == State::WaitingToStartCdsInitialization);
    state_ = State::CdsInitialized;
    maybeFinishInitialize();
  });
}
283

            
284
void ClusterManagerInitHelper::setInitializedCb(
285
10681
    ClusterManager::InitializationCompleteCallback callback) {
286
10681
  if (state_ == State::AllClustersInitialized) {
287
9942
    callback();
288
10507
  } else {
289
739
    initialized_callback_ = callback;
290
739
  }
291
10681
}
292

            
293
void ClusterManagerInitHelper::setPrimaryClustersInitializedCb(
294
10827
    ClusterManager::PrimaryClustersReadyCallback callback) {
295
  // The callback must be set before or at the `WaitingToStartSecondaryInitialization` state.
296
10827
  ASSERT(state_ == State::WaitingToStartSecondaryInitialization ||
297
10827
         state_ == State::WaitingForPrimaryInitializationToComplete || state_ == State::Loading);
298
10827
  if (state_ == State::WaitingToStartSecondaryInitialization) {
299
    // This is the case where all clusters are STATIC and without health checking.
300
10698
    callback();
301
10740
  } else {
302
129
    primary_clusters_initialized_callback_ = callback;
303
129
  }
304
10827
}
305

            
306
// Constructs the cluster manager from bootstrap config. Any failure is reported through
// `creation_status` (via SET_AND_RETURN_IF_NOT_OK) rather than by throwing. Sets up the
// admin "clusters" config dump, the gRPC async-client manager, optional outlier-detection
// event logging, the local-cluster name, and finally initializes the xDS manager.
ClusterManagerImpl::ClusterManagerImpl(const envoy::config::bootstrap::v3::Bootstrap& bootstrap,
                                       ClusterManagerFactory& factory,
                                       Server::Configuration::ServerFactoryContext& context,
                                       absl::Status& creation_status)
    : context_(context), factory_(factory), runtime_(context.runtime()),
      stats_(context.serverScope().store()), tls_(context.threadLocal()),
      xds_manager_(context.xdsManager()), random_(context.api().randomGenerator()),
      deferred_cluster_creation_(bootstrap.cluster_manager().enable_deferred_cluster_creation()),
      bind_config_(bootstrap.cluster_manager().has_upstream_bind_config()
                       ? absl::make_optional(bootstrap.cluster_manager().upstream_bind_config())
                       : absl::nullopt),
      local_info_(context.localInfo()), cm_stats_(generateStats(*stats_.rootScope())),
      // The init helper calls back into this object whenever a cluster finishes initializing.
      init_helper_(xds_manager_,
                   [this](ClusterManagerCluster& cluster) { return onClusterInit(cluster); }),
      time_source_(context.timeSource()), dispatcher_(context.mainThreadDispatcher()),
      http_context_(context.httpContext()), router_context_(context.routerContext()),
      cluster_stat_names_(stats_.symbolTable()),
      cluster_config_update_stat_names_(stats_.symbolTable()),
      cluster_lb_stat_names_(stats_.symbolTable()),
      cluster_endpoint_stat_names_(stats_.symbolTable()),
      cluster_load_report_stat_names_(stats_.symbolTable()),
      cluster_circuit_breakers_stat_names_(stats_.symbolTable()),
      cluster_request_response_size_stat_names_(stats_.symbolTable()),
      cluster_timeout_budget_stat_names_(stats_.symbolTable()),
      common_lb_config_pool_(
          std::make_shared<SharedPool::ObjectSharedPool<
              const envoy::config::cluster::v3::Cluster::CommonLbConfig, MessageUtil, MessageUtil>>(
              dispatcher_)),
      shutdown_(false) {
  // Register the "clusters" config-dump handler when an admin interface exists.
  if (auto admin = context.admin(); admin.has_value()) {
    config_tracker_entry_ = admin->getConfigTracker().add(
        "clusters", [this](const Matchers::StringMatcher& name_matcher) {
          return dumpClusterConfigs(name_matcher);
        });
  }
  async_client_manager_ = std::make_unique<Grpc::AsyncClientManagerImpl>(
      bootstrap.grpc_async_client_manager_config(), context, context.grpcContext().statNames());
  const auto& cm_config = bootstrap.cluster_manager();
  // Optional outlier-detection event log; a create failure aborts construction.
  if (cm_config.has_outlier_detection()) {
    const std::string event_log_file_path = cm_config.outlier_detection().event_log_path();
    if (!event_log_file_path.empty()) {
      auto outlier_or_error = Outlier::EventLoggerImpl::create(context.accessLogManager(),
                                                               event_log_file_path, time_source_);
      SET_AND_RETURN_IF_NOT_OK(outlier_or_error.status(), creation_status);
      outlier_event_logger_ = std::move(*outlier_or_error);
    }
  }

  // We need to know whether we're zone aware early on, so make sure we do this lookup
  // before we load any clusters.
  if (!cm_config.local_cluster_name().empty()) {
    local_cluster_name_ = cm_config.local_cluster_name();
  }

  // Now that the async-client manager is set, the xDS-Manager can be initialized.
  SET_AND_RETURN_IF_NOT_OK(xds_manager_.initialize(bootstrap, this), creation_status);
}
363

            
364
// One-time bootstrap of all static clusters, in two phases (primary, then secondary/EDS),
// followed by thread-local cluster-manager setup, optional CDS creation, init-manager
// registration, and starting the ADS / xDS-TP muxes. Returns the first error encountered.
absl::Status
ClusterManagerImpl::initialize(const envoy::config::bootstrap::v3::Bootstrap& bootstrap) {
  ASSERT(!initialized_);
  initialized_ = true;

  // Cluster loading happens in two phases: first all the primary clusters are loaded, and then all
  // the secondary clusters are loaded. As it currently stands all non-EDS clusters and EDS which
  // load endpoint definition from file are primary and
  // (REST,GRPC,DELTA_GRPC) EDS clusters are secondary. This two phase
  // loading is done because in v2 configuration each EDS cluster individually sets up a
  // subscription. When this subscription is an API source the cluster will depend on a non-EDS
  // cluster, so the non-EDS clusters must be loaded first.
  auto is_primary_cluster = [](const envoy::config::cluster::v3::Cluster& cluster) -> bool {
    return cluster.type() != envoy::config::cluster::v3::Cluster::EDS ||
           (cluster.type() == envoy::config::cluster::v3::Cluster::EDS &&
            Config::SubscriptionFactory::isPathBasedConfigSource(
                cluster.eds_cluster_config().eds_config().config_source_specifier_case()));
  };
  // Build book-keeping for which clusters are primary. This is useful when we
  // invoke loadCluster() below and it needs the complete set of primaries.
  for (const auto& cluster : bootstrap.static_resources().clusters()) {
    if (is_primary_cluster(cluster)) {
      primary_clusters_.insert(cluster.name());
    }
  }

  bool has_ads_cluster = false;
  // Load all the primary clusters.
  for (const auto& cluster : bootstrap.static_resources().clusters()) {
    if (is_primary_cluster(cluster)) {
      const bool required_for_ads = isBlockingAdsCluster(bootstrap, cluster.name());
      has_ads_cluster |= required_for_ads;
      // TODO(abeyad): Consider passing a lambda for a "post-cluster-init" callback, which would
      // include a conditional ads_mux_->start() call, if other uses cases for "post-cluster-init"
      // functionality pops up.
      auto status_or_cluster =
          loadCluster(cluster, MessageUtil::hash(cluster), "", /*added_via_api=*/false,
                      required_for_ads, active_clusters_);
      RETURN_IF_NOT_OK_REF(status_or_cluster.status());
    }
  }

  // Now setup ADS if needed, this might rely on a primary cluster.
  RETURN_IF_NOT_OK(xds_manager_.initializeAdsConnections(bootstrap));

  // After ADS is initialized, load EDS static clusters as EDS config may potentially need ADS.
  for (const auto& cluster : bootstrap.static_resources().clusters()) {
    // Now load all the secondary clusters.
    if (cluster.type() == envoy::config::cluster::v3::Cluster::EDS &&
        !Config::SubscriptionFactory::isPathBasedConfigSource(
            cluster.eds_cluster_config().eds_config().config_source_specifier_case())) {
      ASSERT(!isBlockingAdsCluster(bootstrap, cluster.name()));
      // Passing "false" for required_for_ads because an ADS cluster cannot be
      // defined using EDS (or non-primary cluster).
      auto status_or_cluster =
          loadCluster(cluster, MessageUtil::hash(cluster), "", /*added_via_api=*/false,
                      /*required_for_ads=*/false, active_clusters_);
      if (!status_or_cluster.status().ok()) {
        return status_or_cluster.status();
      }
    }
  }

  cm_stats_.cluster_added_.add(bootstrap.static_resources().clusters().size());
  updateClusterCounts();

  // Resolve the optional local (zone-aware) cluster; it must exist among the static clusters.
  absl::optional<ThreadLocalClusterManagerImpl::LocalClusterParams> local_cluster_params;
  if (local_cluster_name_) {
    auto local_cluster = active_clusters_.find(local_cluster_name_.value());
    if (local_cluster == active_clusters_.end()) {
      return absl::InvalidArgumentError(
          fmt::format("local cluster '{}' must be defined", local_cluster_name_.value()));
    }
    local_cluster_params.emplace();
    local_cluster_params->info_ = local_cluster->second->cluster().info();
    local_cluster_params->load_balancer_factory_ = local_cluster->second->loadBalancerFactory();
    local_cluster->second->setAddedOrUpdated();
  }

  // Once the initial set of static bootstrap clusters are created (including the local cluster),
  // we can instantiate the thread local cluster manager.
  tls_.set([this, local_cluster_params](Event::Dispatcher& dispatcher) {
    return std::make_shared<ThreadLocalClusterManagerImpl>(*this, dispatcher, local_cluster_params);
  });

  const auto& dyn_resources = bootstrap.dynamic_resources();
  // We can now potentially create the CDS API once the backing cluster exists.
  if (dyn_resources.has_cds_config() || !dyn_resources.cds_resources_locator().empty()) {
    std::unique_ptr<xds::core::v3::ResourceLocator> cds_resources_locator;
    if (!dyn_resources.cds_resources_locator().empty()) {
      auto url_or_error =
          Config::XdsResourceIdentifier::decodeUrl(dyn_resources.cds_resources_locator());
      RETURN_IF_NOT_OK_REF(url_or_error.status());
      cds_resources_locator =
          std::make_unique<xds::core::v3::ResourceLocator>(std::move(url_or_error.value()));
    }
    // In case cds_config is configured and the new xDS-TP configs are used,
    // then the CdsApi will need to track the resources, as the xDS-TP configs
    // may be used for OD-CDS. If this is not set, the SotW update may override
    // the OD-CDS resources.
    const bool support_multi_ads_sources =
        bootstrap.has_default_config_source() || !bootstrap.config_sources().empty();
    auto cds_or_error = factory_.createCds(dyn_resources.cds_config(), cds_resources_locator.get(),
                                           *this, support_multi_ads_sources);
    RETURN_IF_NOT_OK_REF(cds_or_error.status())
    cds_api_ = std::move(*cds_or_error);
    init_helper_.setCds(cds_api_.get());
  } else {
    init_helper_.setCds(nullptr);
  }

  // Proceed to add all static bootstrap clusters to the init manager. This will immediately
  // initialize any primary clusters. Post-init processing further initializes any thread
  // aware load balancer and sets up the per-worker host set updates.
  for (auto& cluster : active_clusters_) {
    init_helper_.addCluster(*cluster.second);
  }

  // Potentially move to secondary initialization on the static bootstrap clusters if all primary
  // clusters have already initialized. (E.g., if all static).
  init_helper_.onStaticLoadComplete();

  // Initialize the ADS and xDS-TP config based connections.
  if (!has_ads_cluster) {
    // There is no ADS cluster, so we won't be starting the ADS mux after a cluster has finished
    // initializing, so we must start ADS here.
    xds_manager_.adsMux()->start();
  }
  // TODO(adisuissa): to ensure parity with the non-xdstp-config-based ADS
  // we need to change this to only be invoked for Envoy-based clusters when
  // they are ready (this is needed to avoid early connection attempts in the
  // DNS based clusters).
  xds_manager_.startXdstpAdsMuxes();
  return absl::OkStatus();
}
499

            
500
// Kicks off secondary-cluster initialization via the init helper and, if load reporting
// (LRS) is configured in the bootstrap, creates the gRPC client and LoadStatsReporter.
// Returns the first error from transport-version validation or client creation.
absl::Status ClusterManagerImpl::initializeSecondaryClusters(
    const envoy::config::bootstrap::v3::Bootstrap& bootstrap) {
  init_helper_.startInitializingSecondaryClusters();

  const auto& cm_config = bootstrap.cluster_manager();
  if (cm_config.has_load_stats_config()) {
    const auto& load_stats_config = cm_config.load_stats_config();

    absl::Status status = Config::Utility::checkTransportVersion(load_stats_config);
    RETURN_IF_NOT_OK(status);
    absl::StatusOr<Grpc::RawAsyncClientSharedPtr> client_or_error;
    // Behind this runtime flag the client is fetched from (or inserted into) the async client
    // manager's cache; otherwise an uncached client is created per call.
    if (Runtime::runtimeFeatureEnabled("envoy.restart_features.use_cached_grpc_client_for_xds")) {
      absl::StatusOr<Envoy::OptRef<const envoy::config::core::v3::GrpcService>> maybe_grpc_service =
          Envoy::Config::Utility::getGrpcConfigFromApiConfigSource(load_stats_config,
                                                                   /*grpc_service_idx*/ 0,
                                                                   /*xdstp_config_source*/ false);
      RETURN_IF_NOT_OK_REF(maybe_grpc_service.status());
      if (maybe_grpc_service.value().has_value()) {
        client_or_error = async_client_manager_->getOrCreateRawAsyncClientWithHashKey(
            Grpc::GrpcServiceConfigWithHashKey(*maybe_grpc_service.value()), *stats_.rootScope(),
            /*skip_cluster_check*/ false);
      } else {
        return absl::InvalidArgumentError("Invalid grpc service.");
      }
    } else {
      auto factory_or_error = Config::Utility::factoryForGrpcApiConfigSource(
          *async_client_manager_, load_stats_config, *stats_.rootScope(), false, 0, false);
      RETURN_IF_NOT_OK_REF(factory_or_error.status());
      client_or_error = factory_or_error.value()->createUncachedRawAsyncClient();
    }
    RETURN_IF_NOT_OK_REF(client_or_error.status());
    load_stats_reporter_ = std::make_unique<LoadStatsReporterImpl>(
        local_info_, *this, *stats_.rootScope(), std::move(client_or_error.value()), dispatcher_);
  }
  return absl::OkStatus();
}
536

            
537
11012
// Instantiates the cluster-manager stats, all scoped under the "cluster_manager." prefix.
ClusterManagerStats ClusterManagerImpl::generateStats(Stats::Scope& scope) {
  const std::string prefix = "cluster_manager.";
  return {ALL_CLUSTER_MANAGER_STATS(POOL_COUNTER_PREFIX(scope, prefix),
                                    POOL_GAUGE_PREFIX(scope, prefix))};
}
542

            
543
// Instantiates per-worker stats, prefixed with the owning thread's name
// ("thread_local_cluster_manager.<thread_name>").
ThreadLocalClusterManagerStats
ClusterManagerImpl::ThreadLocalClusterManagerImpl::generateStats(Stats::Scope& scope,
                                                                 const std::string& thread_name) {
  const std::string prefix = absl::StrCat("thread_local_cluster_manager.", thread_name);
  return {ALL_THREAD_LOCAL_CLUSTER_MANAGER_STATS(POOL_GAUGE_PREFIX(scope, prefix))};
}
549

            
550
17323
// Called when a cluster has finished initializing (either immediately for
// static/primary clusters, or after warming completes for dynamic ones).
// Promotes the cluster from warming to active if needed, initializes its
// thread-aware load balancer, wires up cross-thread update callbacks, and
// finally pushes the current host sets to all worker threads.
absl::Status ClusterManagerImpl::onClusterInit(ClusterManagerCluster& cm_cluster) {
  // This routine is called when a cluster has finished initializing. The cluster has not yet
  // been setup for cross-thread updates to avoid needless updates during initialization. The order
  // of operations here is important. We start by initializing the thread aware load balancer if
  // needed. This must happen first so cluster updates are heard first by the load balancer.
  // Also, it assures that all of clusters which this function is called should be always active.
  auto& cluster = cm_cluster.cluster();
  auto cluster_data = warming_clusters_.find(cluster.info()->name());
  // We have a situation that clusters will be immediately active, such as static and primary
  // cluster. So we must have this prevention logic here.
  if (cluster_data != warming_clusters_.end()) {
    clusterWarmingToActive(cluster.info()->name());
    updateClusterCounts();
  }
  // After the promotion above the cluster must be in the active map; no end()
  // check is performed because this function is only invoked for clusters that
  // are (now) active — see the comment at the top.
  cluster_data = active_clusters_.find(cluster.info()->name());

  if (cluster_data->second->thread_aware_lb_ != nullptr) {
    RETURN_IF_NOT_OK(cluster_data->second->thread_aware_lb_->initialize());
  }

  // Now setup for cross-thread updates.
  // This is used by cluster types such as EDS clusters to drain the connection pools of removed
  // hosts.
  cluster_data->second->member_update_cb_ = cluster.prioritySet().addMemberUpdateCb(
      [&cluster, this](const HostVector&, const HostVector& hosts_removed) {
        if (cluster.info()->lbConfig().close_connections_on_host_set_change()) {
          for (const auto& host_set : cluster.prioritySet().hostSetsPerPriority()) {
            // This will drain all tcp and http connection pools.
            postThreadLocalRemoveHosts(cluster, host_set->hosts());
          }
        } else {
          // TODO(snowp): Should this be subject to merge windows?

          // Whenever hosts are removed from the cluster, we make each TLS cluster drain it's
          // connection pools for the removed hosts. If `close_connections_on_host_set_change` is
          // enabled, this case will be covered by first `if` statement, where all
          // connection pools are drained.
          if (!hosts_removed.empty()) {
            postThreadLocalRemoveHosts(cluster, hosts_removed);
          }
        }
      });

  // This is used by cluster types such as EDS clusters to update the cluster
  // without draining the cluster.
  cluster_data->second->priority_update_cb_ = cluster.prioritySet().addPriorityUpdateCb(
      [&cm_cluster, this](uint32_t priority, const HostVector& hosts_added,
                          const HostVector& hosts_removed) {
        // This fires when a cluster is about to have an updated member set. We need to send this
        // out to all of the thread local configurations.

        // Should we save this update and merge it with other updates?
        //
        // Note that we can only _safely_ merge updates that have no added/removed hosts. That is,
        // only those updates that signal a change in host healthcheck state, weight or metadata.
        //
        // We've discussed merging updates related to hosts being added/removed, but it's really
        // tricky to merge those given that downstream consumers of these updates expect to see the
        // full list of updates, not a condensed one. This is because they use the broadcasted
        // HostSharedPtrs within internal maps to track hosts. If we fail to broadcast the entire
        // list of removals, these maps will leak those HostSharedPtrs.
        //
        // See https://github.com/envoyproxy/envoy/pull/3941 for more context.
        bool scheduled = false;
        const auto merge_timeout = PROTOBUF_GET_MS_OR_DEFAULT(
            cm_cluster.cluster().info()->lbConfig(), update_merge_window, 1000);
        // Remember: we only merge updates with no adds/removes — just hc/weight/metadata changes.
        const bool is_mergeable = hosts_added.empty() && hosts_removed.empty();

        if (merge_timeout > 0) {
          // If this is not mergeable, we should cancel any scheduled updates since
          // we'll deliver it immediately.
          scheduled = scheduleUpdate(cm_cluster, priority, is_mergeable, merge_timeout);
        }

        // If an update was not scheduled for later, deliver it immediately.
        if (!scheduled) {
          cm_stats_.cluster_updated_.inc();
          postThreadLocalClusterUpdate(
              cm_cluster, ThreadLocalClusterUpdateParams(priority, hosts_added, hosts_removed));
        }
      });

  // Finally, post updates cross-thread so the per-thread load balancers are ready. First we
  // populate any update information that may be available after cluster init.
  ThreadLocalClusterUpdateParams params;
  for (auto& host_set : cluster.prioritySet().hostSetsPerPriority()) {
    if (host_set->hosts().empty()) {
      continue;
    }
    // Initial sync: all current hosts are "added"; nothing is removed yet.
    params.per_priority_update_params_.emplace_back(host_set->priority(), host_set->hosts(),
                                                    HostVector{});
  }
  // NOTE: In all cases *other* than the local cluster, this is when a cluster is added/updated
  // The local cluster must currently be statically defined and must exist prior to other
  // clusters being added/updated. We could gate the below update on hosts being available on
  // the cluster or the cluster not already existing, but the special logic is not worth it.
  postThreadLocalClusterUpdate(cm_cluster, std::move(params));
  return absl::OkStatus();
}
650

            
651
// Decides whether an update for `cluster`/`priority` should be absorbed into a
// merge window. Returns true when the update was scheduled for later (merged)
// delivery via a timer, false when the caller should deliver it immediately
// (non-mergeable update, or the merge window has already elapsed).
bool ClusterManagerImpl::scheduleUpdate(ClusterManagerCluster& cluster, uint32_t priority,
                                        bool mergeable, const uint64_t timeout) {
  // Find pending updates for this cluster.
  auto& updates_by_prio = updates_map_[cluster.cluster().info()->name()];
  if (!updates_by_prio) {
    updates_by_prio = std::make_unique<PendingUpdatesByPriorityMap>();
  }

  // Find pending updates for this priority.
  auto& updates = (*updates_by_prio)[priority];
  if (!updates) {
    updates = std::make_unique<PendingUpdates>();
  }

  // Has an update_merge_window gone by since the last update? If so, don't schedule
  // the update so it can be applied immediately. Ditto if this is not a mergeable update.
  const auto delta = time_source_.monotonicTime() - updates->last_updated_;
  const uint64_t delta_ms = std::chrono::duration_cast<std::chrono::milliseconds>(delta).count();
  const bool out_of_merge_window = delta_ms > timeout;
  if (out_of_merge_window || !mergeable) {
    // If there was a pending update, we cancel the pending merged update.
    //
    // Note: it's possible that even though we are outside of a merge window (delta_ms > timeout),
    // a timer is enabled. This race condition is fine, since we'll disable the timer here and
    // deliver the update immediately.

    // Why wasn't the update scheduled for later delivery? We keep some stats that are helpful
    // to understand why merging did not happen. There's 2 things we are tracking here:

    // 1) Was this update out of a merge window?
    if (mergeable && out_of_merge_window) {
      cm_stats_.update_out_of_merge_window_.inc();
    }

    // 2) Were there previous updates that we are cancelling (and delivering immediately)?
    if (updates->disableTimer()) {
      cm_stats_.update_merge_cancelled_.inc();
    }

    updates->last_updated_ = time_source_.monotonicTime();
    return false;
  }

  // If there's no timer, create one.
  // NOTE(review): the timer callback captures `updates` — a reference to the
  // unique_ptr slot inside the per-priority map — and `cluster` by reference.
  // This assumes the map slot and the cluster outlive the timer; the cluster
  // teardown paths erase the `updates_map_` entry (see clusterWarmingToActive
  // and removeCluster), which destroys the timer — confirm all paths do so.
  if (updates->timer_ == nullptr) {
    updates->timer_ = dispatcher_.createTimer([this, &cluster, priority, &updates]() -> void {
      applyUpdates(cluster, priority, *updates);
    });
  }

  // Ensure there's a timer set to deliver these updates.
  if (!updates->timer_->enabled()) {
    updates->enableTimer(timeout);
  }

  return true;
}
708

            
709
// Timer callback for a pending merged update (see scheduleUpdate): broadcasts
// the accumulated health/weight/metadata-only change for `priority` to all
// worker threads and stamps the delivery time.
void ClusterManagerImpl::applyUpdates(ClusterManagerCluster& cluster, uint32_t priority,
                                      PendingUpdates& updates) {
  // Deliver pending updates.

  // Remember that these merged updates are _only_ for updates related to
  // HC/weight/metadata changes. That's why added/removed are empty. All
  // adds/removals were already immediately broadcasted.
  // NOTE(review): these are function-local statics, presumably so the params
  // object may safely reference them beyond this frame — confirm whether
  // ThreadLocalClusterUpdateParams stores references or copies.
  static const HostVector hosts_added;
  static const HostVector hosts_removed;

  postThreadLocalClusterUpdate(
      cluster, ThreadLocalClusterUpdateParams(priority, hosts_added, hosts_removed));

  cm_stats_.cluster_updated_via_merge_.inc();
  updates.last_updated_ = time_source_.monotonicTime();
}
725

            
726
// Adds a new dynamic cluster or updates an existing one (CDS path).
// Returns false when the update is blocked because the config hash matches the
// existing warming/active cluster of the same name (a no-op), true when the
// cluster was loaded into the warming map, or an error status when the config
// could not be loaded.
absl::StatusOr<bool>
ClusterManagerImpl::addOrUpdateCluster(const envoy::config::cluster::v3::Cluster& cluster,
                                       const std::string& version_info,
                                       const bool avoid_cds_removal) {
  // First we need to see if this new config is new or an update to an existing dynamic cluster.
  // We don't allow updates to statically configured clusters in the main configuration. We check
  // both the warming clusters and the active clusters to see if we need an update or the update
  // should be blocked.
  const std::string& cluster_name = cluster.name();
  const auto existing_active_cluster = active_clusters_.find(cluster_name);
  const auto existing_warming_cluster = warming_clusters_.find(cluster_name);
  const uint64_t new_hash = MessageUtil::hash(cluster);
  if (existing_warming_cluster != warming_clusters_.end()) {
    // If the cluster is the same as the warming cluster of the same name, block the update.
    if (existing_warming_cluster->second->blockUpdate(new_hash)) {
      return false;
    }
    // NB: https://github.com/envoyproxy/envoy/issues/14598
    // Always proceed if the cluster is different from the existing warming cluster.
  } else if (existing_active_cluster != active_clusters_.end() &&
             existing_active_cluster->second->blockUpdate(new_hash)) {
    // If there's no warming cluster of the same name, and if the cluster is the same as the active
    // cluster of the same name, block the update.
    return false;
  }

  if (existing_active_cluster != active_clusters_.end() ||
      existing_warming_cluster != warming_clusters_.end()) {
    if (existing_active_cluster != active_clusters_.end()) {
      // The following init manager remove call is a NOP in the case we are already initialized.
      // It's just kept here to avoid additional logic.
      init_helper_.removeCluster(*existing_active_cluster->second);
    }
    cm_stats_.cluster_modified_.inc();
  } else {
    cm_stats_.cluster_added_.inc();
  }

  // There are two discrete paths here depending on when we are adding/updating a cluster.
  // 1) During initial server load we use the init manager which handles complex logic related to
  //    primary/secondary init, static/CDS init, warming all clusters, etc.
  // 2) After initial server load, we handle warming independently for each cluster in the warming
  //    map.
  // Note: It's likely possible that all warming logic could be centralized in the init manager, but
  //       a decision was made to split the logic given how complex the init manager already is. In
  //       the future we may decide to undergo a refactor to unify the logic but the effort/risk to
  //       do that right now does not seem worth it given that the logic is generally pretty clean
  //       and easy to understand.
  const bool all_clusters_initialized =
      init_helper_.state() == ClusterManagerInitHelper::State::AllClustersInitialized;
  // Preserve the previous cluster data to avoid early destroy. The same cluster should be added
  // before destroy to avoid early initialization complete.
  auto status_or_cluster =
      loadCluster(cluster, new_hash, version_info, /*added_via_api=*/true,
                  /*required_for_ads=*/false, warming_clusters_, avoid_cds_removal);
  RETURN_IF_NOT_OK_REF(status_or_cluster.status());
  const ClusterDataPtr previous_cluster = std::move(status_or_cluster.value());
  auto& cluster_entry = warming_clusters_.at(cluster_name);
  cluster_entry->cluster_->info()->configUpdateStats().warming_state_.set(1);
  if (!all_clusters_initialized) {
    ENVOY_LOG(debug, "add/update cluster {} during init", cluster_name);
    init_helper_.addCluster(*cluster_entry);
  } else {
    ENVOY_LOG(debug, "add/update cluster {} starting warming", cluster_name);
    // Warming completion re-resolves the map entry by name rather than
    // capturing the entry, since the entry may have been replaced meanwhile.
    cluster_entry->cluster_->initialize([this, cluster_name] {
      ENVOY_LOG(debug, "warming cluster {} complete", cluster_name);
      auto state_changed_cluster_entry = warming_clusters_.find(cluster_name);
      state_changed_cluster_entry->second->cluster_->info()->configUpdateStats().warming_state_.set(
          0);
      return onClusterInit(*state_changed_cluster_entry->second);
    });
  }

  return true;
}
801

            
802
1550
void ClusterManagerImpl::clusterWarmingToActive(const std::string& cluster_name) {
803
1550
  auto warming_it = warming_clusters_.find(cluster_name);
804
1550
  ASSERT(warming_it != warming_clusters_.end());
805

            
806
  // If the cluster is being updated, we need to cancel any pending merged updates.
807
  // Otherwise, applyUpdates() will fire with a dangling cluster reference.
808
1550
  updates_map_.erase(cluster_name);
809

            
810
1550
  active_clusters_[cluster_name] = std::move(warming_it->second);
811
1550
  warming_clusters_.erase(warming_it);
812
1550
}
813

            
814
1774
// Removes a dynamically added (added_via_api_) cluster by name from both the
// active and warming maps. Clusters flagged avoid_cds_removal_ are only
// removed when `remove_ignored` is true. Returns true if anything was removed.
bool ClusterManagerImpl::removeCluster(const std::string& cluster_name, const bool remove_ignored) {
  bool removed = false;
  auto existing_active_cluster = active_clusters_.find(cluster_name);
  if (existing_active_cluster != active_clusters_.end() &&
      existing_active_cluster->second->added_via_api_ &&
      (!existing_active_cluster->second->avoid_cds_removal_ || remove_ignored)) {
    removed = true;
    init_helper_.removeCluster(*existing_active_cluster->second);
    active_clusters_.erase(existing_active_cluster);

    ENVOY_LOG(debug, "removing cluster {}", cluster_name);
    // Tear down the per-worker state: notify update callbacks, then erase the
    // thread-local (and deferred) entries on every worker thread.
    tls_.runOnAllThreads([cluster_name](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
      ASSERT(cluster_manager->thread_local_clusters_.contains(cluster_name) ||
             cluster_manager->thread_local_deferred_clusters_.contains(cluster_name));
      ENVOY_LOG(debug, "removing TLS cluster {}", cluster_name);
      for (auto cb_it = cluster_manager->update_callbacks_.begin();
           cb_it != cluster_manager->update_callbacks_.end();) {
        // The current callback may remove itself from the list, so a handle for
        // the next item is fetched before calling the callback.
        auto curr_cb_it = cb_it;
        ++cb_it;
        (*curr_cb_it)->onClusterRemoval(cluster_name);
      }
      cluster_manager->thread_local_clusters_.erase(cluster_name);
      cluster_manager->thread_local_deferred_clusters_.erase(cluster_name);
      cluster_manager->local_stats_.clusters_inflated_.set(
          cluster_manager->thread_local_clusters_.size());
    });
    cluster_initialization_map_.erase(cluster_name);
  }

  // The cluster may also (or only) exist in the warming map; apply the same
  // added-via-api / avoid-removal rules there.
  auto existing_warming_cluster = warming_clusters_.find(cluster_name);
  if (existing_warming_cluster != warming_clusters_.end() &&
      existing_warming_cluster->second->added_via_api_ &&
      (!existing_warming_cluster->second->avoid_cds_removal_ || remove_ignored)) {
    removed = true;
    init_helper_.removeCluster(*existing_warming_cluster->second);
    warming_clusters_.erase(existing_warming_cluster);
    ENVOY_LOG(info, "removing warming cluster {}", cluster_name);
  }

  if (removed) {
    cm_stats_.cluster_removed_.inc();
    updateClusterCounts();
    // Cancel any pending merged updates.
    updates_map_.erase(cluster_name);
  }

  return removed;
}
864

            
865
// Builds a Cluster (plus its optional thread-aware load balancer) from the
// proto config and inserts or replaces it in `cluster_map`. On replacement,
// returns the previous ClusterData so the caller controls its destruction
// order; returns nullptr for a brand-new entry. Returns an error status for
// invalid configs (duplicate static cluster, LB policy mismatch, factory
// failure).
absl::StatusOr<ClusterManagerImpl::ClusterDataPtr>
ClusterManagerImpl::loadCluster(const envoy::config::cluster::v3::Cluster& cluster,
                                const uint64_t cluster_hash, const std::string& version_info,
                                bool added_via_api, const bool required_for_ads,
                                ClusterMap& cluster_map, const bool avoid_cds_removal) {
  absl::StatusOr<std::pair<ClusterSharedPtr, ThreadAwareLoadBalancerPtr>>
      new_cluster_pair_or_error =
          factory_.clusterFromProto(cluster, outlier_event_logger_, added_via_api);

  if (!new_cluster_pair_or_error.ok()) {
    return absl::InvalidArgumentError(std::string(new_cluster_pair_or_error.status().message()));
  }
  auto& new_cluster = new_cluster_pair_or_error->first;
  auto& lb = new_cluster_pair_or_error->second;
  Cluster& cluster_reference = *new_cluster;

  const auto cluster_info = cluster_reference.info();

  // Duplicate names are only rejected for statically configured clusters;
  // API-driven (CDS) loads legitimately replace an existing entry below.
  if (!added_via_api) {
    if (cluster_map.find(cluster_info->name()) != cluster_map.end()) {
      return absl::InvalidArgumentError(
          fmt::format("cluster manager: duplicate cluster '{}'", cluster_info->name()));
    }
  }

  // Check if the cluster provided load balancing policy is used. We need handle it as special
  // case.
  TypedLoadBalancerFactory& typed_lb_factory = cluster_info->loadBalancerFactory();
  const bool cluster_provided_lb =
      typed_lb_factory.name() == "envoy.load_balancing_policies.cluster_provided";

  // The "cluster provided" LB policy and the cluster actually supplying an LB
  // must agree in both directions.
  if (cluster_provided_lb && lb == nullptr) {
    return absl::InvalidArgumentError(
        fmt::format("cluster manager: cluster provided LB specified but cluster "
                    "'{}' did not provide one. Check cluster documentation.",
                    cluster_info->name()));
  }
  if (!cluster_provided_lb && lb != nullptr) {
    return absl::InvalidArgumentError(
        fmt::format("cluster manager: cluster provided LB not specified but cluster "
                    "'{}' provided one. Check cluster documentation.",
                    cluster_info->name()));
  }

  // Propagate active health-check failures to all worker threads so they stop
  // using the failed host's connections.
  if (new_cluster->healthChecker() != nullptr) {
    new_cluster->healthChecker()->addHostCheckCompleteCb(
        [this](HostSharedPtr host, HealthTransition changed_state, HealthState) {
          if (changed_state == HealthTransition::Changed &&
              host->healthFlagGet(Host::HealthFlag::FAILED_ACTIVE_HC)) {
            postThreadLocalHealthFailure(host);
          }
        });
  }

  // Likewise for outlier-detection ejections.
  if (new_cluster->outlierDetector() != nullptr) {
    new_cluster->outlierDetector()->addChangedStateCb([this](HostSharedPtr host) {
      if (host->healthFlagGet(Host::HealthFlag::FAILED_OUTLIER_CHECK)) {
        ENVOY_LOG_EVENT(debug, "outlier_detection_ejection",
                        "host {} in cluster {} was ejected by the outlier detector",
                        host->address()->asStringView(), host->cluster().name());
        postThreadLocalHealthFailure(host);
      }
    });
  }
  ClusterDataPtr result;
  auto cluster_entry_it = cluster_map.find(cluster_info->name());
  if (cluster_entry_it != cluster_map.end()) {
    // Replacement: swap the new ClusterData in and hand the old one back to the
    // caller so it is not destroyed prematurely.
    result = std::exchange(cluster_entry_it->second,
                           std::make_unique<ClusterData>(
                               cluster, cluster_hash, version_info, added_via_api, required_for_ads,
                               std::move(new_cluster), time_source_, avoid_cds_removal));
  } else {
    bool inserted = false;
    std::tie(cluster_entry_it, inserted) = cluster_map.emplace(
        cluster_info->name(),
        std::make_unique<ClusterData>(cluster, cluster_hash, version_info, added_via_api,
                                      required_for_ads, std::move(new_cluster), time_source_,
                                      avoid_cds_removal));
    ASSERT(inserted);
  }

  // Install the thread-aware LB: either the one the cluster provided, or one
  // built from the configured load balancing policy.
  if (cluster_provided_lb) {
    cluster_entry_it->second->thread_aware_lb_ = std::move(lb);
  } else {
    cluster_entry_it->second->thread_aware_lb_ =
        typed_lb_factory.create(cluster_info->loadBalancerConfig(), *cluster_info,
                                cluster_reference.prioritySet(), runtime_, random_, time_source_);
  }

  updateClusterCounts();
  return result;
}
957

            
958
41376
void ClusterManagerImpl::updateClusterCounts() {
959
  // This if/else block implements a control flow mechanism that can be used by an ADS
960
  // implementation to properly sequence CDS and RDS updates. It is not enforcing on ADS. ADS can
961
  // use it to detect when a previously sent cluster becomes warm before sending routes that depend
962
  // on it. This can improve incidence of HTTP 503 responses from Envoy when a route is used before
963
  // it's supporting cluster is ready.
964
  //
965
  // We achieve that by leaving CDS in the paused state as long as there is at least
966
  // one cluster in the warming state. This prevents CDS ACK from being sent to ADS.
967
  // Once cluster is warmed up, CDS is resumed, and ACK is sent to ADS, providing a
968
  // signal to ADS to proceed with RDS updates.
969
  // If we're in the middle of shutting down (ads_mux_ already gone) then this is irrelevant.
970
41376
  const bool all_clusters_initialized =
971
41376
      init_helper_.state() == ClusterManagerInitHelper::State::AllClustersInitialized;
972
41376
  if (all_clusters_initialized && xds_manager_.adsMux()) {
973
2431
    const auto type_url = Config::getTypeUrl<envoy::config::cluster::v3::Cluster>();
974
2431
    if (resume_cds_ == nullptr && !warming_clusters_.empty()) {
975
904
      resume_cds_ = xds_manager_.pause(type_url);
976
1535
    } else if (warming_clusters_.empty()) {
977
1429
      resume_cds_.reset();
978
1429
    }
979
2431
  }
980
41376
  cm_stats_.active_clusters_.set(active_clusters_.size());
981
41376
  cm_stats_.warming_clusters_.set(warming_clusters_.size());
982
41376
}
983

            
984
161380
// Looks up the named cluster in this worker's thread-local map, falling back
// to inline initialization (e.g. for a deferred cluster) when not yet
// materialized. Returns nullptr if the cluster does not exist at all.
ThreadLocalCluster* ClusterManagerImpl::getThreadLocalCluster(absl::string_view cluster) {
  ThreadLocalClusterManagerImpl& tls_cm = *tls_;

  // Fast path: the cluster has already been materialized on this thread.
  if (const auto it = tls_cm.thread_local_clusters_.find(cluster);
      it != tls_cm.thread_local_clusters_.end()) {
    return it->second.get();
  }
  // Slow path: build the cluster inline if it exists but is not yet set up on
  // this thread; otherwise this returns nullptr.
  return tls_cm.initializeClusterInlineIfExists(cluster);
}
994

            
995
void ClusterManagerImpl::maybePreconnect(
996
    ThreadLocalClusterManagerImpl::ClusterEntry& cluster_entry,
997
    const ClusterConnectivityState& state,
998
49533
    std::function<ConnectionPool::Instance*()> pick_preconnect_pool) {
999
49533
  auto peekahead_ratio = cluster_entry.info()->peekaheadRatio();
49533
  if (peekahead_ratio <= 1.0) {
49450
    return;
49450
  }
  // 3 here is arbitrary. Just as in ConnPoolImplBase::tryCreateNewConnections
  // we want to limit the work which can be done on any given preconnect attempt.
186
  for (int i = 0; i < 3; ++i) {
    // See if adding this one new connection
    // would put the cluster over desired capacity. If so, stop preconnecting.
    //
    // We anticipate the incoming stream here, because maybePreconnect is called
    // before a new stream is established.
183
    if (!ConnectionPool::ConnPoolImplBase::shouldConnect(
183
            state.pending_streams_, state.active_streams_,
183
            state.connecting_and_connected_stream_capacity_, peekahead_ratio, true)) {
53
      return;
53
    }
130
    ConnectionPool::Instance* preconnect_pool = pick_preconnect_pool();
130
    if (!preconnect_pool || !preconnect_pool->maybePreconnect(peekahead_ratio)) {
      // Given that the next preconnect pick may be entirely different, we could
      // opt to try again even if the first preconnect fails. Err on the side of
      // caution and wait for the next attempt.
27
      return;
27
    }
130
  }
83
}
// Returns HTTP pool data for `host` (creating the pool on first use), or
// nullopt when no pool could be obtained. The returned HttpPoolData carries a
// callback that triggers preconnecting whenever a new stream is established.
absl::optional<HttpPoolData>
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::httpConnPool(
    HostConstSharedPtr host, ResourcePriority priority, absl::optional<Http::Protocol> protocol,
    LoadBalancerContext* context) {
  // Select a host and create a connection pool for it if it does not already exist.
  auto pool = httpConnPoolImpl(host, priority, protocol, context);
  if (pool == nullptr) {
    return absl::nullopt;
  }
  HttpPoolData data(
      [this, priority, protocol, context]() -> void {
        // Now that a new stream is being established, attempt to preconnect.
        // The inner lambda captures the outer lambda's by-value captures by
        // reference; this is safe because maybePreconnect invokes it
        // synchronously within this call.
        maybePreconnect(
            *this, parent_.cluster_manager_state_, [this, &priority, &protocol, &context]() {
              HostConstSharedPtr peek_host = peekAnotherHost(context);
              return peek_host ? httpConnPoolImpl(peek_host, priority, protocol, context) : nullptr;
            });
      },
      pool);
  return data;
}
// Returns TCP pool data for `host` (creating the pool on first use), or
// nullopt when no host is given or no pool could be obtained. As with
// httpConnPool, the returned TcpPoolData carries a preconnect callback fired
// when a new connection/stream is established.
absl::optional<TcpPoolData>
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::tcpConnPool(
    HostConstSharedPtr host, ResourcePriority priority, LoadBalancerContext* context) {
  if (!host) {
    return absl::nullopt;
  }
  // Select a host and create a connection pool for it if it does not already exist.
  auto pool = tcpConnPoolImpl(host, priority, context);
  if (pool == nullptr) {
    return absl::nullopt;
  }
  TcpPoolData data(
      [this, priority, context]() -> void {
        // The inner lambda captures the outer lambda's by-value captures by
        // reference; safe because maybePreconnect invokes it synchronously.
        maybePreconnect(*this, parent_.cluster_manager_state_, [this, &priority, &context]() {
          HostConstSharedPtr peek_host = peekAnotherHost(context);
          return peek_host ? tcpConnPoolImpl(peek_host, priority, context) : nullptr;
        });
      },
      pool);
  return data;
}
// Convenience overload: synchronously pick a host via the load balancer, then
// delegate to the host-specific tcpConnPool. Returns nullopt if no host could
// be selected.
absl::optional<TcpPoolData>
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::tcpConnPool(
    ResourcePriority priority, LoadBalancerContext* context) {
  HostConstSharedPtr selected =
      LoadBalancer::onlyAllowSynchronousHostSelection(chooseHost(context));
  if (selected == nullptr) {
    return absl::nullopt;
  }
  return tcpConnPool(selected, priority, context);
}
void ClusterManagerImpl::drainConnections(const std::string& cluster,
35
                                          DrainConnectionsHostPredicate predicate) {
35
  ENVOY_LOG_EVENT(debug, "drain_connections_call", "drainConnections called for cluster {}",
35
                  cluster);
68
  tls_.runOnAllThreads([cluster, predicate](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
68
    auto cluster_entry = cluster_manager->thread_local_clusters_.find(cluster);
68
    if (cluster_entry != cluster_manager->thread_local_clusters_.end()) {
68
      cluster_entry->second->drainConnPools(
68
          predicate, ConnectionPool::DrainBehavior::DrainExistingConnections);
68
    }
68
  });
35
}
void ClusterManagerImpl::drainConnections(DrainConnectionsHostPredicate predicate,
11
                                          ConnectionPool::DrainBehavior drain_behavior) {
11
  ENVOY_LOG_EVENT(debug, "drain_connections_call_for_all_clusters",
11
                  "drainConnections called for all clusters");
11
  tls_.runOnAllThreads(
22
      [predicate, drain_behavior](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
44
        for (const auto& cluster_entry : cluster_manager->thread_local_clusters_) {
44
          cluster_entry.second->drainConnPools(predicate, drain_behavior);
44
        }
22
      });
11
}
380
// Validates that `cluster` names an active, statically configured cluster —
// the requirement for gRPC client clusters. Returns InvalidArgumentError
// otherwise.
absl::Status ClusterManagerImpl::checkActiveStaticCluster(const std::string& cluster) {
  const auto entry = active_clusters_.find(cluster);
  // The cluster must be known and active...
  if (entry == active_clusters_.end()) {
    return absl::InvalidArgumentError(fmt::format("Unknown gRPC client cluster '{}'", cluster));
  }
  // ...and must come from the bootstrap config rather than the API.
  if (entry->second->added_via_api_) {
    return absl::InvalidArgumentError(
        fmt::format("gRPC client cluster '{}' is not static", cluster));
  }
  return absl::OkStatus();
}
void ClusterManagerImpl::postThreadLocalRemoveHosts(const Cluster& cluster,
74
                                                    const HostVector& hosts_removed) {
  // Drain the connection pools for the given hosts. For deferred clusters have
  // been created.
74
  tls_.runOnAllThreads([name = cluster.info()->name(),
128
                        hosts_removed](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
128
    cluster_manager->removeHosts(name, hosts_removed);
128
  });
74
}
bool ClusterManagerImpl::deferralIsSupportedForCluster(
17736
    const ClusterInfoConstSharedPtr& info) const {
17736
  if (!deferred_cluster_creation_) {
17203
    return false;
17203
  }
  // Certain cluster types are unsupported for deferred initialization.
  // We need to check both the `clusterType()` (preferred) falling back to
  // the `type()` due to how custom clusters were added leveraging an any
  // config.
533
  if (auto custom_cluster_type = info->clusterType(); custom_cluster_type.has_value()) {
    // TODO(kbaichoo): make it configurable what custom types are supported?
18
    static const std::array<std::string, 4> supported_well_known_cluster_types = {
18
        "envoy.clusters.aggregate", "envoy.cluster.eds", "envoy.clusters.redis",
18
        "envoy.cluster.static"};
18
    if (std::find(supported_well_known_cluster_types.begin(),
18
                  supported_well_known_cluster_types.end(),
18
                  custom_cluster_type->name()) == supported_well_known_cluster_types.end()) {
      return false;
    }
515
  } else {
    // Check DiscoveryType instead.
515
    static constexpr std::array<envoy::config::cluster::v3::Cluster::DiscoveryType, 2>
515
        supported_cluster_types = {envoy::config::cluster::v3::Cluster::EDS,
515
                                   envoy::config::cluster::v3::Cluster::STATIC};
515
    if (std::find(supported_cluster_types.begin(), supported_cluster_types.end(), info->type()) ==
515
        supported_cluster_types.end()) {
13
      return false;
13
    }
515
  }
520
  return true;
533
}
// Publishes a cluster add/update from the main thread to every worker's
// ThreadLocalClusterManagerImpl. On workers where deferred creation applies,
// only the ClusterInitializationObject is stored; otherwise the thread-local
// ClusterEntry is created/updated and membership callbacks fire. Finally,
// starts the ADS mux if it was waiting on this cluster.
void ClusterManagerImpl::postThreadLocalClusterUpdate(ClusterManagerCluster& cm_cluster,
                                                      ThreadLocalClusterUpdateParams&& params) {
  // Only the first post for a cluster (re)installs the thread-local entry;
  // later posts are pure membership updates.
  bool add_or_update_cluster = false;
  if (!cm_cluster.addedOrUpdated()) {
    add_or_update_cluster = true;
    cm_cluster.setAddedOrUpdated();
  }
  // The LB factory is only shipped to workers when the entry is (re)created.
  LoadBalancerFactorySharedPtr load_balancer_factory;
  if (add_or_update_cluster) {
    load_balancer_factory = cm_cluster.loadBalancerFactory();
  }
  // Snapshot per-priority host-set state on the main thread so workers can
  // apply it without reading main-thread-owned structures.
  for (auto& per_priority : params.per_priority_update_params_) {
    const auto& host_set =
        cm_cluster.cluster().prioritySet().hostSetsPerPriority()[per_priority.priority_];
    per_priority.update_hosts_params_ = HostSetImpl::updateHostsParams(*host_set);
    per_priority.locality_weights_ = host_set->localityWeights();
    per_priority.weighted_priority_health_ = host_set->weightedPriorityHealth();
    per_priority.overprovisioning_factor_ = host_set->overprovisioningFactor();
  }
  HostMapConstSharedPtr host_map = cm_cluster.cluster().prioritySet().crossPriorityHostMap();
  // The cluster now exists, so any pending on-demand discovery for it is done.
  pending_cluster_creations_.erase(cm_cluster.cluster().info()->name());
  const UnitFloat drop_overload = cm_cluster.cluster().dropOverload();
  const std::string drop_category = cm_cluster.cluster().dropCategory();
  // Populate the cluster initialization object based on this update. Returns
  // nullptr when deferral is unsupported for this cluster.
  ClusterInitializationObjectConstSharedPtr cluster_initialization_object =
      addOrUpdateClusterInitializationObjectIfSupported(params, cm_cluster.cluster().info(),
                                                        load_balancer_factory, host_map,
                                                        drop_overload, drop_category);
  // NOTE(review): `drop_category` is const, so this std::move degrades to a copy.
  tls_.runOnAllThreads([info = cm_cluster.cluster().info(), params = std::move(params),
                        add_or_update_cluster, load_balancer_factory, map = std::move(host_map),
                        cluster_initialization_object = std::move(cluster_initialization_object),
                        drop_overload, drop_category = std::move(drop_category)](
                           OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
    ASSERT(cluster_manager.has_value(),
           "Expected the ThreadLocalClusterManager to be set during ClusterManagerImpl creation.");
    // From here on we operate on the calling worker's thread-local manager.
    // Defer only when a CIO exists, the cluster is not already inflated on
    // this worker, and we are not on the main thread.
    if (const bool defer_unused_clusters =
            cluster_initialization_object != nullptr &&
            !cluster_manager->thread_local_clusters_.contains(info->name()) &&
            !Envoy::Thread::MainThread::isMainThread();
        defer_unused_clusters) {
      // Save the cluster initialization object.
      ENVOY_LOG(debug, "Deferring add or update for TLS cluster {}", info->name());
      cluster_manager->thread_local_deferred_clusters_[info->name()] =
          cluster_initialization_object;
      // Invoke similar logic of onClusterAddOrUpdate.
      ThreadLocalClusterCommand command = [&cluster_manager,
                                           cluster_name = info->name()]() -> ThreadLocalCluster& {
        // If we have multiple callbacks only the first one needs to use the
        // command to initialize the cluster.
        auto existing_cluster_entry = cluster_manager->thread_local_clusters_.find(cluster_name);
        if (existing_cluster_entry != cluster_manager->thread_local_clusters_.end()) {
          return *existing_cluster_entry->second;
        }
        auto* cluster_entry = cluster_manager->initializeClusterInlineIfExists(cluster_name);
        ASSERT(cluster_entry != nullptr, "Deferred clusters initiailization should not fail.");
        return *cluster_entry;
      };
      for (auto cb_it = cluster_manager->update_callbacks_.begin();
           cb_it != cluster_manager->update_callbacks_.end();) {
        // The current callback may remove itself from the list, so a handle for
        // the next item is fetched before calling the callback.
        auto curr_cb_it = cb_it;
        ++cb_it;
        (*curr_cb_it)->onClusterAddOrUpdate(info->name(), command);
      }
    } else {
      // Broadcast: inflate/update the thread-local cluster entry eagerly.
      ThreadLocalClusterManagerImpl::ClusterEntry* new_cluster = nullptr;
      if (add_or_update_cluster) {
        if (cluster_manager->thread_local_clusters_.contains(info->name())) {
          ENVOY_LOG(debug, "updating TLS cluster {}", info->name());
        } else {
          ENVOY_LOG(debug, "adding TLS cluster {}", info->name());
        }
        new_cluster = new ThreadLocalClusterManagerImpl::ClusterEntry(*cluster_manager, info,
                                                                      load_balancer_factory);
        cluster_manager->thread_local_clusters_[info->name()].reset(new_cluster);
        cluster_manager->local_stats_.clusters_inflated_.set(
            cluster_manager->thread_local_clusters_.size());
      }
      if (cluster_manager->thread_local_clusters_[info->name()]) {
        cluster_manager->thread_local_clusters_[info->name()]->setDropOverload(drop_overload);
        cluster_manager->thread_local_clusters_[info->name()]->setDropCategory(drop_category);
      }
      for (const auto& per_priority : params.per_priority_update_params_) {
        cluster_manager->updateClusterMembership(
            info->name(), per_priority.priority_, per_priority.update_hosts_params_,
            per_priority.locality_weights_, per_priority.hosts_added_, per_priority.hosts_removed_,
            per_priority.weighted_priority_health_, per_priority.overprovisioning_factor_, map);
      }
      // Only notify callbacks when a new entry was actually installed above.
      if (new_cluster != nullptr) {
        ThreadLocalClusterCommand command = [&new_cluster]() -> ThreadLocalCluster& {
          return *new_cluster;
        };
        for (auto cb_it = cluster_manager->update_callbacks_.begin();
             cb_it != cluster_manager->update_callbacks_.end();) {
          // The current callback may remove itself from the list, so a handle for
          // the next item is fetched before calling the callback.
          auto curr_cb_it = cb_it;
          ++cb_it;
          (*curr_cb_it)->onClusterAddOrUpdate(info->name(), command);
        }
      }
    }
  });
  // By this time, the main thread has received the cluster initialization update, so we can start
  // the ADS mux if the ADS mux is dependent on this cluster's initialization.
  if (cm_cluster.requiredForAds() && !ads_mux_initialized_) {
    xds_manager_.adsMux()->start();
    ads_mux_initialized_ = true;
  }
}
// Creates (or merges into) the main-thread ClusterInitializationObject for a
// cluster that supports deferred initialization. Returns nullptr when deferral
// is unsupported, otherwise the object that workers will store until first use.
ClusterManagerImpl::ClusterInitializationObjectConstSharedPtr
ClusterManagerImpl::addOrUpdateClusterInitializationObjectIfSupported(
    const ThreadLocalClusterUpdateParams& params, ClusterInfoConstSharedPtr cluster_info,
    LoadBalancerFactorySharedPtr load_balancer_factory, HostMapConstSharedPtr map,
    UnitFloat drop_overload, absl::string_view drop_category) {
  if (!deferralIsSupportedForCluster(cluster_info)) {
    return nullptr;
  }
  // Safe after the std::move below: the string lives inside the ClusterInfo
  // object, whose ownership is transferred, not destroyed.
  const std::string& cluster_name = cluster_info->name();
  auto entry = cluster_initialization_map_.find(cluster_name);
  // TODO(kbaichoo): if EDS can be configured via cluster_type() then modify the
  // merging logic below.
  //
  // This method may be called multiple times to create multiple ClusterInitializationObject
  // instances for the same cluster. And before the thread local clusters are actually initialized,
  // the new instances will override the old instances in the work threads. But part of the data is
  // created only once, such as the load balancer factory. So we should always merge the new
  // instance with the old one to keep the latest instance holding all necessary data.
  //
  // More specifically, this will happen in the following scenarios for now:
  // 1. EDS clusters: the ClusterLoadAssignment of EDS cluster may be updated multiples before
  //   the thread local cluster is initialized.
  // 2. Clusters in the unit tests: the cluster in the unit test may be updated multiples before
  //   the thread local cluster is initialized by calling 'updateHosts' manually.
  //
  // Only merge when the prior entry refers to the exact same ClusterInfo
  // instance; a different instance means the cluster was replaced.
  const bool should_merge_with_prior_cluster =
      entry != cluster_initialization_map_.end() && entry->second->cluster_info_ == cluster_info;
  if (should_merge_with_prior_cluster) {
    // We need to copy from an existing Cluster Initialization Object. In
    // particular, only update the params with changed priority.
    auto new_initialization_object = std::make_shared<ClusterInitializationObject>(
        entry->second->per_priority_state_, params, std::move(cluster_info),
        // Keep the previously captured LB factory when this update did not ship one.
        load_balancer_factory == nullptr ? entry->second->load_balancer_factory_
                                         : load_balancer_factory,
        map, drop_overload, drop_category);
    cluster_initialization_map_[cluster_name] = new_initialization_object;
    return new_initialization_object;
  } else {
    // We need to create a fresh Cluster Initialization Object.
    auto new_initialization_object = std::make_shared<ClusterInitializationObject>(
        params, std::move(cluster_info), load_balancer_factory, map, drop_overload, drop_category);
    cluster_initialization_map_[cluster_name] = new_initialization_object;
    return new_initialization_object;
  }
}
// Inflates a previously deferred cluster on this worker thread, if one exists.
// Returns a pointer to the freshly created ClusterEntry, or nullptr when
// `cluster` has no pending initialization object on this thread.
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry*
ClusterManagerImpl::ThreadLocalClusterManagerImpl::initializeClusterInlineIfExists(
    absl::string_view cluster) {
  auto entry = thread_local_deferred_clusters_.find(cluster);
  if (entry == thread_local_deferred_clusters_.end()) {
    // Unknown cluster.
    return nullptr;
  }
  // Create the cluster inline. Hold the initialization object by value (not a
  // reference into the map) so it is guaranteed to outlive the erase() below.
  const ClusterInitializationObjectConstSharedPtr initialization_object = entry->second;
  ENVOY_LOG(debug, "initializing TLS cluster {} inline", cluster);
  auto cluster_entry = std::make_unique<ClusterEntry>(
      *this, initialization_object->cluster_info_, initialization_object->load_balancer_factory_);
  ClusterEntry* cluster_entry_ptr = cluster_entry.get();
  thread_local_clusters_[cluster] = std::move(cluster_entry);
  local_stats_.clusters_inflated_.set(thread_local_clusters_.size());
  // Replay all buffered per-priority membership updates into the new entry.
  for (const auto& [_, per_priority] : initialization_object->per_priority_state_) {
    updateClusterMembership(initialization_object->cluster_info_->name(), per_priority.priority_,
                            per_priority.update_hosts_params_, per_priority.locality_weights_,
                            per_priority.hosts_added_, per_priority.hosts_removed_,
                            per_priority.weighted_priority_health_,
                            per_priority.overprovisioning_factor_,
                            initialization_object->cross_priority_host_map_);
  }
  // Use the pointer we already hold instead of re-looking the entry up in the
  // map twice (the original code performed two extra hash lookups here).
  cluster_entry_ptr->setDropOverload(initialization_object->drop_overload_);
  cluster_entry_ptr->setDropCategory(initialization_object->drop_category_);
  // Remove the CIO as we've initialized the cluster.
  thread_local_deferred_clusters_.erase(entry);
  return cluster_entry_ptr;
}
// Constructs a fresh initialization object from a single update, with no prior
// state to merge; the per-priority map starts empty and is filled verbatim.
ClusterManagerImpl::ClusterInitializationObject::ClusterInitializationObject(
    const ThreadLocalClusterUpdateParams& params, ClusterInfoConstSharedPtr cluster_info,
    LoadBalancerFactorySharedPtr load_balancer_factory, HostMapConstSharedPtr map,
    UnitFloat drop_overload, absl::string_view drop_category)
    : cluster_info_(std::move(cluster_info)), load_balancer_factory_(load_balancer_factory),
      cross_priority_host_map_(map), drop_overload_(drop_overload), drop_category_(drop_category) {
  // Copy the update since the map is empty.
  for (const auto& update : params.per_priority_update_params_) {
    per_priority_state_.emplace(update.priority_, update);
  }
}
// Merge constructor: starts from a prior object's per-priority state and folds
// in a newer update, so that the resulting hosts_added_ vectors reflect all
// deltas accumulated while the thread-local cluster remained deferred.
ClusterManagerImpl::ClusterInitializationObject::ClusterInitializationObject(
    const absl::flat_hash_map<int, ThreadLocalClusterUpdateParams::PerPriority>& per_priority_state,
    const ThreadLocalClusterUpdateParams& update_params, ClusterInfoConstSharedPtr cluster_info,
    LoadBalancerFactorySharedPtr load_balancer_factory, HostMapConstSharedPtr map,
    UnitFloat drop_overload, absl::string_view drop_category)
    : per_priority_state_(per_priority_state), cluster_info_(std::move(cluster_info)),
      load_balancer_factory_(load_balancer_factory), cross_priority_host_map_(map),
      drop_overload_(drop_overload), drop_category_(drop_category) {
  // Because EDS Clusters receive the entire ClusterLoadAssignment but only
  // provides the delta we must process the hosts_added and hosts_removed and
  // not simply overwrite with hosts added.
  for (const auto& update : update_params.per_priority_update_params_) {
    auto it = per_priority_state_.find(update.priority_);
    if (it != per_priority_state_.end()) {
      auto& priority_state = it->second;
      // Merge the two per_priorities: scalar fields are simply overwritten by
      // the newer update.
      priority_state.update_hosts_params_ = update.update_hosts_params_;
      priority_state.locality_weights_ = update.locality_weights_;
      priority_state.weighted_priority_health_ = update.weighted_priority_health_;
      priority_state.overprovisioning_factor_ = update.overprovisioning_factor_;
      // Merge the hosts vectors to just have hosts added.
      // Assumes that the old host_added_ is exclusive to new hosts_added_ and
      // new hosts_removed_ only refers to the old hosts_added_.
      ASSERT(priority_state.hosts_removed_.empty(),
             "Cluster Initialization Object should apply hosts "
             "removed updates to hosts_added vector!");
      // TODO(kbaichoo): replace with a more efficient algorithm. For example
      // if the EDS cluster exposed the LoadAssignment we could just merge by
      // overwriting hosts_added.
      if (!update.hosts_removed_.empty()) {
        // Remove all hosts to be removed from the old host_added.
        auto& host_added = priority_state.hosts_added_;
        auto removed_section = std::remove_if(
            host_added.begin(), host_added.end(),
            [hosts_removed = std::cref(update.hosts_removed_)](const HostSharedPtr& ptr) {
              return std::find(hosts_removed.get().begin(), hosts_removed.get().end(), ptr) !=
                     hosts_removed.get().end();
            });
        priority_state.hosts_added_.erase(removed_section, priority_state.hosts_added_.end());
      }
      // Add updated host_added (append the newer delta after the surviving old hosts).
      priority_state.hosts_added_.reserve(priority_state.hosts_added_.size() +
                                          update.hosts_added_.size());
      std::copy(update.hosts_added_.begin(), update.hosts_added_.end(),
                std::back_inserter(priority_state.hosts_added_));
    } else {
      // Just copy the new priority.
      per_priority_state_.emplace(update.priority_, update);
    }
  }
}
67
void ClusterManagerImpl::postThreadLocalHealthFailure(const HostSharedPtr& host) {
118
  tls_.runOnAllThreads([host](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
118
    cluster_manager->onHostHealthFailure(host);
118
  });
67
}
// Creates a raw upstream TCP connection to a host picked by this cluster's
// load balancer. Returns {nullptr, nullptr} when no host could be selected.
Host::CreateConnectionData ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::tcpConn(
    LoadBalancerContext* context) {
  // Host selection must complete synchronously for this API.
  HostConstSharedPtr logical_host =
      LoadBalancer::onlyAllowSynchronousHostSelection(chooseHost(context));
  if (logical_host) {
    auto conn_info = logical_host->createConnection(
        parent_.thread_local_dispatcher_, nullptr,
        context == nullptr ? nullptr : context->upstreamTransportSocketOptions());
    // If the cluster is configured to close connections when a host fails its
    // health check, track this connection in the per-host map so
    // onHostHealthFailure can find and close it later.
    if ((cluster_info_->features() &
         ClusterInfo::Features::CLOSE_CONNECTIONS_ON_HOST_HEALTH_FAILURE) &&
        conn_info.connection_ != nullptr) {
      auto conn_map_iter = parent_.host_tcp_conn_map_.find(logical_host);
      if (conn_map_iter == parent_.host_tcp_conn_map_.end()) {
        // First tracked connection for this host: create the map entry and
        // acquire a handle to pin the host.
        conn_map_iter =
            parent_.host_tcp_conn_map_.try_emplace(logical_host, logical_host->acquireHandle())
                .first;
      }
      auto& conn_map = conn_map_iter->second;
      conn_map.connections_.emplace(
          conn_info.connection_.get(),
          std::make_unique<ThreadLocalClusterManagerImpl::TcpConnContainer>(
              parent_, logical_host, *conn_info.connection_));
    }
    return conn_info;
  }
  // No host available (e.g. empty cluster or LB rejected the context).
  return {nullptr, nullptr};
}
// Returns this thread-local cluster's lazily constructed HTTP async client.
// The client is created on first use and lives as long as this ClusterEntry.
Http::AsyncClient&
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::httpAsyncClient() {
  if (lazy_http_async_client_ == nullptr) {
    lazy_http_async_client_ = std::make_unique<Http::AsyncClientImpl>(
        cluster_info_, parent_.parent_.stats_, parent_.thread_local_dispatcher_, parent_.parent_,
        parent_.parent_.context_,
        // Use make_unique instead of a naked `new` wrapped in ShadowWriterPtr;
        // unique_ptr<ShadowWriterImpl> converts implicitly to ShadowWriterPtr.
        std::make_unique<Router::ShadowWriterImpl>(parent_.parent_),
        parent_.parent_.http_context_, parent_.parent_.router_context_);
  }
  return *lazy_http_async_client_;
}
// Builds a fresh asynchronous TCP client bound to this worker's dispatcher.
// Each call returns a new, independently owned client.
Tcp::AsyncTcpClientPtr
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::tcpAsyncClient(
    LoadBalancerContext* context, Tcp::AsyncTcpClientOptionsConstSharedPtr options) {
  auto client = std::make_unique<Tcp::AsyncTcpClientImpl>(
      parent_.thread_local_dispatcher_, *this, context, options->enable_half_close);
  return client;
}
// Applies a per-priority membership update to this worker's copy of the
// cluster and, for thread-aware LBs, rebuilds the worker-local load balancer.
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::updateHosts(
    const std::string& name, uint32_t priority,
    PrioritySet::UpdateHostsParams&& update_hosts_params,
    LocalityWeightsConstSharedPtr locality_weights, const HostVector& hosts_added,
    const HostVector& hosts_removed, absl::optional<bool> weighted_priority_health,
    absl::optional<uint32_t> overprovisioning_factor,
    HostMapConstSharedPtr cross_priority_host_map) {
  ENVOY_LOG(debug, "membership update for TLS cluster {} added {} removed {}", name,
            hosts_added.size(), hosts_removed.size());
  priority_set_.updateHosts(priority, std::move(update_hosts_params), std::move(locality_weights),
                            hosts_added, hosts_removed, weighted_priority_health,
                            overprovisioning_factor, std::move(cross_priority_host_map));
  // If an LB is thread aware, create a new worker local LB on membership changes.
  if (lb_factory_ != nullptr && lb_factory_->recreateOnHostChange()) {
    ENVOY_LOG(debug, "re-creating local LB for TLS cluster {}", name);
    lb_ = lb_factory_->create({priority_set_, parent_.local_priority_set_});
  }
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::drainConnPools(
34141
    const HostVector& hosts_removed) {
34979
  for (const auto& host : hosts_removed) {
34607
    parent_.drainOrCloseConnPools(host, ConnectionPool::DrainBehavior::DrainAndDelete);
34607
  }
34141
}
33816
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::drainConnPools() {
34020
  for (auto& host_set : priority_set_.hostSetsPerPriority()) {
34020
    drainConnPools(host_set->hosts());
34020
  }
33816
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::drainConnPools(
112
    DrainConnectionsHostPredicate predicate, ConnectionPool::DrainBehavior behavior) {
112
  for (auto& host_set : priority_set_.hostSetsPerPriority()) {
114
    for (const auto& host : host_set->hosts()) {
114
      if (predicate != nullptr && !predicate(*host)) {
24
        continue;
24
      }
90
      parent_.drainOrCloseConnPools(host, behavior);
90
    }
112
  }
112
}
// Registers cluster add/update/removal callbacks on the calling worker's
// thread-local manager; the returned handle unregisters on destruction.
ClusterUpdateCallbacksHandlePtr
ClusterManagerImpl::addThreadLocalClusterUpdateCallbacks(ClusterUpdateCallbacks& cb) {
  return (*tls_).addClusterUpdateCallbacks(cb);
}
// Creates (or reuses) an on-demand CDS subscription keyed by a hash of its
// config source and optional resource locator, returning a handle to it.
absl::StatusOr<OdCdsApiHandlePtr>
ClusterManagerImpl::allocateOdCdsApi(OdCdsCreationFunction creation_function,
                                     const envoy::config::core::v3::ConfigSource& odcds_config,
                                     OptRef<xds::core::v3::ResourceLocator> odcds_resources_locator,
                                     ProtobufMessage::ValidationVisitor& validation_visitor) {
  // Generate a unique key based on config and locator. This enables reuse of subscriptions
  // with the same configuration. Note that timeout is intentionally not part of the hash,
  // so different timeout values will share the same subscription.
  // Subscriptions persist for the lifetime of ClusterManagerImpl and are cleaned up when
  // it is destroyed.
  uint64_t config_hash = MessageUtil::hash(odcds_config);
  if (odcds_resources_locator.has_value()) {
    // Fold the locator's hash into the key so the same config with different
    // locators yields distinct subscriptions.
    config_hash = absl::HashOf(config_hash, MessageUtil::hash(*odcds_resources_locator));
  }
  auto it = odcds_subscriptions_.find(config_hash);
  if (it != odcds_subscriptions_.end()) {
    // Reuse the existing subscription; only a new handle is created.
    return OdCdsApiHandleImpl::create(*this, config_hash);
  }
  auto odcds_or_error =
      creation_function(odcds_config, odcds_resources_locator, xds_manager_, *this, *this,
                        *stats_.rootScope(), validation_visitor, context_);
  RETURN_IF_NOT_OK_REF(odcds_or_error.status());
  odcds_subscriptions_.emplace(config_hash, std::move(*odcds_or_error));
  return OdCdsApiHandleImpl::create(*this, config_hash);
}
// Worker-side entry point for on-demand cluster discovery. Registers the
// callback locally, and if this worker is the first requester, posts the
// discovery to the main thread, which deduplicates across workers, kicks the
// ODCDS subscription, and arms a timeout timer.
ClusterDiscoveryCallbackHandlePtr
ClusterManagerImpl::requestOnDemandClusterDiscovery(uint64_t config_source_key, std::string name,
                                                    ClusterDiscoveryCallbackPtr callback,
                                                    std::chrono::milliseconds timeout) {
  ThreadLocalClusterManagerImpl& cluster_manager = *tls_;
  auto [handle, discovery_in_progress, invoker] =
      cluster_manager.cdm_.addCallback(name, std::move(callback));
  // This check will catch requests for discoveries from this thread only. If other thread
  // requested the same discovery, we will detect it in the main thread later.
  if (discovery_in_progress) {
    ENVOY_LOG(debug,
              "cm odcds: on-demand discovery for cluster {} is already in progress, something else "
              "in thread {} has already requested it",
              name, cluster_manager.thread_local_dispatcher_.name());
    // This worker thread has already requested a discovery of a cluster with this name, so
    // nothing more left to do here.
    //
    // We can't "just" return handle here, because handle is a part of the structured binding done
    // above. So it's not really a ClusterDiscoveryCallbackHandlePtr, but more like
    // ClusterDiscoveryCallbackHandlePtr&, so named return value optimization does not apply here
    // - it needs to be moved.
    return std::move(handle);
  }
  ENVOY_LOG(
      debug,
      "cm odcds: forwarding the on-demand discovery request for cluster {} to the main thread",
      name);
  // This seems to be the first request for discovery of this cluster in this worker thread. Rest
  // of the process may only happen in the main thread.
  Event::Dispatcher& worker_dispatcher = cluster_manager.thread_local_dispatcher_;
  dispatcher_.post([this, config_source_key, timeout, name = std::move(name),
                    invoker = std::move(invoker), &worker_dispatcher] {
    // Runs on the main thread: look up the subscription created by allocateOdCdsApi.
    OdCdsApiSharedPtr odcds = odcds_subscriptions_.at(config_source_key);
    // Check for the cluster here too. It might have been added between the time when this closure
    // was posted and when it is being executed.
    if (getThreadLocalCluster(name) != nullptr) {
      ENVOY_LOG(
          debug,
          "cm odcds: the requested cluster {} is already known, posting the callback back to {}",
          name, worker_dispatcher.name());
      // Bounce the success notification back to the requesting worker.
      worker_dispatcher.post([invoker = std::move(invoker)] {
        invoker.invokeCallback(ClusterDiscoveryStatus::Available);
      });
      return;
    }
    if (pending_cluster_creations_.contains(name)) {
      ENVOY_LOG(debug, "cm odcds: on-demand discovery for cluster {} is already in progress", name);
      // We already began the discovery process for this cluster, nothing to do. If we got here,
      // it means that it was other worker thread that requested the discovery.
      return;
    }
    // Start the discovery. If the cluster gets discovered, cluster manager will warm it up and
    // invoke the cluster lifecycle callbacks, that will in turn invoke our callback.
    odcds->updateOnDemand(name);
    // Setup the discovery timeout timer to avoid keeping callbacks indefinitely.
    auto timer = dispatcher_.createTimer([this, name] { notifyExpiredDiscovery(name); });
    timer->enableTimer(timeout);
    // Keep odcds handle alive for the duration of the discovery process.
    pending_cluster_creations_.insert(
        {std::move(name), ClusterCreation{std::move(odcds), std::move(timer)}});
  });
  // We can't "just" return handle here, because handle is a part of the structured binding done
  // above. So it's not really a ClusterDiscoveryCallbackHandlePtr, but more like
  // ClusterDiscoveryCallbackHandlePtr&, so named return value optimization does not apply here -
  // it needs to be moved.
  return std::move(handle);
}
18
// Called when ODCDS reports that the requested cluster does not exist; fans
// the Missing status out to waiting workers.
void ClusterManagerImpl::notifyMissingCluster(absl::string_view name) {
  ENVOY_LOG(info, "cm odcds: cluster {} not found during on-demand discovery", name);
  notifyClusterDiscoveryStatus(name, ClusterDiscoveryStatus::Missing);
}
19
// Timeout-timer callback for an on-demand discovery; fans the Timeout status
// out to waiting workers.
void ClusterManagerImpl::notifyExpiredDiscovery(absl::string_view name) {
  ENVOY_LOG(info, "cm odcds: on-demand discovery for cluster {} timed out", name);
  notifyClusterDiscoveryStatus(name, ClusterDiscoveryStatus::Timeout);
}
// Finishes an on-demand discovery: removes the pending-creation entry (which
// releases the ODCDS handle and timer) and tells every worker to run the
// callbacks registered for this cluster name with the given status.
void ClusterManagerImpl::notifyClusterDiscoveryStatus(absl::string_view name,
                                                      ClusterDiscoveryStatus status) {
  // extract() both checks for and removes the entry in a single lookup.
  auto map_node_handle = pending_cluster_creations_.extract(name);
  if (map_node_handle.empty()) {
    // Not a cluster we are interested in. This may happen when ODCDS
    // receives some cluster name in removed resources field and
    // notifies the cluster manager about it.
    return;
  }
  // Let all the worker threads know that the discovery timed out.
  tls_.runOnAllThreads(
      [name = std::string(name), status](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
        ENVOY_LOG(
            trace,
            "cm cdm: starting processing cluster name {} (status {}) from the expired timer in {}",
            name, enumToInt(status), cluster_manager->thread_local_dispatcher_.name());
        cluster_manager->cdm_.processClusterName(name, status);
      });
}
527
// Returns the ADS mux's EDS resources cache, or an empty OptRef when there is
// no ADS mux (EDS caching is only supported for ADS).
Config::EdsResourcesCacheOptRef ClusterManagerImpl::edsResourcesCache() {
  // Fetch the mux once instead of calling adsMux() twice.
  const auto ads_mux = xds_manager_.adsMux();
  if (ads_mux != nullptr) {
    return ads_mux->edsResourcesCache();
  }
  return {};
}
// Installs a QUIC network observer registry on every worker thread. Compiles
// to a no-op (beyond silencing the unused parameter) when QUIC is disabled.
void ClusterManagerImpl::createNetworkObserverRegistries(
    Quic::EnvoyQuicNetworkObserverRegistryFactory& factory) {
#ifdef ENVOY_ENABLE_QUIC
  // The factory is captured by reference: runOnAllThreads completes before this
  // call's caller-owned factory can go away.
  tls_.runOnAllThreads([&factory](OptRef<ThreadLocalClusterManagerImpl> cluster_manager) {
    ENVOY_LOG(trace, "cm: create network observer registry in {}",
              cluster_manager->thread_local_dispatcher_.name());
    cluster_manager->createThreadLocalNetworkObserverRegistry(factory);
  });
#else
  (void)factory;
#endif
}
// Replaces the calling worker's ClusterDiscoveryManager with a fresh one and
// returns the previous manager (its state is handed back via swap).
ClusterDiscoveryManager
ClusterManagerImpl::createAndSwapClusterDiscoveryManager(std::string thread_name) {
  ThreadLocalClusterManagerImpl& tlcm = *tls_;
  ClusterDiscoveryManager fresh_manager(std::move(thread_name), tlcm);
  tlcm.cdm_.swap(fresh_manager);
  // After the swap `fresh_manager` holds the old manager's contents.
  return fresh_manager;
}
// Builds the admin /config_dump view of all active and warming clusters whose
// names match `name_matcher`. API-added clusters are reported as dynamic
// (with version info), bootstrap clusters as static.
ProtobufTypes::MessagePtr
ClusterManagerImpl::dumpClusterConfigs(const Matchers::StringMatcher& name_matcher) {
  auto config_dump = std::make_unique<envoy::admin::v3::ClustersConfigDump>();
  config_dump->set_version_info(cds_api_ != nullptr ? cds_api_->versionInfo() : "");
  for (const auto& [_, cluster_data] : active_clusters_) {
    const auto& cluster = *cluster_data;
    if (!name_matcher.match(cluster.cluster_config_.name())) {
      continue;
    }
    if (cluster.added_via_api_) {
      auto& dynamic_cluster = *config_dump->mutable_dynamic_active_clusters()->Add();
      dynamic_cluster.set_version_info(cluster.version_info_);
      dynamic_cluster.mutable_cluster()->PackFrom(cluster.cluster_config_);
      TimestampUtil::systemClockToTimestamp(cluster.last_updated_,
                                            *(dynamic_cluster.mutable_last_updated()));
    } else {
      auto& static_cluster = *config_dump->mutable_static_clusters()->Add();
      static_cluster.mutable_cluster()->PackFrom(cluster.cluster_config_);
      TimestampUtil::systemClockToTimestamp(cluster.last_updated_,
                                            *(static_cluster.mutable_last_updated()));
    }
  }
  for (const auto& [_, warming_data] : warming_clusters_) {
    const auto& cluster = *warming_data;
    if (!name_matcher.match(cluster.cluster_config_.name())) {
      continue;
    }
    auto& dynamic_cluster = *config_dump->mutable_dynamic_warming_clusters()->Add();
    dynamic_cluster.set_version_info(cluster.version_info_);
    dynamic_cluster.mutable_cluster()->PackFrom(cluster.cluster_config_);
    TimestampUtil::systemClockToTimestamp(cluster.last_updated_,
                                          *(dynamic_cluster.mutable_last_updated()));
  }
  return config_dump;
}
// Per-worker manager constructor. If a local cluster is configured it must be
// inflated first, because other clusters' zone-aware load balancers register
// member-update callbacks against it.
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ThreadLocalClusterManagerImpl(
    ClusterManagerImpl& parent, Event::Dispatcher& dispatcher,
    const absl::optional<LocalClusterParams>& local_cluster_params)
    : parent_(parent), thread_local_dispatcher_(dispatcher), cdm_(dispatcher.name(), *this),
      local_stats_(generateStats(*parent.stats_.rootScope(), dispatcher.name())) {
  // If local cluster is defined then we need to initialize it first.
  if (local_cluster_params.has_value()) {
    const auto& local_cluster_name = local_cluster_params->info_->name();
    ENVOY_LOG(debug, "adding TLS local cluster {}", local_cluster_name);
    thread_local_clusters_[local_cluster_name] = std::make_unique<ClusterEntry>(
        *this, local_cluster_params->info_, local_cluster_params->load_balancer_factory_);
    // Remember the local cluster's priority set so its entry can be destroyed
    // last (see the destructor).
    local_priority_set_ = &thread_local_clusters_[local_cluster_name]->prioritySet();
    local_stats_.clusters_inflated_.set(thread_local_clusters_.size());
  }
}
21612
ClusterManagerImpl::ThreadLocalClusterManagerImpl::~ThreadLocalClusterManagerImpl() {
  // Clear out connection pools as well as the thread local cluster map so that we release all
  // cluster pointers. Currently we have to free all non-local clusters before we free
  // the local cluster. This is because non-local clusters with a zone aware load balancer have a
  // member update callback registered with the local cluster.
  ENVOY_LOG(debug, "shutting down thread local cluster manager");
  // Flag teardown so other code paths can skip work during shutdown.
  destroying_ = true;
  host_http_conn_pool_map_.clear();
  host_tcp_conn_pool_map_.clear();
  ASSERT(host_tcp_conn_map_.empty());
  // First pass: destroy every non-local cluster entry, leaving the local
  // cluster (identified by its priority set) alive until the map is cleared.
  for (auto& cluster : thread_local_clusters_) {
    if (&cluster.second->prioritySet() != local_priority_set_) {
      cluster.second.reset();
    }
  }
  thread_local_clusters_.clear();
  // Ensure that all pools are completely destructed.
  thread_local_dispatcher_.clearDeferredDeleteList();
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::removeTcpConn(
8
    const HostConstSharedPtr& host, Network::ClientConnection& connection) {
8
  auto host_tcp_conn_map_it = host_tcp_conn_map_.find(host);
8
  ASSERT(host_tcp_conn_map_it != host_tcp_conn_map_.end());
8
  auto& connections_map = host_tcp_conn_map_it->second.connections_;
8
  auto it = connections_map.find(&connection);
8
  ASSERT(it != connections_map.end());
8
  connection.dispatcher().deferredDelete(std::move(it->second));
8
  connections_map.erase(it);
8
  if (connections_map.empty()) {
6
    host_tcp_conn_map_.erase(host_tcp_conn_map_it);
6
  }
8
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::removeHosts(
128
    const std::string& name, const HostVector& hosts_removed) {
128
  auto entry = thread_local_clusters_.find(name);
  // The if should only be possible if deferred cluster creation is enabled.
128
  if (entry == thread_local_clusters_.end()) {
7
    ASSERT(
7
        parent_.deferred_cluster_creation_,
7
        fmt::format("Cannot find ThreadLocalCluster {}, but deferred cluster creation is disabled.",
7
                    name));
7
    ASSERT(thread_local_deferred_clusters_.find(name) != thread_local_deferred_clusters_.end(),
7
           "Cluster with removed host is neither deferred or inflated!");
7
    return;
7
  }
121
  const auto& cluster_entry = entry->second;
121
  ENVOY_LOG(debug, "removing hosts for TLS cluster {} removed {}", name, hosts_removed.size());
  // We need to go through and purge any connection pools for hosts that got deleted.
  // Even if two hosts actually point to the same address this will be safe, since if a
  // host is readded it will be a different physical HostSharedPtr.
121
  cluster_entry->drainConnPools(hosts_removed);
121
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::updateClusterMembership(
    const std::string& name, uint32_t priority, PrioritySet::UpdateHostsParams update_hosts_params,
    LocalityWeightsConstSharedPtr locality_weights, const HostVector& hosts_added,
    const HostVector& hosts_removed, bool weighted_priority_health,
33852
    uint64_t overprovisioning_factor, HostMapConstSharedPtr cross_priority_host_map) {
33852
  ASSERT(thread_local_clusters_.find(name) != thread_local_clusters_.end());
33852
  const auto& cluster_entry = thread_local_clusters_[name];
33852
  cluster_entry->updateHosts(name, priority, std::move(update_hosts_params),
33852
                             std::move(locality_weights), hosts_added, hosts_removed,
33852
                             weighted_priority_health, overprovisioning_factor,
33852
                             std::move(cross_priority_host_map));
33852
}
// Reacts to a host becoming unhealthy. Depending on the cluster's
// CLOSE_CONNECTIONS_ON_HOST_HEALTH_FAILURE feature flag, either close connections to the
// host outright or gracefully drain the existing ones.
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::onHostHealthFailure(
    const HostSharedPtr& host) {
  if (host->cluster().features() &
      ClusterInfo::Features::CLOSE_CONNECTIONS_ON_HOST_HEALTH_FAILURE) {
    // Passing nullopt requests close rather than drain (see drainOrCloseConnPools; HTTP
    // pools fall back to draining since close is unsupported there).
    drainOrCloseConnPools(host, absl::nullopt);
    // Close non connection pool TCP connections obtained from tcpConn()
    //
    // TODO(jono): The only remaining user of the non-pooled connections seems to be the statsd
    // TCP client. Perhaps it could be rewritten to use a connection pool, and this code deleted.
    //
    // Each connection will remove itself from the TcpConnectionsMap when it closes, via its
    // Network::ConnectionCallbacks. The last removed tcp conn will remove the TcpConnectionsMap
    // from host_tcp_conn_map_, so do not cache it between iterations.
    //
    // TODO(ggreenway) PERF: If there are a large number of connections, this could take a long
    // time and halt other useful work. Consider breaking up this work. Note that this behavior is
    // noted in the configuration documentation in cluster setting
    // "close_connections_on_host_health_failure". Update the docs if this if this changes.
    while (true) {
      // Re-find on every iteration: close() below mutates the map via callbacks.
      const auto& it = host_tcp_conn_map_.find(host);
      if (it == host_tcp_conn_map_.end()) {
        break;
      }
      TcpConnectionsMap& container = it->second;
      container.connections_.begin()->first->close(
          Network::ConnectionCloseType::NoFlush,
          StreamInfo::LocalCloseReasons::get().NonPooledTcpConnectionHostHealthFailure);
    }
  } else {
    // Default behavior: let in-flight work finish while draining existing connections.
    drainOrCloseConnPools(host, ConnectionPool::DrainBehavior::DrainExistingConnections);
  }
}
// Looks up the HTTP connection pool container for `host`. When `allocate` is true a
// missing container is created; otherwise nullptr is returned for a missing entry.
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ConnPoolsContainer*
ClusterManagerImpl::ThreadLocalClusterManagerImpl::getHttpConnPoolsContainer(
    const HostConstSharedPtr& host, bool allocate) {
  auto it = host_http_conn_pool_map_.find(host);
  if (it != host_http_conn_pool_map_.end()) {
    return &it->second;
  }
  if (!allocate) {
    return nullptr;
  }
  const auto emplaced = host_http_conn_pool_map_.try_emplace(host, thread_local_dispatcher_, host);
  return &emplaced.first->second;
}
// Registers `cb` for cluster update notifications delivered on this worker thread. The
// registration is scoped to the returned handle (see ClusterUpdateCallbacksHandleImpl —
// presumably it unregisters from `update_callbacks_` on destruction; confirm there).
ClusterUpdateCallbacksHandlePtr
ClusterManagerImpl::ThreadLocalClusterManagerImpl::addClusterUpdateCallbacks(
    ClusterUpdateCallbacks& cb) {
  return std::make_unique<ClusterUpdateCallbacksHandleImpl>(cb, update_callbacks_);
}
// Worker-local view of a single cluster: owns the thread-local priority set and the
// worker-local load balancer instance created from the shared factory.
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::ClusterEntry(
    ThreadLocalClusterManagerImpl& parent, ClusterInfoConstSharedPtr cluster,
    const LoadBalancerFactorySharedPtr& lb_factory)
    : parent_(parent), cluster_info_(cluster), lb_factory_(lb_factory),
      override_host_statuses_(HostUtility::createOverrideHostStatus(cluster_info_->lbConfig())) {
  // Make sure the priority-0 host set exists even before the first membership update.
  priority_set_.getOrCreateHostSet(0);
  // TODO(mattklein123): Consider converting other LBs over to thread local. All of them could
  // benefit given the healthy panic, locality, and priority calculations that take place.
  ASSERT(lb_factory_ != nullptr);
  // Create the worker-local LB; the local cluster's priority set may be nullptr when no
  // local cluster is configured (see ThreadLocalClusterManagerImpl's constructor).
  lb_ = lb_factory_->create({priority_set_, parent_.local_priority_set_});
}
// Drains or closes every HTTP and TCP connection pool owned by `host` on this worker.
// A populated `drain_behavior` requests a drain with that behavior; nullopt requests a
// hard close (TCP pools only — HTTP pools fall back to draining, see TODO below).
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::drainOrCloseConnPools(
    const HostSharedPtr& host, absl::optional<ConnectionPool::DrainBehavior> drain_behavior) {
  // Drain or close any HTTP connection pool for the host.
  {
    const auto container = getHttpConnPoolsContainer(host);
    if (container != nullptr) {
      // Block idle callbacks from erasing `container` while we are still operating on it
      // (see httpConnPoolIsIdle, which honors this flag).
      container->do_not_delete_ = true;
      if (drain_behavior.has_value()) {
        container->pools_->drainConnections(drain_behavior.value());
      } else {
        // TODO(wbpcode): 'CLOSE_CONNECTIONS_ON_HOST_HEALTH_FAILURE' and 'closeConnections'
        // is only supported for TCP connection pools for now. Use 'DrainExistingConnections'
        // drain here as alternative.
        container->pools_->drainConnections(
            ConnectionPool::DrainBehavior::DrainExistingConnections);
      }
      container->do_not_delete_ = false;
      // If the drain emptied the container, drop the host's map entry ourselves since the
      // idle callbacks were prevented from doing so above.
      if (container->pools_->empty()) {
        host_http_conn_pool_map_.erase(host);
      }
    }
  }
  // Drain or close any TCP connection pool for the host.
  {
    const auto container = host_tcp_conn_pool_map_.find(host);
    if (container != host_tcp_conn_pool_map_.end()) {
      // Draining pools or closing connections can cause pool deletion if it becomes
      // idle. Copy `pools_` so that we aren't iterating through a container that
      // gets mutated by callbacks deleting from it.
      std::vector<Tcp::ConnectionPool::Instance*> pools;
      for (const auto& pair : container->second.pools_) {
        pools.push_back(pair.second.get());
      }
      for (auto* pool : pools) {
        if (drain_behavior.has_value()) {
          pool->drainConnections(drain_behavior.value());
        } else {
          pool->closeConnections();
        }
      }
    }
  }
}
// Tears down the worker-local cluster view; all of its connection pools must be drained
// before the underlying cluster objects can be released.
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::~ClusterEntry() {
  // We need to drain all connection pools for the cluster being removed. Then we can remove the
  // cluster.
  //
  // TODO(mattklein123): Optimally, we would just fire member changed callbacks and remove all of
  // the hosts inside of the HostImpl destructor. That is a change with wide implications, so we
  // are going with a more targeted approach for now.
  drainConnPools();
}
// Returns the HTTP connection pool for `host` at `priority`, creating it on first use.
// Pools are keyed by a hash of everything that must not be shared between pools:
// the upstream protocol set, upstream socket options, transport socket options, and
// (when connection_pool_per_downstream_connection is set) the downstream connection
// identity. Returns nullptr when `host` is null or when the pool map declines creation.
Http::ConnectionPool::Instance*
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::httpConnPoolImpl(
    HostConstSharedPtr host, ResourcePriority priority,
    absl::optional<Http::Protocol> downstream_protocol, LoadBalancerContext* context) {
  if (!host) {
    return nullptr;
  }
  // Right now, HTTP, HTTP/2 and ALPN pools are considered separate.
  // We could do better here, and always use the ALPN pool and simply make sure
  // we end up on a connection of the correct protocol, but for simplicity we're
  // starting with something simpler.
  auto upstream_protocols = host->cluster().upstreamHttpProtocol(downstream_protocol);
  std::vector<uint8_t> hash_key;
  hash_key.reserve(upstream_protocols.size());
  for (auto protocol : upstream_protocols) {
    hash_key.push_back(uint8_t(protocol));
  }
  absl::optional<envoy::config::core::v3::AlternateProtocolsCacheOptions>
      alternate_protocol_options =
          host->cluster().httpProtocolOptions().alternateProtocolsCacheOptions();
  Network::Socket::OptionsSharedPtr upstream_options(std::make_shared<Network::Socket::Options>());
  if (context) {
    // Inherit socket options from downstream connection, if set.
    if (context->downstreamConnection()) {
      addOptionsIfNotNull(upstream_options, context->downstreamConnection()->socketOptions());
    }
    addOptionsIfNotNull(upstream_options, context->upstreamSocketOptions());
  }
  // Use the socket options for computing connection pool hash key, if any.
  // This allows socket options to control connection pooling so that connections with
  // different options are not pooled together.
  for (const auto& option : *upstream_options) {
    option->hashKey(hash_key);
  }
  bool have_transport_socket_options = false;
  if (context && context->upstreamTransportSocketOptions()) {
    host->transportSocketFactory().hashKey(hash_key, context->upstreamTransportSocketOptions());
    have_transport_socket_options = true;
  }
  // If configured, use the downstream connection id in pool hash key
  if (cluster_info_->connectionPoolPerDownstreamConnection() && context &&
      context->downstreamConnection()) {
    context->downstreamConnection()->hashKey(hash_key);
  }
  ConnPoolsContainer& container = *parent_.getHttpConnPoolsContainer(host, true);
  // Note: to simplify this, we assume that the factory is only called in the scope of this
  // function. Otherwise, we'd need to capture a few of these variables by value.
  ConnPoolsContainer::ConnPools::PoolOptRef pool =
      container.pools_->getPool(priority, hash_key, [&]() {
        auto pool = parent_.parent_.factory_.allocateConnPool(
            parent_.thread_local_dispatcher_, host, priority, upstream_protocols,
            alternate_protocol_options, !upstream_options->empty() ? upstream_options : nullptr,
            have_transport_socket_options ? context->upstreamTransportSocketOptions() : nullptr,
            parent_.parent_.time_source_, parent_.cluster_manager_state_, quic_info_,
            parent_.getNetworkObserverRegistry());
        // The idle callback outlives this frame, so `host`, `priority` and `hash_key` are
        // captured by value (unlike the factory lambda's by-reference captures above).
        pool->addIdleCallback([&parent = parent_, host, priority, hash_key]() {
          parent.httpConnPoolIsIdle(host, priority, hash_key);
        });
        return pool;
      });
  if (pool.has_value()) {
    return &(pool.value().get());
  } else {
    return nullptr;
  }
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::httpConnPoolIsIdle(
11774
    HostConstSharedPtr host, ResourcePriority priority, const std::vector<uint8_t>& hash_key) {
11774
  if (destroying_) {
    // If the Cluster is being destroyed, this pool will be cleaned up by that
    // process.
221
    return;
221
  }
11553
  ConnPoolsContainer* container = getHttpConnPoolsContainer(host);
11553
  if (container == nullptr) {
    // This could happen if we have cleaned out the host before iterating through every
    // connection pool. Handle it by just continuing.
    return;
  }
11553
  ENVOY_LOG(trace, "Erasing idle pool for host {}", *host);
11553
  container->pools_->erasePool(priority, hash_key);
  // Guard deletion of the container with `do_not_delete_` to avoid deletion while
  // iterating through the container in `container->pools_->startDrain()`. See
  // comment in `ClusterManagerImpl::ThreadLocalClusterManagerImpl::drainConnPools`.
11553
  if (!container->do_not_delete_ && container->pools_->empty()) {
11382
    ENVOY_LOG(trace, "Pool container empty for host {}, erasing host entry", *host);
11382
    host_http_conn_pool_map_.erase(
11382
        host); // NOTE: `container` is erased after this point in the lambda.
11382
  }
11553
}
// Selects an upstream host: an override host from the cross-priority map wins; in strict
// override mode a miss is a hard failure; otherwise the load balancer decides.
HostSelectionResponse ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::chooseHost(
    LoadBalancerContext* context) {
  const auto cross_priority_host_map = priority_set_.crossPriorityHostMap();
  auto [override_host, strict_mode] = HostUtility::selectOverrideHost(
      cross_priority_host_map.get(), override_host_statuses_, context);
  if (override_host != nullptr) {
    return {std::move(override_host)};
  }
  if (strict_mode) {
    // Strict override: never fall back to the load balancer when the override misses.
    cluster_info_->trafficStats()->upstream_cx_none_healthy_.inc();
    ENVOY_LOG(debug, "no healthy host");
    return {nullptr};
  }
  Upstream::HostSelectionResponse host_selection = lb_->chooseHost(context);
  if (!host_selection.host && !host_selection.cancelable) {
    cluster_info_->trafficStats()->upstream_cx_none_healthy_.inc();
    ENVOY_LOG(debug, "no healthy host");
  }
  return host_selection;
}
// Peeks the next host without consuming it: an override host wins, otherwise defer to
// the load balancer's peek.
HostConstSharedPtr ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::peekAnotherHost(
    LoadBalancerContext* context) {
  const auto cross_priority_host_map = priority_set_.crossPriorityHostMap();
  auto host_and_strict_mode = HostUtility::selectOverrideHost(cross_priority_host_map.get(),
                                                              override_host_statuses_, context);
  if (host_and_strict_mode.first == nullptr) {
    // TODO(wbpcode): should we do strict mode check of override host here?
    return lb_->peekAnotherHost(context);
  }
  return std::move(host_and_strict_mode.first);
}
// Returns the TCP connection pool for `host` at `priority`, creating it on first use.
// Pools are keyed by a hash of the priority, socket options, transport socket options,
// and (when connection_pool_per_downstream_connection is set) the downstream connection
// identity, so connections with different requirements are never shared.
Tcp::ConnectionPool::Instance*
ClusterManagerImpl::ThreadLocalClusterManagerImpl::ClusterEntry::tcpConnPoolImpl(
    HostConstSharedPtr host, ResourcePriority priority, LoadBalancerContext* context) {
  // Inherit socket options from downstream connection, if set.
  std::vector<uint8_t> hash_key = {uint8_t(priority)};
  // Use downstream connection socket options for computing connection pool hash key, if any.
  // This allows socket options to control connection pooling so that connections with
  // different options are not pooled together.
  Network::Socket::OptionsSharedPtr upstream_options(std::make_shared<Network::Socket::Options>());
  if (context) {
    if (context->downstreamConnection()) {
      addOptionsIfNotNull(upstream_options, context->downstreamConnection()->socketOptions());
    }
    addOptionsIfNotNull(upstream_options, context->upstreamSocketOptions());
  }
  for (const auto& option : *upstream_options) {
    option->hashKey(hash_key);
  }
  // If configured, use the downstream connection id in pool hash key
  if (cluster_info_->connectionPoolPerDownstreamConnection() && context &&
      context->downstreamConnection()) {
    ENVOY_LOG(trace, "honoring connection_pool_per_downstream_connection");
    context->downstreamConnection()->hashKey(hash_key);
  }
  bool have_transport_socket_options = false;
  if (context != nullptr && context->upstreamTransportSocketOptions() != nullptr) {
    have_transport_socket_options = true;
    host->transportSocketFactory().hashKey(hash_key, context->upstreamTransportSocketOptions());
  }
  // Find or create the per-host container. The entry stores a handle acquired from the
  // host (see Host::acquireHandle — presumably pins host bookkeeping; confirm there).
  auto container_iter = parent_.host_tcp_conn_pool_map_.find(host);
  if (container_iter == parent_.host_tcp_conn_pool_map_.end()) {
    container_iter = parent_.host_tcp_conn_pool_map_.try_emplace(host, host->acquireHandle()).first;
  }
  TcpConnPoolsContainer& container = container_iter->second;
  auto pool_iter = container.pools_.find(hash_key);
  if (pool_iter == container.pools_.end()) {
    bool inserted;
    std::tie(pool_iter, inserted) = container.pools_.emplace(
        hash_key,
        parent_.parent_.factory_.allocateTcpConnPool(
            parent_.thread_local_dispatcher_, host, priority,
            !upstream_options->empty() ? upstream_options : nullptr,
            have_transport_socket_options ? context->upstreamTransportSocketOptions() : nullptr,
            parent_.cluster_manager_state_, cluster_info_->tcpPoolIdleTimeout()));
    ASSERT(inserted);
    // The idle callback outlives this frame, so `host` and `hash_key` are captured by
    // value; it erases the pool (and possibly the container) when the pool goes idle.
    pool_iter->second->addIdleCallback(
        [&parent = parent_, host, hash_key]() { parent.tcpConnPoolIsIdle(host, hash_key); });
  }
  return pool_iter->second.get();
}
void ClusterManagerImpl::ThreadLocalClusterManagerImpl::tcpConnPoolIsIdle(
794
    HostConstSharedPtr host, const std::vector<uint8_t>& hash_key) {
794
  if (destroying_) {
    // If the Cluster is being destroyed, this pool will be cleaned up by that process.
7
    return;
7
  }
787
  auto it = host_tcp_conn_pool_map_.find(host);
787
  if (it != host_tcp_conn_pool_map_.end()) {
787
    TcpConnPoolsContainer& container = it->second;
787
    auto erase_iter = container.pools_.find(hash_key);
787
    if (erase_iter != container.pools_.end()) {
787
      ENVOY_LOG(trace, "Idle pool, erasing pool for host {}", *host);
787
      thread_local_dispatcher_.deferredDelete(std::move(erase_iter->second));
787
      container.pools_.erase(erase_iter);
787
    }
787
    if (container.pools_.empty()) {
778
      host_tcp_conn_pool_map_.erase(
778
          host); // NOTE: `container` is erased after this point in the lambda.
778
    }
787
  }
787
}
// Builds the production ClusterManagerImpl from the bootstrap config. Construction
// errors are reported through `creation_status` rather than thrown.
absl::StatusOr<ClusterManagerPtr> ProdClusterManagerFactory::clusterManagerFromProto(
    const envoy::config::bootstrap::v3::Bootstrap& bootstrap) {
  absl::Status creation_status = absl::OkStatus();
  std::unique_ptr<ClusterManagerImpl> cluster_manager{
      new ClusterManagerImpl(bootstrap, *this, context_, creation_status)};
  RETURN_IF_NOT_OK(creation_status);
  return cluster_manager;
}
// Allocates the HTTP connection pool implementation matching the upstream protocol set:
//  - {H1, H2, H3}: ConnectivityGrid (HTTP/3 with TCP fallback) — QUIC builds only.
//  - {H1, H2}: mixed pool that selects the protocol via ALPN.
//  - {H2}, {H3}, {H1}: dedicated single-protocol pool.
// An alternate-protocols cache is created when explicitly configured, and implicitly for
// HTTP/2-capable upstreams to track max concurrent streams across connections.
//
// FIX: `transport_socket_options` may legitimately be null (callers such as
// httpConnPoolImpl pass nullptr when the context supplies no transport socket options),
// so it must not be dereferenced unconditionally when probing for HTTP/1.1 proxy info.
Http::ConnectionPool::InstancePtr ProdClusterManagerFactory::allocateConnPool(
    Event::Dispatcher& dispatcher, HostConstSharedPtr host, ResourcePriority priority,
    std::vector<Http::Protocol>& protocols,
    const absl::optional<envoy::config::core::v3::AlternateProtocolsCacheOptions>&
        alternate_protocol_options,
    const Network::ConnectionSocket::OptionsSharedPtr& options,
    const Network::TransportSocketOptionsConstSharedPtr& transport_socket_options,
    TimeSource& source, ClusterConnectivityState& state, Http::PersistentQuicInfoPtr& quic_info,
    OptRef<Quic::EnvoyQuicNetworkObserverRegistry> network_observer_registry) {
  Http::HttpServerPropertiesCacheSharedPtr alternate_protocols_cache;
  if (alternate_protocol_options.has_value()) {
    // If there is configuration for an alternate protocols cache, always create one.
    alternate_protocols_cache =
        alternate_protocols_cache_manager_.getCache(alternate_protocol_options.value(), dispatcher);
  } else if (!alternate_protocol_options.has_value() &&
             (protocols.size() == 2 ||
              (protocols.size() == 1 && protocols[0] == Http::Protocol::Http2))) {
    // If there is no configuration for an alternate protocols cache, still
    // create one if there's an HTTP/2 upstream (either explicitly, or for mixed
    // HTTP/1.1 and HTTP/2 pools) to track the max concurrent streams across
    // connections.
    envoy::config::core::v3::AlternateProtocolsCacheOptions default_options;
    default_options.set_name(host->cluster().name());
    alternate_protocols_cache =
        alternate_protocols_cache_manager_.getCache(default_options, dispatcher);
  }
  absl::optional<Http::HttpServerPropertiesCache::Origin> origin =
      getOrigin(transport_socket_options, host);
  // Null-safe check: absent transport socket options means no HTTP/1.1 proxy either.
  if (protocols.size() == 3 &&
      context_.runtime().snapshot().featureEnabled("upstream.use_http3", 100) &&
      (transport_socket_options == nullptr || !transport_socket_options->http11ProxyInfo())) {
    ASSERT(contains(protocols,
                    {Http::Protocol::Http11, Http::Protocol::Http2, Http::Protocol::Http3}));
    ASSERT(alternate_protocol_options.has_value());
    ASSERT(alternate_protocols_cache);
#ifdef ENVOY_ENABLE_QUIC
    Envoy::Http::ConnectivityGrid::ConnectivityOptions coptions{protocols};
    if (quic_info == nullptr) {
      quic_info = Quic::createPersistentQuicInfoForCluster(dispatcher, host->cluster(), context_);
    }
    return std::make_unique<Http::ConnectivityGrid>(
        dispatcher, context_.api().randomGenerator(), host, priority, options,
        transport_socket_options, state, source, alternate_protocols_cache, coptions,
        quic_stat_names_, *stats_.rootScope(), *quic_info, network_observer_registry,
        context_.overloadManager());
#else
    (void)quic_info;
    (void)network_observer_registry;
    // Should be blocked by configuration checking at an earlier point.
    PANIC("unexpected");
#endif
  }
  if (protocols.size() >= 2) {
    if (origin.has_value()) {
      envoy::config::core::v3::AlternateProtocolsCacheOptions default_options;
      default_options.set_name(host->cluster().name());
      alternate_protocols_cache =
          alternate_protocols_cache_manager_.getCache(default_options, dispatcher);
    }
    ASSERT(contains(protocols, {Http::Protocol::Http11, Http::Protocol::Http2}));
    return std::make_unique<Http::HttpConnPoolImplMixed>(
        dispatcher, context_.api().randomGenerator(), host, priority, options,
        transport_socket_options, state, origin, alternate_protocols_cache,
        context_.overloadManager());
  }
  if (protocols.size() == 1 && protocols[0] == Http::Protocol::Http2 &&
      context_.runtime().snapshot().featureEnabled("upstream.use_http2", 100)) {
    return Http::Http2::allocateConnPool(dispatcher, context_.api().randomGenerator(), host,
                                         priority, options, transport_socket_options, state,
                                         context_.overloadManager(), origin,
                                         alternate_protocols_cache);
  }
  if (protocols.size() == 1 && protocols[0] == Http::Protocol::Http3 &&
      context_.runtime().snapshot().featureEnabled("upstream.use_http3", 100)) {
#ifdef ENVOY_ENABLE_QUIC
    if (quic_info == nullptr) {
      quic_info = Quic::createPersistentQuicInfoForCluster(dispatcher, host->cluster(), context_);
    }
    return Http::Http3::allocateConnPool(
        dispatcher, context_.api().randomGenerator(), host, priority, options,
        transport_socket_options, state, quic_stat_names_, {}, *stats_.rootScope(), {}, *quic_info,
        network_observer_registry, context_.overloadManager(), false);
#else
    UNREFERENCED_PARAMETER(source);
    // Should be blocked by configuration checking at an earlier point.
    PANIC("unexpected");
#endif
  }
  ASSERT(protocols.size() == 1 && protocols[0] == Http::Protocol::Http11);
  return Http::Http1::allocateConnPool(dispatcher, context_.api().randomGenerator(), host, priority,
                                       options, transport_socket_options, state,
                                       context_.overloadManager());
}
// Production factory for TCP connection pools: constructs a Tcp::ConnPoolImpl bound to
// the given dispatcher, with an optional per-pool idle timeout.
Tcp::ConnectionPool::InstancePtr ProdClusterManagerFactory::allocateTcpConnPool(
    Event::Dispatcher& dispatcher, HostConstSharedPtr host, ResourcePriority priority,
    const Network::ConnectionSocket::OptionsSharedPtr& options,
    Network::TransportSocketOptionsConstSharedPtr transport_socket_options,
    ClusterConnectivityState& state,
    absl::optional<std::chrono::milliseconds> tcp_pool_idle_timeout) {
  ENVOY_LOG_MISC(debug, "Allocating TCP conn pool");
  return std::make_unique<Tcp::ConnPoolImpl>(dispatcher, host, priority, options,
                                             transport_socket_options, state, tcp_pool_idle_timeout,
                                             context_.overloadManager());
}
// Builds a Cluster (plus its thread aware load balancer, when the cluster type supplies
// one) from the config proto by delegating to the cluster factory registry.
absl::StatusOr<std::pair<ClusterSharedPtr, ThreadAwareLoadBalancerPtr>>
ProdClusterManagerFactory::clusterFromProto(const envoy::config::cluster::v3::Cluster& cluster,
                                            Outlier::EventLoggerSharedPtr outlier_event_logger,
                                            bool added_via_api) {
  return ClusterFactoryImplBase::create(cluster, context_, dns_resolver_fn_, outlier_event_logger,
                                        added_via_api);
}
// Creates the CDS (Cluster Discovery Service) subscription API backed by `cds_config`.
absl::StatusOr<CdsApiPtr>
ProdClusterManagerFactory::createCds(const envoy::config::core::v3::ConfigSource& cds_config,
                                     const xds::core::v3::ResourceLocator* cds_resources_locator,
                                     ClusterManager& cm, bool support_multi_ads_sources) {
  // TODO(htuch): Differentiate static vs. dynamic validation visitors.
  return CdsApiImpl::create(cds_config, cds_resources_locator, cm, *stats_.rootScope(),
                            context_.messageValidationContext().dynamicValidationVisitor(),
                            context_, support_multi_ads_sources);
}
} // namespace Upstream
} // namespace Envoy