- Define a new data type, the proto file is copied for now. - Merge client and communicator into `FederatedColl`. - Define CUDA variant. - Migrate tests for CPU, add tests for CUDA.
65 lines
2.0 KiB
C++
65 lines
2.0 KiB
C++
/**
|
|
* Copyright 2023, XGBoost contributors
|
|
*/
|
|
#pragma once
|
|
|
|
#include <federated.grpc.pb.h>
|
|
#include <federated.pb.h>
|
|
|
|
#include <cstdint> // for int32_t
|
|
#include <memory> // for unique_ptr
|
|
#include <string> // for string
|
|
|
|
#include "../../src/collective/comm.h" // for Comm
|
|
#include "../../src/common/json_utils.h" // for OptionalArg
|
|
#include "xgboost/json.h"
|
|
|
|
namespace xgboost::collective {
|
|
class FederatedComm : public Comm {
|
|
std::shared_ptr<federated::Federated::Stub> stub_;
|
|
|
|
void Init(std::string const& host, std::int32_t port, std::int32_t world, std::int32_t rank,
|
|
std::string const& server_cert, std::string const& client_key,
|
|
std::string const& client_cert);
|
|
|
|
protected:
|
|
explicit FederatedComm(std::shared_ptr<FederatedComm const> that) : stub_{that->stub_} {
|
|
this->rank_ = that->Rank();
|
|
this->world_ = that->World();
|
|
|
|
this->tracker_ = that->TrackerInfo();
|
|
}
|
|
|
|
public:
|
|
/**
|
|
* @param config
|
|
*
|
|
* - federated_server_address: Tracker address
|
|
* - federated_world_size: The number of workers
|
|
* - federated_rank: Rank of federated worker
|
|
* - federated_server_cert_path
|
|
* - federated_client_key_path
|
|
* - federated_client_cert_path
|
|
*/
|
|
explicit FederatedComm(Json const& config);
|
|
explicit FederatedComm(std::string const& host, std::int32_t port, std::int32_t world,
|
|
std::int32_t rank) {
|
|
this->Init(host, port, world, rank, {}, {}, {});
|
|
}
|
|
~FederatedComm() override { stub_.reset(); }
|
|
|
|
[[nodiscard]] std::shared_ptr<Channel> Chan(std::int32_t) const override {
|
|
LOG(FATAL) << "peer to peer communication is not allowed for federated learning.";
|
|
return nullptr;
|
|
}
|
|
[[nodiscard]] Result LogTracker(std::string msg) const override {
|
|
LOG(CONSOLE) << msg;
|
|
return Success();
|
|
}
|
|
[[nodiscard]] bool IsFederated() const override { return true; }
|
|
[[nodiscard]] federated::Federated::Stub* Handle() const { return stub_.get(); }
|
|
|
|
Comm* MakeCUDAVar(Context const* ctx, std::shared_ptr<Coll> pimpl) const override;
|
|
};
|
|
} // namespace xgboost::collective
|