Initial support for federated learning (#7831)
Federated learning plugin for xgboost: * A gRPC server to aggregate MPI-style requests (allgather, allreduce, broadcast) from federated workers. * A Rabit engine for the federated environment. * Integration test to simulate federated learning. Additional followups are needed to address GPU support, better security, and privacy, etc.
This commit is contained in:
104
plugin/federated/federated_client.h
Normal file
104
plugin/federated/federated_client.h
Normal file
@@ -0,0 +1,104 @@
|
||||
/*!
|
||||
* Copyright 2022 XGBoost contributors
|
||||
*/
|
||||
#pragma once
|
||||
#include <federated.grpc.pb.h>
|
||||
#include <federated.pb.h>
|
||||
#include <grpcpp/grpcpp.h>
|
||||
|
||||
#include <cstdio>
|
||||
#include <cstdlib>
|
||||
#include <string>
|
||||
|
||||
namespace xgboost {
|
||||
namespace federated {
|
||||
|
||||
/**
|
||||
* @brief A wrapper around the gRPC client.
|
||||
*/
|
||||
class FederatedClient {
|
||||
public:
|
||||
FederatedClient(std::string const &server_address, int rank, std::string const &server_cert,
|
||||
std::string const &client_key, std::string const &client_cert)
|
||||
: stub_{[&] {
|
||||
grpc::SslCredentialsOptions options;
|
||||
options.pem_root_certs = server_cert;
|
||||
options.pem_private_key = client_key;
|
||||
options.pem_cert_chain = client_cert;
|
||||
return Federated::NewStub(
|
||||
grpc::CreateChannel(server_address, grpc::SslCredentials(options)));
|
||||
}()},
|
||||
rank_{rank} {}
|
||||
|
||||
/** @brief Insecure client for testing only. */
|
||||
FederatedClient(std::string const &server_address, int rank)
|
||||
: stub_{Federated::NewStub(
|
||||
grpc::CreateChannel(server_address, grpc::InsecureChannelCredentials()))},
|
||||
rank_{rank} {}
|
||||
|
||||
std::string Allgather(std::string const &send_buffer) {
|
||||
AllgatherRequest request;
|
||||
request.set_sequence_number(sequence_number_++);
|
||||
request.set_rank(rank_);
|
||||
request.set_send_buffer(send_buffer);
|
||||
|
||||
AllgatherReply reply;
|
||||
grpc::ClientContext context;
|
||||
grpc::Status status = stub_->Allgather(&context, request, &reply);
|
||||
|
||||
if (status.ok()) {
|
||||
return reply.receive_buffer();
|
||||
} else {
|
||||
std::cout << status.error_code() << ": " << status.error_message() << '\n';
|
||||
throw std::runtime_error("Allgather RPC failed");
|
||||
}
|
||||
}
|
||||
|
||||
std::string Allreduce(std::string const &send_buffer, DataType data_type,
|
||||
ReduceOperation reduce_operation) {
|
||||
AllreduceRequest request;
|
||||
request.set_sequence_number(sequence_number_++);
|
||||
request.set_rank(rank_);
|
||||
request.set_send_buffer(send_buffer);
|
||||
request.set_data_type(data_type);
|
||||
request.set_reduce_operation(reduce_operation);
|
||||
|
||||
AllreduceReply reply;
|
||||
grpc::ClientContext context;
|
||||
grpc::Status status = stub_->Allreduce(&context, request, &reply);
|
||||
|
||||
if (status.ok()) {
|
||||
return reply.receive_buffer();
|
||||
} else {
|
||||
std::cout << status.error_code() << ": " << status.error_message() << '\n';
|
||||
throw std::runtime_error("Allreduce RPC failed");
|
||||
}
|
||||
}
|
||||
|
||||
std::string Broadcast(std::string const &send_buffer, int root) {
|
||||
BroadcastRequest request;
|
||||
request.set_sequence_number(sequence_number_++);
|
||||
request.set_rank(rank_);
|
||||
request.set_send_buffer(send_buffer);
|
||||
request.set_root(root);
|
||||
|
||||
BroadcastReply reply;
|
||||
grpc::ClientContext context;
|
||||
grpc::Status status = stub_->Broadcast(&context, request, &reply);
|
||||
|
||||
if (status.ok()) {
|
||||
return reply.receive_buffer();
|
||||
} else {
|
||||
std::cout << status.error_code() << ": " << status.error_message() << '\n';
|
||||
throw std::runtime_error("Broadcast RPC failed");
|
||||
}
|
||||
}
|
||||
|
||||
private:
|
||||
std::unique_ptr<Federated::Stub> const stub_;
|
||||
int const rank_;
|
||||
uint64_t sequence_number_{};
|
||||
};
|
||||
|
||||
} // namespace federated
|
||||
} // namespace xgboost
|
||||
Reference in New Issue
Block a user