2017-04-25 17:15:31 +02:00
/* -------------------------------------------------------------------------- */
2021-02-09 16:07:56 +01:00
/* Copyright 2002-2021, OpenNebula Project, OpenNebula Systems */
2017-04-25 17:15:31 +02:00
/* */
/* Licensed under the Apache License, Version 2.0 (the "License"); you may */
/* not use this file except in compliance with the License. You may obtain */
/* a copy of the License at */
/* */
/* http://www.apache.org/licenses/LICENSE-2.0 */
/* */
/* Unless required by applicable law or agreed to in writing, software */
/* distributed under the License is distributed on an "AS IS" BASIS, */
/* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. */
/* See the License for the specific language governing permissions and */
/* limitations under the License. */
/* -------------------------------------------------------------------------- */
# ifndef RAFT_MANAGER_H_
# define RAFT_MANAGER_H_
2020-07-24 16:00:59 +02:00
# include "Listener.h"
2017-04-27 01:03:44 +02:00
# include "ReplicaManager.h"
# include "ReplicaRequest.h"
2017-05-14 23:48:46 +02:00
# include "Template.h"
2019-09-09 14:43:51 +02:00
# include "ExecuteHook.h"
2017-04-25 17:15:31 +02:00
2019-12-10 11:45:15 +01:00
class LogDBRecord ;
2017-04-25 17:15:31 +02:00
/* -------------------------------------------------------------------------- */
/* -------------------------------------------------------------------------- */
2020-07-24 16:00:59 +02:00
class RaftManager
2017-04-25 17:15:31 +02:00
{
public :
2017-04-27 01:03:44 +02:00
/**
* State of this server
*/
enum State {
SOLO = 0 ,
CANDIDATE = 1 ,
FOLLOWER = 2 ,
LEADER = 3
} ;
2017-05-02 17:57:55 +02:00
/**
* Raft manager constructor
* @ param server_id of this server
2017-05-18 16:36:26 +02:00
* @ param leader_hook_mad to be executed when follower - > leader
* @ param follower_hook_mad to be executed when leader - > follower
2017-05-02 17:57:55 +02:00
* @ param log_purge period to purge logDB records
* @ param bcast heartbeat broadcast timeout
* @ param election timeout
* @ param xmlrpc timeout for RAFT related xmlrpc API calls
* */
2017-05-18 16:36:26 +02:00
RaftManager ( int server_id , const VectorAttribute * leader_hook_mad ,
const VectorAttribute * follower_hook_mad , time_t log_purge ,
long long bcast , long long election , time_t xmlrpc ,
2020-07-02 22:42:10 +02:00
const std : : string & remotes_location ) ;
2017-04-25 17:15:31 +02:00
2020-09-15 11:16:00 +02:00
~ RaftManager ( ) = default ;
2017-04-25 17:15:31 +02:00
2017-04-27 01:03:44 +02:00
// -------------------------------------------------------------------------
2017-04-28 22:23:32 +02:00
// Raft associated actions (synchronous)
2017-04-27 01:03:44 +02:00
// -------------------------------------------------------------------------
2017-04-25 17:15:31 +02:00
/**
2017-04-28 22:23:32 +02:00
* Follower successfully replicated a log entry :
* - Increment next entry to send to follower
* - Update match entry on follower
* - Evaluate majority to apply changes to DB
2017-04-25 17:15:31 +02:00
*/
2017-05-16 17:08:24 +02:00
void replicate_success ( int follower_id ) ;
2017-04-25 17:15:31 +02:00
2017-04-27 01:03:44 +02:00
/**
2017-04-28 22:23:32 +02:00
* Follower failed to replicate a log entry because an inconsistency was
* detected ( same index , different term ) :
* - Decrease follower next_index
* - Retry ( do not wait for replica events )
2017-04-27 01:03:44 +02:00
*/
2017-05-16 17:08:24 +02:00
void replicate_failure ( int follower_id ) ;
2017-04-27 01:03:44 +02:00
/**
* Triggers a REPLICATE event , it will notify the replica threads to
* send the log to the followers
*/
2017-04-28 22:23:32 +02:00
void replicate_log ( ReplicaRequest * rr ) ;
2017-04-27 01:03:44 +02:00
2018-09-06 17:22:52 +02:00
/**
* Allocate a replica request fot the given index .
* @ param rindex of the record for the request
*/
2020-07-24 16:00:59 +02:00
void replicate_allocate ( uint64_t rindex )
2017-04-25 17:15:31 +02:00
{
2020-07-24 16:00:59 +02:00
requests . allocate ( rindex ) ;
2017-04-25 17:15:31 +02:00
}
2017-04-27 01:03:44 +02:00
/**
2020-07-24 16:00:59 +02:00
* Termination function
2017-04-27 01:03:44 +02:00
*/
2020-07-24 16:00:59 +02:00
void finalize ( ) ;
2017-04-25 17:15:31 +02:00
2017-04-27 01:03:44 +02:00
// -------------------------------------------------------------------------
// Raft state query functions
// -------------------------------------------------------------------------
2017-05-03 20:04:42 +02:00
/**
2017-05-06 00:17:27 +02:00
* Return the Raft status in XML format
* @ return xml document with the raft state
*/
std : : string & to_xml ( std : : string & state_xml ) ;
/**
2017-05-03 20:04:42 +02:00
* Makes this server follower . Stop associated replication facilities
*/
void follower ( unsigned int term ) ;
2020-05-15 16:15:52 +02:00
static std : : string state_to_str ( State _state )
{
2020-07-02 22:42:10 +02:00
std : : string st ;
2020-05-15 16:15:52 +02:00
switch ( _state )
{
case SOLO :
st = " SOLO " ;
break ;
case CANDIDATE :
st = " CANDIDATE " ;
break ;
case FOLLOWER :
st = " FOLLOWER " ;
break ;
case LEADER :
st = " LEADER " ;
break ;
}
return st ;
}
State get_state ( )
{
2020-07-24 16:00:59 +02:00
std : : lock_guard < std : : mutex > lock ( raft_mutex ) ;
2020-05-15 16:15:52 +02:00
2020-07-24 16:00:59 +02:00
return state ;
2020-05-15 16:15:52 +02:00
}
2017-04-27 01:03:44 +02:00
unsigned int get_term ( )
{
2020-07-24 16:00:59 +02:00
std : : lock_guard < std : : mutex > lock ( raft_mutex ) ;
2017-04-27 01:03:44 +02:00
2020-07-24 16:00:59 +02:00
return term ;
2017-04-27 01:03:44 +02:00
}
2019-04-08 17:43:12 +02:00
uint64_t get_commit ( )
2017-04-27 01:03:44 +02:00
{
2020-07-24 16:00:59 +02:00
std : : lock_guard < std : : mutex > lock ( raft_mutex ) ;
2017-04-27 01:03:44 +02:00
2020-07-24 16:00:59 +02:00
return commit ;
2017-04-27 01:03:44 +02:00
}
2020-07-24 16:00:59 +02:00
/**
2017-05-06 23:36:08 +02:00
* Update the commit index = min ( leader_commit , log index ) .
2020-07-24 16:00:59 +02:00
* @ param leader_commit index sent by leader in a replicate xml - rpc call
* @ param index of the last record inserted in the database
* @ return the updated commit index
*/
uint64_t update_commit ( uint64_t leader_commit , uint64_t index ) ;
2017-04-27 01:03:44 +02:00
2017-05-02 23:43:18 +02:00
/**
* Evaluates a vote request . It is granted if no vote has been granted in
* this term or it is requested by the same candidate .
* @ param _votedfor the candidate id
* @ return - 1 if vote is not granted
*/
int update_votedfor ( int _votedfor ) ;
2020-07-24 16:00:59 +02:00
/**
* Update the last_heartbeat time recieved from server . It stores the id
2017-05-08 10:12:49 +02:00
* of the leader .
* @ param leader_id id of server , - 1 if there is no leader set ( e . g .
* during a election because a vote request was received )
2020-07-24 16:00:59 +02:00
*/
void update_last_heartbeat ( int leader_id ) ;
2017-04-30 19:56:47 +02:00
2017-04-27 01:03:44 +02:00
/**
2017-04-27 12:42:09 +02:00
* @ return true if the server is the leader of the zone , runs in solo mode
2020-07-24 16:00:59 +02:00
* or is a follower
2017-04-27 01:03:44 +02:00
*/
2017-04-27 12:42:09 +02:00
bool is_leader ( )
2017-04-27 01:03:44 +02:00
{
2020-07-24 16:00:59 +02:00
return test_state ( LEADER ) ;
2017-04-27 12:42:09 +02:00
}
2017-04-27 01:03:44 +02:00
2017-04-27 12:42:09 +02:00
bool is_follower ( )
{
2020-07-24 16:00:59 +02:00
return test_state ( FOLLOWER ) ;
2017-04-27 01:03:44 +02:00
}
2017-05-05 15:46:57 +02:00
bool is_candidate ( )
{
return test_state ( CANDIDATE ) ;
}
2017-04-28 22:46:37 +02:00
bool is_solo ( )
{
return test_state ( SOLO ) ;
}
2018-01-08 00:32:52 +01:00
bool is_reconciling ( )
{
bool _reconciling ;
2020-07-24 16:00:59 +02:00
std : : lock_guard < std : : mutex > lock ( raft_mutex ) ;
2018-01-08 00:32:52 +01:00
_reconciling = reconciling ;
return _reconciling ;
}
2017-04-27 01:03:44 +02:00
/**
* Get next index to send to the follower
* @ param follower server id
2019-04-15 16:26:44 +02:00
* @ return UINT64_MAX on failure , the next index if success
2017-04-27 01:03:44 +02:00
*/
2019-04-08 17:43:12 +02:00
uint64_t get_next_index ( int follower_id )
2017-04-27 01:03:44 +02:00
{
2019-04-15 16:26:44 +02:00
uint64_t _index = UINT64_MAX ;
2017-04-27 01:03:44 +02:00
2020-07-24 16:00:59 +02:00
std : : lock_guard < std : : mutex > lock ( raft_mutex ) ;
2017-04-27 01:03:44 +02:00
2020-09-17 11:10:55 +02:00
auto it = next . find ( follower_id ) ;
2017-04-27 01:03:44 +02:00
if ( it ! = next . end ( ) )
{
_index = it - > second ;
}
return _index ;
}
2017-05-08 19:48:41 +02:00
/**
* Gets the endpoint for xml - rpc calls of the current leader
* @ param endpoint
* @ return 0 on success , - 1 if no leader found
*/
int get_leader_endpoint ( std : : string & endpoint ) ;
2017-04-30 19:56:47 +02:00
// -------------------------------------------------------------------------
// XML-RPC Raft API calls
// -------------------------------------------------------------------------
/**
* Calls the follower xml - rpc method
2020-07-24 16:00:59 +02:00
* @ param follower_id to make the call
2017-04-30 19:56:47 +02:00
* @ param lr the record to replicate
* @ param success of the xml - rpc method
* @ param ft term in the follower as returned by the replicate call
2020-07-24 16:00:59 +02:00
* @ param error describing error if any
2017-04-30 19:56:47 +02:00
* @ return - 1 if a XMl - RPC ( network ) error occurs , 0 otherwise
*/
2020-07-24 16:00:59 +02:00
int xmlrpc_replicate_log ( int follower_id , LogDBRecord * lr , bool & success ,
unsigned int & ft , std : : string & error ) ;
2017-04-30 19:56:47 +02:00
2017-05-03 20:04:42 +02:00
/**
* Calls the request vote xml - rpc method
2020-07-24 16:00:59 +02:00
* @ param follower_id to make the call
2017-05-03 20:04:42 +02:00
* @ param lindex highest last log index
* @ param lterm highest last log term
* @ param success of the xml - rpc method
* @ param ft term in the follower as returned by the replicate call
2020-07-24 16:00:59 +02:00
* @ param error describing error if any
2017-05-03 20:04:42 +02:00
* @ return - 1 if a XMl - RPC ( network ) error occurs , 0 otherwise
*/
2019-04-08 17:43:12 +02:00
int xmlrpc_request_vote ( int follower_id , uint64_t lindex ,
2017-05-03 20:04:42 +02:00
unsigned int lterm , bool & success , unsigned int & fterm ,
std : : string & error ) ;
2017-04-30 19:56:47 +02:00
// -------------------------------------------------------------------------
// Server related interface
// -------------------------------------------------------------------------
2017-05-02 17:57:55 +02:00
/**
* Adds a new server to the follower list and starts associated replica
* thread .
* @ param follower_id id of new server
2017-05-23 13:31:18 +02:00
* @ param xmlep xmlrpc endpoint for new server
2017-05-02 17:57:55 +02:00
*/
2020-07-24 16:00:59 +02:00
void add_server ( int follower_id , const std : : string & xmlep ) ;
2017-05-02 01:38:30 +02:00
2017-05-02 17:57:55 +02:00
/**
* Deletes a new server to the follower list and stops associated replica
* thread .
* @ param follower_id id of server
*/
2020-07-24 16:00:59 +02:00
void delete_server ( int follower_id ) ;
2017-04-30 19:56:47 +02:00
2018-06-20 17:58:19 +02:00
/**
* Reset index for a follower .
* @ param follower_id id of server
*/
2020-07-24 16:00:59 +02:00
void reset_index ( int follower_id ) ;
2018-06-20 17:58:19 +02:00
2017-04-25 17:15:31 +02:00
private :
2020-07-24 16:00:59 +02:00
std : : mutex raft_mutex ;
2017-04-25 17:15:31 +02:00
2017-04-27 01:03:44 +02:00
/**
* Clients waiting for a log replication
*/
2018-07-30 13:14:14 +02:00
ReplicaRequestMap requests ;
2017-08-03 12:28:48 +02:00
2017-04-27 01:03:44 +02:00
// -------------------------------------------------------------------------
// Raft state
// -------------------------------------------------------------------------
/**
* Server state
*/
State state ;
2020-07-24 16:00:59 +02:00
/**
* Server id
*/
int server_id ;
2017-04-30 19:56:47 +02:00
2017-04-27 01:03:44 +02:00
/**
* Current term
*/
unsigned int term ;
2017-04-28 19:35:57 +02:00
/**
* Number of servers in zone
*/
unsigned int num_servers ;
2020-07-24 16:00:59 +02:00
/**
* Time when the last heartbeat was sent ( LEADER ) or received ( FOLLOWER )
*/
struct timespec last_heartbeat ;
2017-04-29 23:25:53 +02:00
2017-05-02 23:43:18 +02:00
/**
* ID of the last candidate we voted for ( - 1 if none )
*/
int votedfor ;
2017-05-08 10:12:49 +02:00
/**
* ID of leader for the current term
*/
int leader_id ;
2017-05-02 23:43:18 +02:00
/**
* This is the raft persistent state : votedfor and current term . It is
* stored along the log in a special record ( 0 , - 1 , TEMPLATE , 0 )
*/
Template raft_state ;
2019-04-08 17:43:12 +02:00
/**
* Value for name column in system_attributes table for raft state .
*/
2020-07-02 22:42:10 +02:00
static const std : : string raft_state_name ;
2019-04-08 17:43:12 +02:00
2018-01-08 00:32:52 +01:00
/**
* After becoming a leader it is replicating and applying any pending
* log entry .
*/
bool reconciling ;
2017-05-02 01:38:30 +02:00
//--------------------------------------------------------------------------
// Timers
// - timer_period_ms. Base timer to wake up the manager (10ms)
// - purge_period_ms. How often the LogDB is purged (600s)
// - xmlrpc_timeout. To timeout xml-rpc api calls to replicate log
2020-07-24 16:00:59 +02:00
// - election_timeout. Timeout leader heartbeats (followers)
// - broadcast_timeout. To send heartbeat to followers (leader)
2017-05-02 01:38:30 +02:00
//--------------------------------------------------------------------------
2017-04-30 19:56:47 +02:00
static const time_t timer_period_ms ;
2017-05-02 01:38:30 +02:00
2017-05-02 17:57:55 +02:00
time_t purge_period_ms ;
2017-04-30 19:56:47 +02:00
2017-05-02 17:57:55 +02:00
time_t xmlrpc_timeout_ms ;
2017-04-30 19:56:47 +02:00
2020-07-24 16:00:59 +02:00
struct timespec election_timeout ;
2017-04-30 19:56:47 +02:00
2020-07-24 16:00:59 +02:00
struct timespec broadcast_timeout ;
/**
* Timer action async execution
*/
Timer timer_thread ;
2017-04-29 23:25:53 +02:00
2020-09-10 09:08:29 +02:00
Timer purge_thread ;
2017-04-27 01:03:44 +02:00
//--------------------------------------------------------------------------
// Volatile log index variables
// - commit, highest log known to be committed
2017-04-27 11:12:30 +02:00
// - applied, highest log applied to DB (in LogDB)
2017-04-27 01:03:44 +02:00
//
//---------------------------- LEADER VARIABLES ----------------------------
//
// - next, next log to send to each follower <follower, next>
// - match, highest log replicated in this server <follower, match>
2020-07-24 16:00:59 +02:00
// - servers, list of servers in zone and xml-rpc edp <follower, edp>
2017-04-27 01:03:44 +02:00
// -------------------------------------------------------------------------
2017-05-14 23:48:46 +02:00
RaftReplicaManager replica_manager ;
2017-04-27 01:03:44 +02:00
2017-06-03 19:24:19 +02:00
HeartBeatManager heartbeat_manager ;
2019-04-08 17:43:12 +02:00
uint64_t commit ;
2017-04-27 01:03:44 +02:00
2019-04-08 17:43:12 +02:00
std : : map < int , uint64_t > next ;
2017-04-27 01:03:44 +02:00
2019-04-08 17:43:12 +02:00
std : : map < int , uint64_t > match ;
2017-04-27 01:03:44 +02:00
2017-05-16 17:08:24 +02:00
std : : map < int , std : : string > servers ;
2017-04-30 19:56:47 +02:00
2017-05-18 16:36:26 +02:00
// -------------------------------------------------------------------------
// Hooks
// -------------------------------------------------------------------------
2020-09-15 11:16:00 +02:00
std : : unique_ptr < ExecuteHook > leader_hook ;
std : : unique_ptr < ExecuteHook > follower_hook ;
2017-05-18 16:36:26 +02:00
2017-04-25 17:15:31 +02:00
// -------------------------------------------------------------------------
2020-07-24 16:00:59 +02:00
// Internal Raft functions
2017-04-25 17:15:31 +02:00
// -------------------------------------------------------------------------
/**
2020-09-10 09:08:29 +02:00
* This function is executed periodically to vote leader
2017-04-25 17:15:31 +02:00
*/
2020-07-24 16:00:59 +02:00
void timer_action ( ) ;
2017-04-25 17:15:31 +02:00
2020-09-10 09:08:29 +02:00
/**
* This function is executed periodically to purge the state log
*/
void purge_action ( ) ;
2017-04-29 23:25:53 +02:00
/**
2020-07-24 16:00:59 +02:00
* @ param s the state to check
* @ return true if the server states matches the provided one
2017-04-29 23:25:53 +02:00
*/
2020-07-24 16:00:59 +02:00
bool test_state ( State s )
{
2017-04-27 12:42:09 +02:00
bool _is_state ;
2020-07-24 16:00:59 +02:00
std : : lock_guard < std : : mutex > lock ( raft_mutex ) ;
2017-04-27 12:42:09 +02:00
_is_state = state = = s ;
return _is_state ;
2020-07-24 16:00:59 +02:00
}
2017-04-30 19:56:47 +02:00
2020-07-24 16:00:59 +02:00
/**
* Request votes of followers
*/
2017-05-03 20:04:42 +02:00
void request_vote ( ) ;
/**
* Makes this server leader , and start replica threads
*/
void leader ( ) ;
2019-04-08 17:43:12 +02:00
/**
* Init the raft state status row .
*/
int init_raft_state ( const std : : string & raft_xml ) ;
2017-04-25 17:15:31 +02:00
} ;
# endif /*RAFT_MANAGER_H_*/