#pragma once #include "Common/ZooKeeper/ZooKeeperCommon.h" #include "config.h" #if USE_NURAFT #include #include #include #include #include #include #include #include #include #include #include namespace DB { using ZooKeeperResponseCallback = std::function; /// Highlevel wrapper for ClickHouse Keeper. /// Process user requests via consensus and return responses. class KeeperDispatcher { private: using RequestsQueue = ConcurrentBoundedQueue; using SessionToResponseCallback = std::unordered_map; using ClusterUpdateQueue = ConcurrentBoundedQueue; /// Size depends on coordination settings std::unique_ptr requests_queue; ResponsesQueue responses_queue; SnapshotsQueue snapshots_queue{1}; /// More than 1k updates is definitely misconfiguration. ClusterUpdateQueue cluster_update_queue{1000}; mutable std::mutex session_to_response_callback_mutex; /// These two maps looks similar, but serves different purposes. /// The first map is subscription map for normal responses like /// (get, set, list, etc.). Dispatcher determines callback for each response /// using session id from this map. SessionToResponseCallback session_to_response_callback; /// But when client connects to the server for the first time it doesn't /// have session_id. It request it from server. We give temporary /// internal id for such requests just to much client with its response. SessionToResponseCallback new_session_id_response_callback; /// Reading and batching new requests from client handlers ThreadFromGlobalPool request_thread; /// Pushing responses to clients client handlers /// using session_id. ThreadFromGlobalPool responses_thread; /// Cleaning old dead sessions ThreadFromGlobalPool session_cleaner_thread; /// Dumping new snapshots to disk ThreadFromGlobalPool snapshot_thread; /// Apply or wait for configuration changes ThreadFromGlobalPool update_configuration_thread; /// RAFT wrapper. std::unique_ptr server; KeeperConnectionStats keeper_stats; KeeperConfigurationAndSettingsPtr configuration_and_settings; LoggerPtr log; /// Counter for new session_id requests. std::atomic internal_session_id_counter{0}; KeeperSnapshotManagerS3 snapshot_s3; KeeperContextPtr keeper_context; /// Thread put requests to raft void requestThread(); /// Thread put responses for subscribed sessions void responseThread(); /// Thread clean disconnected sessions from memory void sessionCleanerTask(); /// Thread create snapshots in the background void snapshotThread(); // TODO (myrrc) this should be removed once "reconfig" is stabilized void clusterUpdateWithReconfigDisabledThread(); void clusterUpdateThread(); void setResponse(int64_t session_id, const Coordination::ZooKeeperResponsePtr & response, Coordination::ZooKeeperRequestPtr request = nullptr); /// Add error responses for requests to responses queue. /// Clears requests. void addErrorResponses(const KeeperStorageBase::RequestsForSessions & requests_for_sessions, Coordination::Error error); /// Forcefully wait for result and sets errors if something when wrong. /// Clears both arguments nuraft::ptr forceWaitAndProcessResult( RaftAppendResult & result, KeeperStorageBase::RequestsForSessions & requests_for_sessions, bool clear_requests_on_success); public: std::mutex read_request_queue_mutex; /// queue of read requests that can be processed after a request with specific session ID and XID is committed std::unordered_map> read_request_queue; /// Just allocate some objects, real initialization is done by `intialize method` KeeperDispatcher(); /// Call shutdown ~KeeperDispatcher(); /// Initialization from config. /// standalone_keeper -- we are standalone keeper application (not inside clickhouse server) /// 'macros' are used to substitute macros in endpoint of disks void initialize(const Poco::Util::AbstractConfiguration & config, bool standalone_keeper, bool start_async, const MultiVersion::Version & macros); void startServer(); bool checkInit() const { return server && server->checkInit(); } /// Is server accepting requests, i.e. connected to the cluster /// and achieved quorum bool isServerActive() const; void updateConfiguration(const Poco::Util::AbstractConfiguration & config, const MultiVersion::Version & macros); void pushClusterUpdates(ClusterUpdateActions && actions); bool reconfigEnabled() const; /// Shutdown internal keeper parts (server, state machine, log storage, etc) void shutdown(); void forceRecovery(); /// Put request to ClickHouse Keeper bool putRequest(const Coordination::ZooKeeperRequestPtr & request, int64_t session_id, bool use_xid_64); /// Get new session ID int64_t getSessionID(int64_t session_timeout_ms); /// Register session and subscribe for responses with callback void registerSession(int64_t session_id, ZooKeeperResponseCallback callback); /// Call if we don't need any responses for this session no more (session was expired) void finishSession(int64_t session_id); /// Invoked when a request completes. void updateKeeperStatLatency(uint64_t process_time_ms); /// Are we leader bool isLeader() const { return server->isLeader(); } bool isFollower() const { return server->isFollower(); } bool hasLeader() const { return server->isLeaderAlive(); } bool isObserver() const { return server->isObserver(); } bool isExceedingMemorySoftLimit() const { return server->isExceedingMemorySoftLimit(); } uint64_t getLogDirSize() const; uint64_t getSnapDirSize() const; /// Request statistics such as qps, latency etc. KeeperConnectionStats & getKeeperConnectionStats() { return keeper_stats; } Keeper4LWInfo getKeeper4LWInfo() const; const IKeeperStateMachine & getStateMachine() const { return *server->getKeeperStateMachine(); } const KeeperConfigurationAndSettingsPtr & getKeeperConfigurationAndSettings() const { return configuration_and_settings; } const KeeperContextPtr & getKeeperContext() const { return keeper_context; } void incrementPacketsSent() { keeper_stats.incrementPacketsSent(); } void incrementPacketsReceived() { keeper_stats.incrementPacketsReceived(); } void resetConnectionStats() { keeper_stats.reset(); } /// Create snapshot manually, return the last committed log index in the snapshot uint64_t createSnapshot() { return server->createSnapshot(); } /// Get Raft information KeeperLogInfo getKeeperLogInfo() { return server->getKeeperLogInfo(); } /// Request to be leader. bool requestLeader() { return server->requestLeader(); } /// Yield leadership and become follower. void yieldLeadership() { server->yieldLeadership(); } void recalculateStorageStats() { server->recalculateStorageStats(); } static void cleanResources(); }; } #endif