#pragma once #include #include #include #include #include #include namespace CurrentMetrics { extern const Metric QueryPreempted; } namespace DB { /** Implements query priorities in very primitive way. * Allows to freeze query execution if at least one query of higher priority is executed. * * Priority value is integer, smaller means higher priority. * * Priority 0 is special - queries with that priority is always executed, * not depends on other queries and not affect other queries. * Thus 0 means - don't use priorities. * * NOTE Possibilities for improvement: * - implement limit on maximum number of running queries with same priority. */ class QueryPriorities { public: using Priority = size_t; private: friend struct Handle; using Count = int; /// Number of currently running queries for each priority. using Container = std::map; std::mutex mutex; std::condition_variable condvar; Container container; /** If there are higher priority queries - sleep until they are finish or timeout happens. */ template void waitIfNeed(Priority priority, Duration timeout) { if (0 == priority) return; std::unique_lock lock(mutex); /// Is there at least one more priority query? bool found = false; for (const auto & value : container) { if (value.first >= priority) break; if (value.second > 0) { found = true; break; } } if (!found) return; CurrentMetrics::Increment metric_increment{CurrentMetrics::QueryPreempted}; /// Spurious wakeups are Ok. We allow to wait less than requested. condvar.wait_for(lock, timeout); } public: struct HandleImpl { private: QueryPriorities & parent; QueryPriorities::Container::value_type & value; public: HandleImpl(QueryPriorities & parent_, QueryPriorities::Container::value_type & value_) : parent(parent_), value(value_) {} ~HandleImpl() { { std::lock_guard lock(parent.mutex); --value.second; } parent.condvar.notify_all(); } template void waitIfNeed(Duration timeout) { parent.waitIfNeed(value.first, timeout); } }; using Handle = std::shared_ptr; /** Register query with specified priority. * Returns an object that remove record in destructor. */ Handle insert(Priority priority) { if (0 == priority) return {}; std::lock_guard lock(mutex); auto it = container.emplace(priority, 0).first; ++it->second; return std::make_shared(*this, *it); } }; }