#pragma once #include #include #include #include #include #include #include #include #include #include #include "DictionaryStructure.h" #include "IDictionary.h" #include "IDictionarySource.h" #include "DictionaryHelpers.h" namespace DB { class Arena; class IPAddressDictionary final : public IDictionary { public: struct Configuration { DictionaryLifetime dict_lifetime; bool require_nonempty; bool use_async_executor = false; }; IPAddressDictionary( const StorageID & dict_id_, const DictionaryStructure & dict_struct_, DictionarySourcePtr source_ptr_, Configuration configuration_); std::string getKeyDescription() const { return key_description; } std::string getTypeName() const override { return "Trie"; } size_t getBytesAllocated() const override { return bytes_allocated; } size_t getQueryCount() const override { return query_count.load(); } double getFoundRate() const override { size_t queries = query_count.load(); if (!queries) return 0; return std::min(1.0, static_cast(found_count.load()) / queries); } double getHitRate() const override { return 1.0; } size_t getElementCount() const override { return element_count; } double getLoadFactor() const override { return static_cast(element_count) / bucket_count; } std::shared_ptr clone() const override { return std::make_shared(getDictionaryID(), dict_struct, source_ptr->clone(), configuration); } DictionarySourcePtr getSource() const override { return source_ptr; } const DictionaryLifetime & getLifetime() const override { return configuration.dict_lifetime; } const DictionaryStructure & getStructure() const override { return dict_struct; } bool isInjective(const std::string & attribute_name) const override { return dict_struct.getAttribute(attribute_name).injective; } DictionaryKeyType getKeyType() const override { return DictionaryKeyType::Complex; } void convertKeyColumns(Columns & key_columns, DataTypes & key_types) const override; ColumnPtr getColumn( const std::string & attribute_name, const DataTypePtr & attribute_type, const Columns & key_columns, const DataTypes & key_types, DefaultOrFilter default_or_filter) const override; ColumnUInt8::Ptr hasKeys(const Columns & key_columns, const DataTypes & key_types) const override; Pipe read(const Names & column_names, size_t max_block_size, size_t num_streams) const override; private: template using ContainerType = std::vector; using IPAddress = Poco::Net::IPAddress; using IPv4Container = PODArray; using IPv6Container = PaddedPODArray; using IPMaskContainer = PODArray; using RowIdxConstIter = ContainerType::const_iterator; struct Attribute final { AttributeUnderlyingType type; std::variant< UInt8, UInt16, UInt32, UInt64, UInt128, UInt256, Int8, Int16, Int32, Int64, Int128, Int256, Decimal32, Decimal64, Decimal128, Decimal256, DateTime64, Float32, Float64, UUID, IPv4, IPv6, String, Array> null_values; std::variant< ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType, ContainerType> maps; std::unique_ptr string_arena; }; void createAttributes(); void loadData(); template void addAttributeSize(const Attribute & attribute); void calculateBytesAllocated(); template static void createAttributeImpl(Attribute & attribute, const Field & null_value); static Attribute createAttributeWithType(const AttributeUnderlyingType type, const Field & null_value); /// NOLINT template void getItemsByTwoKeyColumnsImpl( const Attribute & attribute, const Columns & key_columns, ValueSetter && set_value, DefaultValueExtractor & default_value_extractor) const; template size_t getItemsByTwoKeyColumnsShortCircuitImpl( const Attribute & attribute, const Columns & key_columns, ValueSetter && set_value, IColumn::Filter & default_mask) const; template void getItemsImpl( const Attribute & attribute, const Columns & key_columns, ValueSetter && set_value, DefaultValueExtractor & default_value_extractor) const; template void getItemsShortCircuitImpl( const Attribute & attribute, const Columns & key_columns, ValueSetter && set_value, IColumn::Filter & default_mask) const; template void setAttributeValueImpl(Attribute & attribute, const T value); /// NOLINT void setAttributeValue(Attribute & attribute, const Field & value); const Attribute & getAttribute(const std::string & attribute_name) const; Columns getKeyColumns() const; RowIdxConstIter ipNotFound() const; RowIdxConstIter tryLookupIPv4(UInt32 addr, uint8_t * buf) const; RowIdxConstIter tryLookupIPv6(const uint8_t * addr) const; template RowIdxConstIter lookupIP(IPValueType target) const; static const uint8_t * getIPv6FromOffset(const IPv6Container & ipv6_col, size_t i); DictionaryStructure dict_struct; const DictionarySourcePtr source_ptr; const Configuration configuration; const bool access_to_key_from_attributes; const std::string key_description{dict_struct.getKeyDescription()}; /// Contains sorted IP subnetworks. If some addresses equals, subnet with lower mask is placed first. std::variant ip_column; /// Prefix lengths corresponding to ip_column. IPMaskContainer mask_column; /** Contains links to parent subnetworks in ip_column. * Array holds such ip_column's (and mask_column's) indices that * - if parent_subnet[i] < i, then ip_column[i] is subnetwork of ip_column[parent_subnet[i]], * - if parent_subnet[i] == i, then ip_column[i] doesn't belong to any other subnet. */ ContainerType parent_subnet; /// Contains corresponding indices in attributes array. ContainerType row_idx; std::map attribute_index_by_name; std::vector attributes; size_t bytes_allocated = 0; size_t element_count = 0; size_t bucket_count = 0; mutable std::atomic query_count{0}; mutable std::atomic found_count{0}; LoggerPtr logger; }; }