#pragma once #include #include #include #include #include #include #include #include #include #include namespace DB { /** Container for set of columns for bunch of rows in memory. * This is unit of data processing. * Also contains metadata - data types of columns and their names * (either original names from a table, or generated names during temporary calculations). * Allows to insert, remove columns in arbitrary position, to change order of columns. */ class Block { private: using Container = ColumnsWithTypeAndName; using IndexByName = std::unordered_map; Container data; IndexByName index_by_name; public: BlockInfo info; Block() = default; Block(std::initializer_list il); Block(const ColumnsWithTypeAndName & data_); /// NOLINT Block(ColumnsWithTypeAndName && data_); /// NOLINT /// insert the column at the specified position void insert(size_t position, ColumnWithTypeAndName elem); /// insert the column to the end void insert(ColumnWithTypeAndName elem); /// insert the column to the end, if there is no column with that name yet void insertUnique(ColumnWithTypeAndName elem); /// remove the column at the specified position void erase(size_t position); /// remove the columns at the specified positions void erase(const std::set & positions); /// remove the column with the specified name void erase(const String & name); /// References are invalidated after calling functions above. ColumnWithTypeAndName & getByPosition(size_t position) { return data[position]; } const ColumnWithTypeAndName & getByPosition(size_t position) const { return data[position]; } ColumnWithTypeAndName & safeGetByPosition(size_t position); const ColumnWithTypeAndName & safeGetByPosition(size_t position) const; ColumnWithTypeAndName* findByName(const std::string & name, bool case_insensitive = false) { return const_cast( const_cast(this)->findByName(name, case_insensitive)); } const ColumnWithTypeAndName * findByName(const std::string & name, bool case_insensitive = false) const; ColumnWithTypeAndName & getByName(const std::string & name, bool case_insensitive = false) { return const_cast( const_cast(this)->getByName(name, case_insensitive)); } const ColumnWithTypeAndName & getByName(const std::string & name, bool case_insensitive = false) const; Container::iterator begin() { return data.begin(); } Container::iterator end() { return data.end(); } Container::const_iterator begin() const { return data.begin(); } Container::const_iterator end() const { return data.end(); } Container::const_iterator cbegin() const { return data.cbegin(); } Container::const_iterator cend() const { return data.cend(); } bool has(const std::string & name, bool case_insensitive = false) const; size_t getPositionByName(const std::string & name) const; const ColumnsWithTypeAndName & getColumnsWithTypeAndName() const; NamesAndTypesList getNamesAndTypesList() const; NamesAndTypes getNamesAndTypes() const; Names getNames() const; DataTypes getDataTypes() const; Names getDataTypeNames() const; /// Hash table match `column name -> position in the block`. using NameMap = ::google::dense_hash_map; NameMap getNamesToIndexesMap() const; Serializations getSerializations() const; Serializations getSerializations(const SerializationInfoByName & hints) const; /// Returns number of rows from first column in block, not equal to nullptr. If no columns, returns 0. size_t rows() const; size_t columns() const { return data.size(); } /// Checks that every column in block is not nullptr and has same number of elements. void checkNumberOfRows(bool allow_null_columns = false) const; /// Approximate number of bytes in memory - for profiling and limits. size_t bytes() const; /// Approximate number of allocated bytes in memory - for profiling and limits. size_t allocatedBytes() const; explicit operator bool() const { return !!columns(); } bool operator!() const { return !this->operator bool(); } /// NOLINT /** Get a list of column names separated by commas. */ std::string dumpNames() const; /** List of names, types and lengths of columns. Designed for debugging. */ std::string dumpStructure() const; /** List of column names and positions from index */ std::string dumpIndex() const; /** Get the same block, but empty. */ Block cloneEmpty() const; Columns getColumns() const; void setColumns(const Columns & columns); void setColumn(size_t position, ColumnWithTypeAndName column); Block cloneWithColumns(const Columns & columns) const; Block cloneWithoutColumns() const; Block cloneWithCutColumns(size_t start, size_t length) const; /** Get empty columns with the same types as in block. */ MutableColumns cloneEmptyColumns() const; /** Get columns from block for mutation. Columns in block will be nullptr. */ MutableColumns mutateColumns(); /** Replace columns in a block */ void setColumns(MutableColumns && columns); Block cloneWithColumns(MutableColumns && columns) const; /** Get a block with columns that have been rearranged in the order of their names. */ Block sortColumns() const; /** See IColumn::shrinkToFit() */ Block shrinkToFit() const; Block compress() const; Block decompress() const; void clear(); void swap(Block & other) noexcept; /** Updates SipHash of the Block, using update method of columns. * Returns hash for block, that could be used to differentiate blocks * with same structure, but different data. */ void updateHash(SipHash & hash) const; private: void eraseImpl(size_t position); void initializeIndexByName(); void reserve(size_t count); /// This is needed to allow function execution over data. /// It is safe because functions does not change column names, so index is unaffected. /// It is temporary. friend class ExpressionActions; friend class ActionsDAG; }; using BlockPtr = std::shared_ptr; using Blocks = std::vector; using BlocksList = std::list; using BlocksPtr = std::shared_ptr; /// Extends block with extra data in derived classes struct ExtraBlock { Block block; bool empty() const { return !block; } }; using ExtraBlockPtr = std::shared_ptr; /// Compare number of columns, data types, column types, column names, and values of constant columns. bool blocksHaveEqualStructure(const Block & lhs, const Block & rhs); /// Throw exception when blocks are different. void assertBlocksHaveEqualStructure(const Block & lhs, const Block & rhs, std::string_view context_description); /// Actual header is compatible to desired if block have equal structure except constants. /// It is allowed when column from actual header is constant, but in desired is not. /// If both columns are constant, it is checked that they have the same value. bool isCompatibleHeader(const Block & actual, const Block & desired); void assertCompatibleHeader(const Block & actual, const Block & desired, std::string_view context_description); /// Calculate difference in structure of blocks and write description into output strings. NOTE It doesn't compare values of constant columns. void getBlocksDifference(const Block & lhs, const Block & rhs, std::string & out_lhs_diff, std::string & out_rhs_diff); void convertToFullIfSparse(Block & block); /// Converts columns-constants to full columns ("materializes" them). Block materializeBlock(const Block & block); void materializeBlockInplace(Block & block); Block concatenateBlocks(const std::vector & blocks); }