#pragma once #include #include #include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int TOO_LARGE_STRING_SIZE; } namespace ColumnStringHelpers { /** Simplifies writing data to the ColumnString or ColumnFixedString via WriteBuffer. * * Take care of little subtle details, like padding or proper offsets. */ template class WriteHelper { ColumnType & col; WriteBufferFromVector buffer; size_t prev_row_buffer_size = 0; static ColumnType & resizeColumn(ColumnType & column, size_t rows) { if constexpr (std::is_same_v) column.resize(rows); else { column.getOffsets().reserve_exact(rows); /// Using coefficient 2 for initial size is arbitrary. column.getChars().reserve_exact(rows * 2); } return column; } public: WriteHelper(ColumnType & col_, size_t expected_rows) : col(resizeColumn(col_, expected_rows)) , buffer(col.getChars()) {} ~WriteHelper() = default; void finalize() { buffer.finalize(); } auto & getWriteBuffer() { return buffer; } void rowWritten() { if constexpr (std::is_same_v) { if (buffer.count() > prev_row_buffer_size + col.getN()) throw Exception( ErrorCodes::TOO_LARGE_STRING_SIZE, "Too large string for FixedString column"); // Pad with zeroes on the right to maintain FixedString invariant. const auto excess_bytes = buffer.count() % col.getN(); const auto fill_bytes = col.getN() - excess_bytes; writeChar(0, fill_bytes, buffer); } else { writeChar(0, buffer); col.getOffsets().push_back(buffer.count()); } prev_row_buffer_size = buffer.count(); } }; } }