#pragma once #include #include #include #include #include #include #include #include #include #include namespace DB { namespace ErrorCodes { extern const int ILLEGAL_COLUMN; extern const int BAD_ARGUMENTS; } struct Base58Encode { static constexpr auto name = "base58Encode"; static void processString(const ColumnString & src_column, ColumnString::MutablePtr & dst_column, size_t input_rows_count) { auto & dst_data = dst_column->getChars(); auto & dst_offsets = dst_column->getOffsets(); /// Base58 has efficiency of 73% (8/11) [https://monerodocs.org/cryptography/base58/], /// and we take double scale to avoid any reallocation. size_t max_result_size = static_cast(ceil(2 * src_column.getChars().size() + 1)); dst_data.resize(max_result_size); dst_offsets.resize(input_rows_count); const ColumnString::Offsets & src_offsets = src_column.getOffsets(); const auto * src = src_column.getChars().data(); auto * dst = dst_data.data(); size_t prev_src_offset = 0; size_t current_dst_offset = 0; for (size_t row = 0; row < input_rows_count; ++row) { size_t current_src_offset = src_offsets[row]; size_t src_length = current_src_offset - prev_src_offset - 1; size_t encoded_size = encodeBase58(&src[prev_src_offset], src_length, &dst[current_dst_offset]); prev_src_offset = current_src_offset; current_dst_offset += encoded_size; dst[current_dst_offset] = 0; ++current_dst_offset; dst_offsets[row] = current_dst_offset; } dst_data.resize(current_dst_offset); } static void processFixedString(const ColumnFixedString & src_column, ColumnString::MutablePtr & dst_column, size_t input_rows_count) { auto & dst_data = dst_column->getChars(); auto & dst_offsets = dst_column->getOffsets(); /// Base58 has efficiency of 73% (8/11) [https://monerodocs.org/cryptography/base58/], /// and we take double scale to avoid any reallocation. size_t max_result_size = static_cast(ceil(2 * src_column.getChars().size() + 1)); dst_data.resize(max_result_size); dst_offsets.resize(input_rows_count); const auto * src = src_column.getChars().data(); auto * dst = dst_data.data(); size_t N = src_column.getN(); size_t current_dst_offset = 0; for (size_t row = 0; row < input_rows_count; ++row) { size_t encoded_size = encodeBase58(&src[row * N], N, &dst[current_dst_offset]); current_dst_offset += encoded_size; dst[current_dst_offset] = 0; ++current_dst_offset; dst_offsets[row] = current_dst_offset; } dst_data.resize(current_dst_offset); } }; enum class Base58DecodeErrorHandling : uint8_t { ThrowException, ReturnEmptyString }; template struct Base58Decode { static constexpr auto name = Name::name; static void processString(const ColumnString & src_column, ColumnString::MutablePtr & dst_column, size_t input_rows_count) { auto & dst_data = dst_column->getChars(); auto & dst_offsets = dst_column->getOffsets(); /// Base58 has efficiency of 73% (8/11) [https://monerodocs.org/cryptography/base58/], /// and decoded value will be no longer than source. size_t max_result_size = src_column.getChars().size() + 1; dst_data.resize(max_result_size); dst_offsets.resize(input_rows_count); const ColumnString::Offsets & src_offsets = src_column.getOffsets(); const auto * src = src_column.getChars().data(); auto * dst = dst_data.data(); size_t prev_src_offset = 0; size_t current_dst_offset = 0; for (size_t row = 0; row < input_rows_count; ++row) { size_t current_src_offset = src_offsets[row]; size_t src_length = current_src_offset - prev_src_offset - 1; std::optional decoded_size = decodeBase58(&src[prev_src_offset], src_length, &dst[current_dst_offset]); if (!decoded_size) { if constexpr (ErrorHandling == Base58DecodeErrorHandling::ThrowException) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Invalid Base58 value, cannot be decoded"); else decoded_size = 0; } prev_src_offset = current_src_offset; current_dst_offset += *decoded_size; dst[current_dst_offset] = 0; ++current_dst_offset; dst_offsets[row] = current_dst_offset; } dst_data.resize(current_dst_offset); } static void processFixedString(const ColumnFixedString & src_column, ColumnString::MutablePtr & dst_column, size_t input_rows_count) { auto & dst_data = dst_column->getChars(); auto & dst_offsets = dst_column->getOffsets(); /// Base58 has efficiency of 73% (8/11) [https://monerodocs.org/cryptography/base58/], /// and decoded value will be no longer than source. size_t max_result_size = src_column.getChars().size() + 1; dst_data.resize(max_result_size); dst_offsets.resize(input_rows_count); const auto * src = src_column.getChars().data(); auto * dst = dst_data.data(); size_t N = src_column.getN(); size_t current_dst_offset = 0; for (size_t row = 0; row < input_rows_count; ++row) { std::optional decoded_size = decodeBase58(&src[row * N], N, &dst[current_dst_offset]); if (!decoded_size) { if constexpr (ErrorHandling == Base58DecodeErrorHandling::ThrowException) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Invalid Base58 value, cannot be decoded"); else decoded_size = 0; } current_dst_offset += *decoded_size; dst[current_dst_offset] = 0; ++current_dst_offset; dst_offsets[row] = current_dst_offset; } dst_data.resize(current_dst_offset); } }; template class FunctionBase58Conversion : public IFunction { public: static constexpr auto name = Func::name; static FunctionPtr create(ContextPtr) { return std::make_shared(); } String getName() const override { return Func::name; } size_t getNumberOfArguments() const override { return 1; } bool isSuitableForShortCircuitArgumentsExecution(const DataTypesWithConstInfo & /*arguments*/) const override { return true; } bool useDefaultImplementationForConstants() const override { return true; } ColumnNumbers getArgumentsThatAreAlwaysConstant() const override { return {1}; } DataTypePtr getReturnTypeImpl(const ColumnsWithTypeAndName & arguments) const override { FunctionArgumentDescriptors args{ {"arg", static_cast(&isStringOrFixedString), nullptr, "String or FixedString"} }; validateFunctionArguments(*this, arguments, args); return std::make_shared(); } DataTypePtr getReturnTypeForDefaultImplementationForDynamic() const override { return std::make_shared(); } ColumnPtr executeImpl(const ColumnsWithTypeAndName & arguments, const DataTypePtr &, size_t input_rows_count) const override { const ColumnPtr col = arguments[0].column; if (const ColumnString * col_string = checkAndGetColumn(col.get())) { auto col_res = ColumnString::create(); Func::processString(*col_string, col_res, input_rows_count); return col_res; } else if (const ColumnFixedString * col_fixed_string = checkAndGetColumn(col.get())) { auto col_res = ColumnString::create(); Func::processFixedString(*col_fixed_string, col_res, input_rows_count); return col_res; } throw Exception( ErrorCodes::ILLEGAL_COLUMN, "Illegal column {} of first argument of function {}, must be String or FixedString", arguments[0].column->getName(), getName()); } }; }