Differential D7758 Diff 26296 native/cpp/CommonCpp/Tools/Base64.cpp

Changeset View

Standalone View

native/cpp/CommonCpp/Tools/Base64.cpp

#include "Base64.h"

#include <math.h>
#include <algorithm>
#include <array>
#include <cstddef>
#include <iterator>
#include <stdexcept>

// anonymous namespace to encapsulate internal utilities
namespace {

// Base64 alphabet: the character at position i encodes the 6-bit value i.
constexpr std::array<char, 64> encode_table{
    'A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M',
    'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U', 'V', 'W', 'X', 'Y', 'Z',
    'a', 'b', 'c', 'd', 'e', 'f', 'g', 'h', 'i', 'j', 'k', 'l', 'm',
    'n', 'o', 'p', 'q', 'r', 's', 't', 'u', 'v', 'w', 'x', 'y', 'z',
    '0', '1', '2', '3', '4', '5', '6', '7', '8', '9', '+', '/'};

// Marker stored in decode_table for every byte outside the alphabet
// (including the padding character '='). It only has to be larger than 63.
constexpr uint8_t INVALID_SEXTET = 0x64;

// Builds the reverse lookup (byte value -> 6-bit value) from encode_table so
// the two tables cannot drift apart.
constexpr std::array<uint8_t, 256> make_decode_table() {
  std::array<uint8_t, 256> table{};
  for (std::size_t i = 0; i < table.size(); ++i) {
    table[i] = INVALID_SEXTET;
  }
  for (std::size_t i = 0; i < encode_table.size(); ++i) {
    table[static_cast<uint8_t>(encode_table[i])] = static_cast<uint8_t>(i);
  }
  return table;
}

// Indexed by the unsigned value of a character; yields its 6-bit value or
// INVALID_SEXTET.
constexpr std::array<uint8_t, 256> decode_table = make_decode_table();

static_assert(decode_table['A'] == 0x00, "first alphabet entry");
static_assert(decode_table['z'] == 0x33, "last lowercase entry");
static_assert(decode_table['+'] == 0x3E, "'+' encodes 62");
static_assert(decode_table['/'] == 0x3F, "'/' encodes 63");
static_assert(decode_table['='] == INVALID_SEXTET, "padding is not data");

// Looks up a character in decode_table. The cast to uint8_t matters: `char`
// may be signed, and a negative index would read outside the table.
constexpr uint8_t sextet_of(char c) {
  return decode_table[static_cast<uint8_t>(c)];
}

// Encodes three bytes as four base64 characters.
std::array<char, 4> encode_triplet(uint8_t a, uint8_t b, uint8_t c) {
  constexpr uint32_t SIX_BIT_MASK = 0b111111;
  const uint32_t concat_bits = (static_cast<uint32_t>(a) << 16) |
      (static_cast<uint32_t>(b) << 8) | static_cast<uint32_t>(c);
  const auto x = encode_table[(concat_bits >> 18) & SIX_BIT_MASK];
  const auto y = encode_table[(concat_bits >> 12) & SIX_BIT_MASK];
  const auto z = encode_table[(concat_bits >> 6) & SIX_BIT_MASK];
  const auto w = encode_table[concat_bits & SIX_BIT_MASK];
  return {x, y, z, w};
}

// Decodes four base64 characters into three bytes.
// The characters are not validated here: a character outside the alphabet
// contributes INVALID_SEXTET and yields meaningless bytes, so callers must
// validate the input first.
std::array<uint8_t, 3> decode_quad(char a, char b, char c, char d) {
  constexpr uint32_t BYTE_MASK = 0xff;
  const uint32_t concat_bits = (static_cast<uint32_t>(sextet_of(a)) << 18) |
      (static_cast<uint32_t>(sextet_of(b)) << 12) |
      (static_cast<uint32_t>(sextet_of(c)) << 6) |
      static_cast<uint32_t>(sextet_of(d));
  const auto byte1 = static_cast<uint8_t>((concat_bits >> 16) & BYTE_MASK);
  const auto byte2 = static_cast<uint8_t>((concat_bits >> 8) & BYTE_MASK);
  const auto byte3 = static_cast<uint8_t>(concat_bits & BYTE_MASK);
  return {byte1, byte2, byte3};
}

// True when `c` belongs to the base64 alphabet ('=' does not).
inline bool is_valid_base64_char(char c) {
  return sextet_of(c) != INVALID_SEXTET;
}

// Checks that `encoded_str` can be decoded safely:
//  - the empty string is accepted;
//  - a total length of 4k + 1 is rejected;
//  - at most two '=' are allowed, and only at the very end;
//  - every remaining character must belong to the alphabet;
//  - the number of data characters must not be 4k + 1, because a single
//    leftover character carries only 6 bits and cannot form a byte.
// Padding is otherwise optional ("TQ" and "TQ==" are both accepted).
inline bool is_valid_base64_str(const std::string_view encoded_str) {
  if (encoded_str.empty()) {
    return true;
  }
  if ((encoded_str.size() % 4) == 1) {
    return false;
  }

  // The size is at least 2 from here on, so size() - 2 is a valid index.
  std::size_t padding = 0;
  if (encoded_str.back() == '=') {
    padding = (encoded_str[encoded_str.size() - 2] == '=') ? 2 : 1;
  }

  const auto payload = encoded_str.substr(0, encoded_str.size() - padding);
  if ((payload.size() % 4) == 1) {
    return false;
  }

  return std::all_of(payload.begin(), payload.end(), is_valid_base64_char);
}

} // anonymous namespace

		namespace comm {

std::string Base64::encode(const std::vector<uint8_t> &data) {		std::string Base64::encode(const std::vector<uint8_t> &data) {
const auto size = data.size();		const auto size = data.size();
const auto remainder = size % 3;		const auto remainder = size % 3;
const auto baseLength = size - remainder;		const auto baseLength = size - remainder;

// three bytes are encoded by 4 base64 chars		// three bytes are encoded by 4 base64 chars
std::string encoded;		std::string encoded;
encoded.reserve(4 * ceil(size / 3));		encoded.reserve(4 * ceil(size / 3));
Show All 12 Lines	if (remainder == 1) {
auto it = data.end() - 2;		auto it = data.end() - 2;
const auto b64_chars = encode_triplet(it, (it + 1), 0x00);		const auto b64_chars = encode_triplet(it, (it + 1), 0x00);
std::copy_n(begin(b64_chars), 3, back_inserter(encoded));		std::copy_n(begin(b64_chars), 3, back_inserter(encoded));
encoded.push_back('=');		encoded.push_back('=');
}		}
return encoded;		return encoded;
}		}

		std::vector<uint8_t> Base64::decode(const std::string_view base64String) {
		if (base64String.size() == 0) {
		return std::vector<uint8_t>{};
		}
		if (!is_valid_base64_str(base64String)) {
		throw std::runtime_error("Invalid base64 string");
		kamilUnsubmitted Not Done Inline Actions I think there was some discussion that initialization with curly brackets`{}` is better, but I can not find it right now kamil: I think there was some discussion that initialization with curly brackets`{}` is better, but I…
		atulUnsubmitted Not Done Inline Actions Here's the snippet I read that encouraged braced initialization as a "best practice": In practice we use all sorts of initialization in our C++ code, but we did say in our C++ coding standards that we "prefer braced initialization": https://www.notion.so/commapp/C-coding-standards-8c9f22b4b16a41c3a868eb5f537db1de?pvs=4#7de58b7ac3c0402bbae2a4e3b6b6738c atul: Here's the snippet I read that encouraged braced initialization as a "best practice": {F539399}…
		}

		const auto unpadded = base64String.substr(0, base64String.find_first_of('='));
		const auto full_quadruples = unpadded.size() / 4;

		// 4 base64 characters encode 3 bytes
		std::vector<uint8_t> decoded_bytes;
		decoded_bytes.reserve((full_quadruples + 1) * 3);

		for (size_t i = 0; i < full_quadruples; i++) {
		const auto quad = unpadded.substr(i * 4, 4);
		const auto bytes = decode_quad(quad[0], quad[1], quad[2], quad[3]);
		std::copy(begin(bytes), end(bytes), back_inserter(decoded_bytes));
		}

		const auto last_quad = unpadded.substr(full_quadruples * 4);
		if (last_quad.size() == 0) {
		return decoded_bytes;
		}

		// handle padding
		if ((last_quad.size() == 2) \|\| (last_quad[2] == '=')) {
		const auto bytes = decode_quad(last_quad[0], last_quad[1], 'A', 'A');
		decoded_bytes.push_back(bytes[0]);
		} else {
		const auto bytes =
		decode_quad(last_quad[0], last_quad[1], last_quad[2], 'A');
		std::copy_n(begin(bytes), 2, back_inserter(decoded_bytes));
		}

		return decoded_bytes;
		}

} // namespace comm		} // namespace comm