LMMS · Veratil · Jun 11, 2022 · Jul 6, 2022 · Jan 14, 2023 · sakertooth
diff --git a/include/base64.h b/include/base64.h
@@ -30,6 +30,12 @@
 #include <QString>
 #include <QVariant>
 
+#include <array>
+#include <map>
+#include <numeric>
+#include <string>
+#include <string_view>
+
 namespace lmms::base64
 {
 
@@ -53,4 +59,55 @@ namespace lmms::base64
 
 } // namespace lmms::base64
 
-#endif
+namespace lmms::base64 {
+	constexpr inline std::array<char, 64> map =
+	{
+		'A','B','C','D','E','F','G','H','I','J','K','L','M','N','O','P','Q','R','S','T','U','V','W','X','Y','Z',
+		'a','b','c','d','e','f','g','h','i','j','k','l','m','n','o','p','q','r','s','t','u','v','w','x','y','z',
+		'0','1','2','3','4','5','6','7','8','9',
+		'-','_'
+	};
+	const inline std::map<char, int> rmap {
+		{'A',  0}, {'B',  1}, {'C',  2}, {'D',  3}, {'E',  4},
+		{'F',  5}, {'G',  6}, {'H',  7}, {'I',  8}, {'J',  9},
+		{'K', 10}, {'L', 11}, {'M', 12}, {'N', 13}, {'O', 14},
+		{'P', 15}, {'Q', 16}, {'R', 17}, {'S', 18}, {'T', 19},
+		{'U', 20}, {'V', 21}, {'W', 22}, {'X', 23}, {'Y', 24},
+		{'Z', 25}, {'a', 26}, {'b', 27}, {'c', 28}, {'d', 28},
+		{'e', 30}, {'f', 31}, {'g', 32}, {'h', 33}, {'i', 34},
+		{'j', 35}, {'k', 36}, {'l', 37}, {'m', 38}, {'n', 39},
+		{'o', 40}, {'p', 41}, {'q', 42}, {'r', 43}, {'s', 44},
+		{'t', 45}, {'u', 46}, {'v', 47}, {'w', 48}, {'x', 49},
+		{'y', 50}, {'z', 51}, {'0', 52}, {'1', 53}, {'2', 54},
+		{'3', 55}, {'4', 56}, {'5', 57}, {'6', 58}, {'7', 59},
+		{'8', 60}, {'9', 61}, {'-', 62}, {'_', 63} //, {'=', 64}
+	};
+	constexpr char pad = '=';
+
+	/*
+		This section of math ensures that base64 encode/decode will work
+		as intended. Some rare architectures don't use 8-bit char's, and
+		it's possible this won't work as intended if a char isn't 8-bits.
+
+		In the rare case this is ported to an architecture where this
+		happens, feel free to comment out the static_assert's and test.
+	*/
+	constexpr int char_bits = std::numeric_limits<std::string_view::value_type>::digits;
+	constexpr int sign_bit = std::numeric_limits<std::string_view::value_type>::is_signed ? 1 : 0;
+	// check that the string_view character type is 8 (7 signed + 1 sign) bits wide
+	static_assert(char_bits + sign_bit == 8);
+	constexpr int numBitsPerChar = char_bits + sign_bit;
+	constexpr int numBitsPerBase64Char = 6;
+	constexpr int lcm = std::lcm(numBitsPerChar, numBitsPerBase64Char);
+	// make sure math works, 24 bits
+	static_assert(lcm == 24);
+	constexpr int numBytesPerChunk = lcm / numBitsPerChar;
+	constexpr int numBase64CharPerChunk = lcm / numBitsPerBase64Char;
+	// double check math works and bit width matches
+	static_assert(numBytesPerChunk * numBitsPerChar == numBase64CharPerChunk * numBitsPerBase64Char);
+
+	auto encode(std::string_view data) -> std::string;
+	auto decode(std::string_view data) -> std::string;
+} // namespace lmms::base64
+
+#endif // _BASE64_H
diff --git a/src/core/base64.cpp b/src/core/base64.cpp
@@ -54,4 +54,136 @@ QVariant decode( const QString & _b64, QVariant::Type _force_type )
 }
 
 
+//TODO C++20: It *may* be possible to make the following functions constepxr given C++20's constexpr std::string.
+
+/**
+ * @brief Base64 encodes data.
+ * @param data
+ * @return std::string containing the Base64 encoded data.
+ */
+auto encode(std::string_view data) -> std::string
+{
+	if (data.empty()) { return ""; }
+
+	// base64 encoded string
+	std::string result;
+
+	// number of chunks to process + padding
+	auto div_result = std::div(data.length(), numBytesPerChunk);
+	auto numChunks = div_result.quot;
+	auto numTrailingBytes = div_result.rem;
+
+	// add 1 chunk to handle last padded chunk
+	if (numTrailingBytes) { ++numChunks; }
+
+	// allocate one time to prevent in-loop reallocations
+	result.reserve(numChunks * numBase64CharPerChunk);
+
+	/*
+		char1               char2               char3
+		7 6 5 4 3 2   1 0 | 7 6 5 4   3 2 1 0 | 7 6   5 4 3 2 1 0
+		5 4 3 2 1 0 | 5 4   3 2 1 0 | 5 4 3 2   1 0 | 5 4 3 2 1 0
+		b64c1         b64c2           b64c3           b64c4
+	*/
+	// Get the first base64 character offset from the char chunk
+	auto b64char1 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(chunk[0] >> 2);
+	};
+	// Get the second base64 character offset from the char chunk
+	auto b64char2 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(
+			((chunk[0] & 0x03) << 4)
+			|
+			(chunk.size() > 0 ? ((chunk[1] & 0xF0) >> 4) : 0)
+		);
+	};
+	// Get the third base64 character offset from the char chunk
+	auto b64char3 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(
+			(chunk.size() > 0 ? ((chunk[1] & 0x0F) << 2) : 0)
+			|
+			(chunk.size() > 1 ? ((chunk[2] & 0xC0) >> 6) : 0)
+		);
+	};
+	// Get the fourth base64 character offset from the char chunk
+	auto b64char4 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(chunk.size() > 1 ? (chunk[2] & 0x3F) : 0);
+	};
+	for (int currentChunk = 0; currentChunk < numChunks; ++currentChunk)
+	{
+		std::string_view chunk = data.substr(currentChunk * numBytesPerChunk, numBytesPerChunk);
-		std::string_view chunk = data.substr(currentChunk * numBytesPerChunk, numBytesPerChunk);
+		auto chunk = data.substr(currentChunk * numBytesPerChunk, numBytesPerChunk);
-		std::string_view chunk = data.substr(currentChunk * numBytesPerChunk, numBytesPerChunk);
+		auto chunk = data.substr(currentChunk * numBytesPerChunk, numBytesPerChunk);
+		std::array<char, 4> output{
+			map[b64char1(chunk)],
+			map[b64char2(chunk)],
+			pad,
+			pad
+		};
+		switch (chunk.length()) {
+			case 3:
+				output[3] = map[b64char4(chunk)];
+			case 2:
+				output[2] = map[b64char3(chunk)];
+			default: /* no-op */;
+		};
+		result.append(output.data(), output.size());
+	}
+	return result;
+}
+
+/**
+ * @brief Decodes data in Base64.
+ * @param data
+ * @return std::string containing the original data.
+ */
+auto decode(std::string_view data) -> std::string
+{
+	if (data.empty()) { return ""; }
+	if (data.length() % numBase64CharPerChunk != 0) {
+		throw std::length_error("base64::decode : data length not a multiple of 4");
+	}
+
+	std::string result;
+
+	// number of chunks to process
+	auto numChunks = std::div(data.length(), numBase64CharPerChunk);
+
+	// allocate one time to prevent in-loop reallocations
+	result.reserve(numChunks.quot * numBytesPerChunk);
+	/*
+		char1               char2               char3
+		7 6 5 4 3 2   1 0 | 7 6 5 4   3 2 1 0 | 7 6   5 4 3 2 1 0
+		5 4 3 2 1 0 | 5 4   3 2 1 0 | 5 4 3 2   1 0 | 5 4 3 2 1 0
+		b64c1         b64c2           b64c3           b64c4
+	*/
+	// Get the first character from the base64 chunk
+	auto char1 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(
+			(rmap.at(chunk[0]) << 2) | (rmap.at(chunk[1]) >> 4)
+		);
+	};
+	// Get the second character from the base64 chunk
+	auto char2 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(
+			chunk[2] == pad
+			? 0
+			: ((rmap.at(chunk[1]) & 0x0F) << 4) | (rmap.at(chunk[2]) >> 2)
+		);
+	};
+	// Get the third character from the base64 chunk
+	auto char3 = [](std::string_view chunk) {
+		return static_cast<std::string::value_type>(
+			chunk[3] == pad
+			? 0
+			: ((rmap.at(chunk[2]) & 0x03) << 6) | rmap.at(chunk[3])
+		);
+	};
+	for (int currentChunk = 0; currentChunk < numChunks.quot; ++currentChunk) {
+		std::string_view chunk = data.substr(currentChunk * numBase64CharPerChunk, numBase64CharPerChunk);
-		std::string_view chunk = data.substr(currentChunk * numBase64CharPerChunk, numBase64CharPerChunk);
+		auto chunk = data.substr(currentChunk * numBase64CharPerChunk, numBase64CharPerChunk);
-		std::string_view chunk = data.substr(currentChunk * numBase64CharPerChunk, numBase64CharPerChunk);
+		auto chunk = data.substr(currentChunk * numBase64CharPerChunk, numBase64CharPerChunk);
+		result.push_back(char1(chunk));
+		result.push_back(char2(chunk));
+		result.push_back(char3(chunk));
+	}
+	return result;
+}
+
 } // namespace lmms::base64
diff --git a/tests/CMakeLists.txt b/tests/CMakeLists.txt
@@ -20,6 +20,7 @@ ADD_EXECUTABLE(tests
 	$<TARGET_OBJECTS:lmmsobjs>
 
 	src/core/AutomatableModelTest.cpp
+	src/core/base64Test.cpp
 	src/core/ProjectVersionTest.cpp
 	src/core/RelativePathsTest.cpp
 

diff --git a/tests/src/core/base64Test.cpp b/tests/src/core/base64Test.cpp
@@ -0,0 +1,73 @@
+/*
+ * base64Test.cpp
- * base64Test.cpp
+ * Base64Test.cpp
- * base64Test.cpp
+ * Base64Test.cpp
+ *
+ * Copyright (c) 2022 Kevin Zander <veratil/at/gmail.com>
+ *
+ * This file is part of LMMS - https://lmms.io
+ *
+ * This program is free software; you can redistribute it and/or
+ * modify it under the terms of the GNU General Public
+ * License as published by the Free Software Foundation; either
+ * version 2 of the License, or (at your option) any later version.
+ *
+ * This program is distributed in the hope that it will be useful,
+ * but WITHOUT ANY WARRANTY; without even the implied warranty of
+ * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
+ * General Public License for more details.
+ *
+ * You should have received a copy of the GNU General Public
+ * License along with this program (see COPYING); if not, write to the
+ * Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
+ * Boston, MA 02110-1301 USA.
+ *
+ */
+
+#include "QTestSuite.h"
+
+#include "base64.h"
+
+class Base64Test : QTestSuite
+{
+    Q_OBJECT
+private slots:
+    void create_test_data()
-    void create_test_data()
+    void createTestData()
-    void create_test_data()
+    void createTestData()
+    {
+        QTest::addColumn<QString>("original");
+        QTest::addColumn<QString>("encoded");
+
+        // Test Vectors from RFC 4648 Section 10
+        QTest::newRow("empty string")  << ""       << "";
+        QTest::newRow("1 chunk 2 pad") << "f"      << "Zg==";
+        QTest::newRow("1 chunk 1 pad") << "fo"     << "Zm8=";
+        QTest::newRow("1 chunk 0 pad") << "foo"    << "Zm9v";
+        QTest::newRow("2 chunk 2 pad") << "foob"   << "Zm9vYg==";
+        QTest::newRow("2 chunk 1 pad") << "fooba"  << "Zm9vYmE=";
+        QTest::newRow("2 chunk 0 pad") << "foobar" << "Zm9vYmFy";
+    }
+    void b64_encode_data()
-    void b64_encode_data()
+    void b64EncodeData()
-    void b64_encode_data()
+    void b64EncodeData()
+    {
+        create_test_data();
-        create_test_data();
+        createTestData();
-        create_test_data();
+        createTestData();
+    }
+    void b64_encode()
-    void b64_encode()
+    void b64Encode()
-    void b64_encode()
+    void b64Encode()
+    {
+        using namespace lmms::base64;
+
+        QFETCH(QString, original);
+        QFETCH(QString, encoded);
+        QCOMPARE(QString(encode(original.toStdString()).c_str()), encoded);
+    }
+    void b64_decode_data()
-    void b64_decode_data()
+    void b64DecodeData()
-    void b64_decode_data()
+    void b64DecodeData()
+    {
+        create_test_data();
-        create_test_data();
+        createTestData();
-        create_test_data();
+        createTestData();
+    }
+    void b64_decode()
-    void b64_decode()
+    void b64Decode()
-    void b64_decode()
+    void b64Decode()
+    {
+        using namespace lmms::base64;
+
+        QFETCH(QString, original);
+        QFETCH(QString, encoded);
+        QCOMPARE(original, QString(decode(encoded.toStdString()).c_str()));
+    }
+} Base64Tests;
+
+#include "base64Test.moc"