From 7a329ef07d30f91a35dfb4fb50694bfad6c68721 Mon Sep 17 00:00:00 2001 From: LinZhihao-723 Date: Fri, 28 Jun 2024 16:36:38 -0400 Subject: [PATCH] Add json serialization --- components/core/CMakeLists.txt | 1 + components/core/src/clp/ffi/utils.cpp | 131 +++++++++++++++++++++++ components/core/src/clp/ffi/utils.hpp | 26 +++++ components/core/tests/test-ffi_utils.cpp | 110 +++++++++++++++++++ 4 files changed, 268 insertions(+) create mode 100644 components/core/tests/test-ffi_utils.cpp diff --git a/components/core/CMakeLists.txt b/components/core/CMakeLists.txt index 7cba49acb..2450a279e 100644 --- a/components/core/CMakeLists.txt +++ b/components/core/CMakeLists.txt @@ -460,6 +460,7 @@ set(SOURCE_FILES_unitTest tests/test-EncodedVariableInterpreter.cpp tests/test-encoding_methods.cpp tests/test-ffi_SchemaTree.cpp + tests/test-ffi_utils.cpp tests/test-Grep.cpp tests/test-ir_encoding_methods.cpp tests/test-ir_parsing.cpp diff --git a/components/core/src/clp/ffi/utils.cpp b/components/core/src/clp/ffi/utils.cpp index c85c47701..7b5eb2720 100644 --- a/components/core/src/clp/ffi/utils.cpp +++ b/components/core/src/clp/ffi/utils.cpp @@ -5,16 +5,93 @@ #include #include #include +#include #include #include #include +#include + #include "../utf8_utils.hpp" using std::string; using std::string_view; namespace clp::ffi { +namespace { +/** + * Serializes and appends a msgpack object to the given JSON string. + * NOTE: Event if the serialization failed, `json_str` may be modified. + * @param obj + * @param json_str Outputs the appended JSON string. + * @return true on success. + * @return false if the type of the object is not supported, or the serialization failed. + */ +[[nodiscard]] auto serialize_and_append_msgpack_object_to_json_str( + msgpack::object const& obj, + string& json_str +) -> bool; + +/** + * Wrapper of `validate_and_append_escaped_utf8_string`, with both leading and end double quote + * marks added to match JSON string spec. + * NOTE: Event if the serialization failed, `json_str` may be modified. + * @param src + * @param json_str Outputs the appended JSON string. + * @return Same as `validate_and_append_escaped_utf8_string`. + */ +[[nodiscard]] auto +append_escaped_utf8_string_to_json_str(string_view src, string& json_str) -> bool; + +// NOLINTNEXTLINE(misc-no-recursion) +auto serialize_and_append_msgpack_object_to_json_str( + msgpack::object const& obj, + std::string& json_str +) -> bool { + bool ret_val{true}; + switch (obj.type) { + case msgpack::type::MAP: + ret_val = serialize_and_append_msgpack_map_to_json_str(obj, json_str); + break; + case msgpack::type::ARRAY: + ret_val = serialize_and_append_msgpack_array_to_json_str(obj, json_str); + break; + case msgpack::type::NIL: + json_str += "null"; + break; + case msgpack::type::BOOLEAN: + json_str += obj.as() ? "true" : "false"; + break; + case msgpack::type::STR: + ret_val = append_escaped_utf8_string_to_json_str(obj.as(), json_str); + break; + case msgpack::type::FLOAT32: + case msgpack::type::FLOAT: + json_str += std::to_string(obj.as()); + break; + case msgpack::type::POSITIVE_INTEGER: + json_str += std::to_string(obj.as()); + break; + case msgpack::type::NEGATIVE_INTEGER: + json_str += std::to_string(obj.as()); + break; + default: + ret_val = false; + break; + } + return ret_val; +} + +auto append_escaped_utf8_string_to_json_str(string_view src, string& json_str) -> bool { + json_str.push_back('"'); + if (false == validate_and_append_escaped_utf8_string(src, json_str)) { + return false; + } + json_str.push_back('"'); + return true; +} +} // namespace + auto validate_and_escape_utf8_string(string_view raw) -> std::optional { std::optional ret_val; auto& escaped{ret_val.emplace()}; @@ -86,4 +163,58 @@ auto validate_and_append_escaped_utf8_string(std::string_view src, std::string& return true; } + +// NOLINTNEXTLINE(misc-no-recursion) +auto serialize_and_append_msgpack_array_to_json_str( + msgpack::object const& array, + std::string& json_str +) -> bool { + if (msgpack::type::ARRAY != array.type) { + return false; + } + // NOLINTNEXTLINE(cppcoreguidelines-pro-type-union-access) + auto const array_data{array.via.array}; + bool is_first_element{true}; + json_str.push_back('['); + for (auto const& element : std::span{array_data.ptr, static_cast(array_data.size)}) { + if (is_first_element) { + is_first_element = false; + } else { + json_str.push_back(','); + } + if (false == serialize_and_append_msgpack_object_to_json_str(element, json_str)) { + return false; + } + } + json_str.push_back(']'); + return true; +} + +// NOLINTNEXTLINE(misc-no-recursion) +auto serialize_and_append_msgpack_map_to_json_str(msgpack::object const& map, std::string& json_str) + -> bool { + if (msgpack::type::MAP != map.type) { + return false; + } + // NOLINTNEXTLINE(cppcoreguidelines-pro-type-union-access) + auto const& map_data{map.via.map}; + bool is_first_element{true}; + json_str.push_back('{'); + for (auto const& [key, val] : std::span{map_data.ptr, static_cast(map_data.size)}) { + if (is_first_element) { + is_first_element = false; + } else { + json_str.push_back(','); + } + if (false == append_escaped_utf8_string_to_json_str(key.as(), json_str)) { + return false; + } + json_str.push_back(':'); + if (false == serialize_and_append_msgpack_object_to_json_str(val, json_str)) { + return false; + } + } + json_str.push_back('}'); + return true; +} } // namespace clp::ffi diff --git a/components/core/src/clp/ffi/utils.hpp b/components/core/src/clp/ffi/utils.hpp index 26823da9c..a12e34a0e 100644 --- a/components/core/src/clp/ffi/utils.hpp +++ b/components/core/src/clp/ffi/utils.hpp @@ -5,6 +5,8 @@ #include #include +#include + namespace clp::ffi { /** * Validates whether the given string is UTF-8 encoded, and escapes any characters to make the @@ -26,6 +28,30 @@ namespace clp::ffi { */ [[nodiscard]] auto validate_and_append_escaped_utf8_string(std::string_view src, std::string& dst) -> bool; + +/** + * Serializes and appends a msgpack array to the given JSON string. + * @param array + * @param json_str Outputs the appended JSON string. + * @return Whether the serialized succeeded. NOTE: Event if the serialization failed, `json_str` may + * be modified. + */ +[[nodiscard]] auto serialize_and_append_msgpack_array_to_json_str( + msgpack::object const& array, + std::string& json_str +) -> bool; + +/** + * Serializes and appends a msgpack map to the given JSON string. + * @param map + * @param json_str Outputs the appended JSON string. + * @return Whether the serialized succeeded. NOTE: Event if the serialization failed, `json_str` may + * be modified. + */ +[[nodiscard]] auto serialize_and_append_msgpack_map_to_json_str( + msgpack::object const& map, + std::string& json_str +) -> bool; } // namespace clp::ffi #endif // CLP_FFI_UTILS_HPP diff --git a/components/core/tests/test-ffi_utils.cpp b/components/core/tests/test-ffi_utils.cpp new file mode 100644 index 000000000..8d39adffb --- /dev/null +++ b/components/core/tests/test-ffi_utils.cpp @@ -0,0 +1,110 @@ +#include +#include +#include +#include +#include + +#include +#include +#include + +#include "../src/clp/ffi/utils.hpp" +#include "../src/clp/type_utils.hpp" + +using nlohmann::json; +using std::optional; +using std::string; +using std::string_view; +using std::vector; + +using clp::ffi::serialize_and_append_msgpack_array_to_json_str; +using clp::ffi::serialize_and_append_msgpack_map_to_json_str; + +namespace { +/** + * Serializes the given msgpack byte sequence into a JSON string. + * @param msgpack_bytes + * @return Serialized JSON string on success. + * @return std::nullopt on failure. + */ +[[nodiscard]] auto serialize_msgpack_bytes_to_json_str(vector const& msgpack_bytes +) -> optional; + +auto serialize_msgpack_bytes_to_json_str(vector const& msgpack_bytes +) -> optional { + msgpack::object_handle msgpack_oh; + msgpack::unpack( + msgpack_oh, + clp::size_checked_pointer_cast(msgpack_bytes.data()), + msgpack_bytes.size() + ); + optional ret_val; + auto const& msgpack_obj{msgpack_oh.get()}; + if (msgpack::type::ARRAY == msgpack_obj.type) { + if (false == serialize_and_append_msgpack_array_to_json_str(msgpack_obj, ret_val.emplace())) + { + return std::nullopt; + } + } else if (msgpack::type::MAP == msgpack_obj.type) { + if (false == serialize_and_append_msgpack_map_to_json_str(msgpack_obj, ret_val.emplace())) { + return std::nullopt; + } + } else { + return std::nullopt; + } + return ret_val; +} +} // namespace + +TEST_CASE("test_msgpack_to_json", "[ffi][utils]") { + optional result; + + // Test array with primitive values only + json const array_with_primitive_values_only + = {1, -1, 1.01, -1.01, true, false, "short_string", "This is a long string", nullptr}; + result = serialize_msgpack_bytes_to_json_str(json::to_msgpack(array_with_primitive_values_only) + ); + REQUIRE((result.has_value() && array_with_primitive_values_only == json::parse(result.value())) + ); + + // Test map with primitive values only + json const map_with_primitive_values_only + = {{"int_key", 1}, + {"int_key_negative", -1}, + {"float_key", 0.01}, + {"float_key_negative", -0.01}, + {"bool_key_true", false}, + {"bool_key_false", true}, + {"str_key", "Test string"}, + {"null_key", nullptr}}; + result = serialize_msgpack_bytes_to_json_str(json::to_msgpack(map_with_primitive_values_only)); + REQUIRE((result.has_value() && map_with_primitive_values_only == json::parse(result.value()))); + + // Test array with inner map + json array_with_map = array_with_primitive_values_only; + array_with_map.emplace_back(map_with_primitive_values_only); + result = serialize_msgpack_bytes_to_json_str(json::to_msgpack(array_with_map)); + REQUIRE((result.has_value() && array_with_map == json::parse(result.value()))); + + // Test map with inner array + json map_with_array = map_with_primitive_values_only; + map_with_array.emplace("array_key", array_with_primitive_values_only); + result = serialize_msgpack_bytes_to_json_str(json::to_msgpack(map_with_array)); + REQUIRE((result.has_value() && map_with_array == json::parse(result.value()))); + + // Recursively create inner maps and arrays + // Note: the execution time and memory consumption will grow exponentially as we increase the + // recursive depth. + constexpr size_t cRecursiveDepth{6}; + for (size_t i{0}; i < cRecursiveDepth; ++i) { + array_with_map.emplace_back(map_with_array); + array_with_map.emplace_back(array_with_map); + result = serialize_msgpack_bytes_to_json_str(json::to_msgpack(array_with_map)); + REQUIRE((result.has_value() && array_with_map == json::parse(result.value()))); + + map_with_array.emplace("array_key_" + std::to_string(i), array_with_map); + map_with_array.emplace("map_key_" + std::to_string(i), map_with_array); + result = serialize_msgpack_bytes_to_json_str(json::to_msgpack(map_with_array)); + REQUIRE((result.has_value() && map_with_array == json::parse(result.value()))); + } +}