1
0
mirror of https://github.com/SquidDev-CC/CC-Tweaked synced 2024-11-05 01:26:20 +00:00

Add ability to serialize Unicode strings to JSON (#1489)

This commit is contained in:
JackMacWindows 2023-06-18 17:42:28 -04:00 committed by GitHub
parent 953372b1b7
commit c8523bf479
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
3 changed files with 91 additions and 33 deletions

View File

@ -57,7 +57,7 @@ fabric-loom = "1.1.10"
forgeGradle = "5.1.+" forgeGradle = "5.1.+"
githubRelease = "2.2.12" githubRelease = "2.2.12"
ideaExt = "1.1.6" ideaExt = "1.1.6"
illuaminate = "0.1.0-24-gdb28902" illuaminate = "0.1.0-28-ga7efd71"
librarian = "1.+" librarian = "1.+"
minotaur = "2.+" minotaur = "2.+"
mixinGradle = "0.7.+" mixinGradle = "0.7.+"

View File

@ -424,12 +424,31 @@ do
if map[c] == nil then map[c] = hexify(c) end if map[c] == nil then map[c] = hexify(c) end
end end
serializeJSONString = function(s) serializeJSONString = function(s, options)
return ('"%s"'):format(s:gsub("[\0-\x1f\"\\]", map):gsub("[\x7f-\xff]", hexify)) if options and options.unicode_strings and s:find("[\x80-\xff]") then
local retval = '"'
for _, code in utf8.codes(s) do
if code > 0xFFFF then
-- Encode the codepoint as a UTF-16 surrogate pair
code = code - 0x10000
local high, low = bit32.extract(code, 10, 10) + 0xD800, bit32.extract(code, 0, 10) + 0xDC00
retval = retval .. ("\\u%04X\\u%04X"):format(high, low)
elseif code <= 0x5C and map[string.char(code)] then -- 0x5C = `\`, don't run `string.char` if we don't need to
retval = retval .. map[string.char(code)]
elseif code < 0x20 or code >= 0x7F then
retval = retval .. ("\\u%04X"):format(code)
else
retval = retval .. string.char(code)
end
end
return retval .. '"'
else
return ('"%s"'):format(s:gsub("[\0-\x1f\"\\]", map):gsub("[\x7f-\xff]", hexify))
end
end end
end end
local function serializeJSONImpl(t, tTracking, bNBTStyle) local function serializeJSONImpl(t, tTracking, options)
local sType = type(t) local sType = type(t)
if t == empty_json_array then return "[]" if t == empty_json_array then return "[]"
elseif t == json_null then return "null" elseif t == json_null then return "null"
@ -450,13 +469,14 @@ local function serializeJSONImpl(t, tTracking, bNBTStyle)
local nObjectSize = 0 local nObjectSize = 0
local nArraySize = 0 local nArraySize = 0
local largestArrayIndex = 0 local largestArrayIndex = 0
local bNBTStyle = options and options.nbt_style
for k, v in pairs(t) do for k, v in pairs(t) do
if type(k) == "string" then if type(k) == "string" then
local sEntry local sEntry
if bNBTStyle then if bNBTStyle then
sEntry = tostring(k) .. ":" .. serializeJSONImpl(v, tTracking, bNBTStyle) sEntry = tostring(k) .. ":" .. serializeJSONImpl(v, tTracking, options)
else else
sEntry = serializeJSONString(k) .. ":" .. serializeJSONImpl(v, tTracking, bNBTStyle) sEntry = serializeJSONString(k, options) .. ":" .. serializeJSONImpl(v, tTracking, options)
end end
if nObjectSize == 0 then if nObjectSize == 0 then
sObjectResult = sObjectResult .. sEntry sObjectResult = sObjectResult .. sEntry
@ -473,7 +493,7 @@ local function serializeJSONImpl(t, tTracking, bNBTStyle)
if t[k] == nil then --if the array is nil at index k the value is "null" as to keep the unused indexes in between used ones. if t[k] == nil then --if the array is nil at index k the value is "null" as to keep the unused indexes in between used ones.
sEntry = "null" sEntry = "null"
else -- if the array index does not point to a nil we serialise it's content. else -- if the array index does not point to a nil we serialise it's content.
sEntry = serializeJSONImpl(t[k], tTracking, bNBTStyle) sEntry = serializeJSONImpl(t[k], tTracking, options)
end end
if nArraySize == 0 then if nArraySize == 0 then
sArrayResult = sArrayResult .. sEntry sArrayResult = sArrayResult .. sEntry
@ -492,7 +512,7 @@ local function serializeJSONImpl(t, tTracking, bNBTStyle)
end end
elseif sType == "string" then elseif sType == "string" then
return serializeJSONString(t) return serializeJSONString(t, options)
elseif sType == "number" or sType == "boolean" then elseif sType == "number" or sType == "boolean" then
return tostring(t) return tostring(t)
@ -813,32 +833,57 @@ end
unserialise = unserialize -- GB version unserialise = unserialize -- GB version
--- Returns a JSON representation of the given data. --[[- Returns a JSON representation of the given data.
--
-- This function attempts to guess whether a table is a JSON array or This function attempts to guess whether a table is a JSON array or
-- object. However, empty tables are assumed to be empty objects - use object. However, empty tables are assumed to be empty objects - use
-- @{textutils.empty_json_array} to mark an empty array. @{textutils.empty_json_array} to mark an empty array.
--
-- This is largely intended for interacting with various functions from the This is largely intended for interacting with various functions from the
-- @{commands} API, though may also be used in making @{http} requests. @{commands} API, though may also be used in making @{http} requests.
--
-- @param t The value to serialise. Like @{textutils.serialise}, this should not @param[1] t The value to serialise. Like @{textutils.serialise}, this should not
-- contain recursive tables or functions. contain recursive tables or functions.
-- @tparam[opt] boolean bNBTStyle Whether to produce NBT-style JSON (non-quoted keys) @tparam[1,opt] { nbt_style? = boolean, unicode_strings? = boolean } options Options for serialisation.
-- instead of standard JSON. - `nbt_style`: Whether to produce NBT-style JSON (non-quoted keys) instead of standard JSON.
-- @treturn string The JSON representation of the input. - `unicode_strings`: Whether to treat strings as containing UTF-8 characters instead of
-- @throws If the object contains a value which cannot be using the default 8-bit character set.
-- serialised. This includes functions and tables which appear multiple
-- times. @param[2] t The value to serialise. Like @{textutils.serialise}, this should not
-- @usage textutils.serialiseJSON({ values = { 1, "2", true } }) contain recursive tables or functions.
-- @since 1.7 @tparam[2] boolean bNBTStyle Whether to produce NBT-style JSON (non-quoted keys)
-- @see textutils.json_null Use to serialise a JSON `null` value. instead of standard JSON.
-- @see textutils.empty_json_array Use to serialise a JSON empty array.
function serializeJSON(t, bNBTStyle) @treturn string The JSON representation of the input.
@throws If the object contains a value which cannot be serialised. This includes
functions and tables which appear multiple times.
@usage Serialise a simple object
textutils.serialiseJSON({ values = { 1, "2", true } })
@usage Serialise an object to a NBT-style string
textutils.serialiseJSON({ values = { 1, "2", true } }, { nbt_style = true })
@since 1.7
@changed 1.106.0 Added `options` overload and `unicode_strings` option.
@see textutils.json_null Use to serialise a JSON `null` value.
@see textutils.empty_json_array Use to serialise a JSON empty array.
]]
function serializeJSON(t, options)
expect(1, t, "table", "string", "number", "boolean") expect(1, t, "table", "string", "number", "boolean")
expect(2, bNBTStyle, "boolean", "nil") expect(2, options, "table", "boolean", "nil")
if type(options) == "boolean" then
options = { nbt_style = options }
elseif type(options) == "table" then
field(options, "nbt_style", "boolean", "nil")
field(options, "unicode_strings", "boolean", "nil")
end
local tTracking = {} local tTracking = {}
return serializeJSONImpl(t, tTracking, bNBTStyle or false) return serializeJSONImpl(t, tTracking, options)
end end
serialiseJSON = serializeJSON -- GB version serialiseJSON = serializeJSON -- GB version

View File

@ -143,8 +143,10 @@ describe("The textutils library", function()
textutils.serialiseJSON({}) textutils.serialiseJSON({})
textutils.serialiseJSON(false) textutils.serialiseJSON(false)
textutils.serialiseJSON("", true) textutils.serialiseJSON("", true)
textutils.serializeJSON("", {})
textutils.serializeJSON(0, { nbt_style = true, unicode_strings = true })
expect.error(textutils.serialiseJSON, nil):eq("bad argument #1 (table, string, number or boolean expected, got nil)") expect.error(textutils.serialiseJSON, nil):eq("bad argument #1 (table, string, number or boolean expected, got nil)")
expect.error(textutils.serialiseJSON, "", 1):eq("bad argument #2 (boolean expected, got number)") expect.error(textutils.serialiseJSON, "", 1):eq("bad argument #2 (table or boolean expected, got number)")
end) end)
it("serializes empty arrays", function() it("serializes empty arrays", function()
@ -174,6 +176,17 @@ describe("The textutils library", function()
expect(textutils.serializeJSON({ 5, "test", nil, nil, textutils.json_null })):eq('[5,"test",null,null,null]') expect(textutils.serializeJSON({ 5, "test", nil, nil, textutils.json_null })):eq('[5,"test",null,null,null]')
expect(textutils.serializeJSON({ nil, nil, nil, nil, "text" })):eq('[null,null,null,null,"text"]') expect(textutils.serializeJSON({ nil, nil, nil, nil, "text" })):eq('[null,null,null,null,"text"]')
end) end)
it("serializes NBT style", function()
expect(textutils.serializeJSON({ test = 2 }, { nbt_style = true })):eq('{test:2}')
expect(textutils.serializeJSON({ test = 2 }, true)):eq('{test:2}') -- old style
end)
it("serializes Unicode strings", function()
expect(textutils.serializeJSON("\u{3053}\u{3093}\u{306B}\u{3061}\u{306F}", { unicode_strings = true })):eq([["\u3053\u3093\u306B\u3061\u306F"]])
expect(textutils.serializeJSON("\u{1f62f}", { unicode_strings = true })):eq([["\uD83D\uDE2F"]])
expect(textutils.serializeJSON("\\\"\u{00ff}\n\"", { unicode_strings = true })):eq('"\\\\\\"\\u00FF\\n\\""')
end)
end) end)
describe("textutils.unserializeJSON", function() describe("textutils.unserializeJSON", function()