This repository has been archived on 2024-09-19. You can view files and clone it, but cannot push or open issues or pull requests.
dkjson/jsontest.lua
2013-10-13 21:11:53 +02:00

513 lines
15 KiB
Lua

local encode, decode, dkencode, dkdecode
local test_module, opt = ... -- command line argument
--local test_module = 'cmj-json'
--local test_module = 'dkjson'
--local test_module = 'dkjson-nopeg'
--local test_module = 'fleece'
--local test_module = 'jf-json'
--locel test_module = 'lua-yajl'
--local test_module = 'mp-cjson'
--local test_module = 'nm-json'
--local test_module = 'sb-json'
--local test_module = 'th-json'
--local opt = "esc" -- Test which characters in the BMP get escaped and whether this is correct
--local opt = "esc_full" -- Full range from 0 to 0x10ffff
--local opt = "esc_asc" -- Just 0 to 127
--local opt = "refcycle" -- What happens when a reference cycle gets encoded?
local testlocale = "de_DE.UTF8"
local function inlocale(fn)
local oldloc = os.setlocale(nil, 'numeric')
if not os.setlocale(testlocale, 'numeric') then
print("test could not switch to locale "..testlocale)
else
fn()
end
os.setlocale(oldloc, 'numeric')
end
if test_module == 'dkjson-nopeg' then
test_module = 'dkjson'
package.preload["lpeg"] = function () error "lpeg disabled" end
package.loaded["lpeg"] = nil
lpeg = nil
end
if test_module == 'dkjson-lulpeg' then
test_module = 'dkjson'
package.loaded["lpeg"] = require "lulpeg"
end
do
-- http://chiselapp.com/user/dhkolf/repository/dkjson/
local dkjson = require "dkjson"
dkencode = dkjson.encode
dkdecode = dkjson.decode
end
if test_module == 'cmj-json' then
-- https://github.com/craigmj/json4lua/
-- http://json.luaforge.net/
local json = require "cmjjson" -- renamed, the original file was just 'json'
encode = json.encode
decode = json.decode
elseif test_module == 'dkjson' then
-- http://chiselapp.com/user/dhkolf/repository/dkjson/
encode = dkencode
decode = dkdecode
elseif test_module == 'fleece' then
-- http://www.eonblast.com/fleece/
local fleece = require "fleece"
encode = function(x) return fleece.json(x, "E4") end
elseif test_module == 'jf-json' then
-- http://regex.info/blog/lua/json
local json = require "jfjson" -- renamed, the original file was just 'JSON'
encode = function(x) return json:encode(x) end
decode = function(x) return json:decode(x) end
elseif test_module == 'lua-yajl' then
-- http://github.com/brimworks/lua-yajl
local yajl = require ("yajl")
encode = yajl.to_string
decode = yajl.to_value
elseif test_module == 'mp-cjson' then
-- http://www.kyne.com.au/~mark/software/lua-cjson.php
local json = require "cjson"
encode = json.encode
decode = json.decode
elseif test_module == 'nm-json' then
-- http://luaforge.net/projects/luajsonlib/
local json = require "LuaJSON"
encode = json.encode or json.stringify
decode = json.decode or json.parse
elseif test_module == 'sb-json' then
-- http://www.chipmunkav.com/downloads/Json.lua
local json = require "sbjson" -- renamed, the original file was just 'Json'
encode = json.Encode
decode = json.Decode
elseif test_module == 'th-json' then
-- https://github.com/harningt/luajson
-- http://luaforge.net/projects/luajson/
local json = require "json"
encode = json.encode
decode = json.decode
else
print "No module specified"
return
end
if not encode then
print ("No encode method")
else
local x, r
local escapecodes = {
["\""] = "\\\"", ["\\"] = "\\\\", ["\b"] = "\\b", ["\f"] = "\\f",
["\n"] = "\\n", ["\r"] = "\\r", ["\t"] = "\\t", ["/"] = "\\/"
}
local function test (x, n, expect)
local enc = encode{ x }:match("^%s*%[%s*%\"(.-)%\"%s*%]%s*$")
if not enc or (escapecodes[x] ~= enc
and ("\\u%04x"):format(n) ~= enc:gsub("[A-F]", string.lower)
and not (expect and enc:match("^"..expect.."$"))) then
print(("U+%04X isn't encoded correctly: %q"):format(n, enc))
end
end
-- necessary escapes for JSON:
for i = 0,31 do
test(string.char(i), i)
end
test("\"", ("\""):byte())
test("\\", ("\\"):byte())
-- necessary escapes for JavaScript:
test("\226\128\168", 0x2028)
test("\226\128\169", 0x2029)
-- invalid escapes that were seen in the wild:
test("'", ("'"):byte(), "%'")
r,x = pcall (encode, { [1000] = "x" })
if not r then
print ("encoding a sparse array (#=0) raises an error:", x)
else
if #x > 30 then
print ("sparse array (#=0) encoded as:", x:sub(1,15).." <...> "..x:sub(-15,-1), "#"..#x)
else
print ("sparse array (#=0) encoded as:", x)
end
end
r,x = pcall (encode, { [1] = "a", [1000] = "x" })
if not r then
print ("encoding a sparse array (#=1) raises an error:", x)
else
if #x > 30 then
print ("sparse array (#=1) encoded as:", x:sub(1,15).." <...> "..x:sub(-15,-1), "#str="..#x)
else
print ("sparse array (#=1) encoded as:", x)
end
end
r,x = pcall (encode, { [1] = "a", [5] = "c", ["x"] = "x" })
if not r then
print ("encoding a mixed table raises an error:", x)
else
print ("mixed table encoded as:", x)
end
r, x = pcall(encode, { math.huge*0 }) -- NaN
if not r then
print ("encoding NaN raises an error:", x)
else
r = dkdecode(x)
if not r then
print ("NaN isn't converted into valid JSON:", x)
elseif type(r[1]) == "number" and r[1] == r[1] then -- a number, but not NaN
print ("NaN is converted into a valid number:", x)
else
print ("NaN is converted to:", x)
end
end
if test_module == 'fleece' then
print ("Fleece (0.3.1) is known to freeze on +/-Inf")
else
r, x = pcall(encode, { math.huge }) -- +Inf
if not r then
print ("encoding +Inf raises an error:", x)
else
r = dkdecode(x)
if not r then
print ("+Inf isn't converted into valid JSON:", x)
else
print ("+Inf is converted to:", x)
end
end
r, x = pcall(encode, { -math.huge }) -- -Inf
if not r then
print ("encoding -Inf raises an error:", x)
else
r = dkdecode(x)
if not r then
print ("-Inf isn't converted into valid JSON:", x)
else
print ("-Inf is converted to:", x)
end
end
end
inlocale(function ()
local r, x = pcall(encode, { 0.5 })
if not r then
print("encoding 0.5 in locale raises an error:", x)
elseif not x:find(".", 1, true) then
print("In locale 0.5 isn't converted into valid JSON:", x)
end
end)
end
if not decode then
print ("No decode method")
else
local x, r
x = decode[=[ ["\u0000"] ]=]
if x[1] ~= "\000" then
print ("\\u0000 isn't decoded correctly")
end
x = decode[=[ ["\u20AC"] ]=]
if x[1] ~= "\226\130\172" then
print ("\\u20AC isn't decoded correctly")
end
x = decode[=[ ["\uD834\uDD1E"] ]=]
if x[1] ~= "\240\157\132\158" then
print ("\\uD834\\uDD1E isn't decoded correctly")
end
r, x = pcall(decode, [=[
{"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x":
{"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x":
{"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x":
{"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x": {"x":{"x":{"x":{"x":{"x":
"deep down"
} } } } } } } } } } } } } } }
} } } } } } } } } } } } } } }
} } } } } } } } } } } } } } }
} } } } } } } } } } } } } } }
]=])
if not r then
print ("decoding a deep nested table raises an error:", x)
else
local i = 0
while type(x) == 'table' do
i = i + 1
x = x.x
end
if i ~= 60 or x ~= "deep down" then
print ("deep nested table isn't decoded correctly")
end
end
if false and test_module == 'cmj-json' then
-- unfortunatly the version can't be read
print ("decoding a big array takes ages (or forever?) on cmj-json prior to version 0.9.5")
else
r, x = pcall(decode, "["..("0,"):rep(100000).."0]")
if not r then
print ("decoding a big array raises an error:", x)
else
if type(x) ~= 'table' or #x ~= 100001 then
print ("big array isn't decoded correctly")
end
end
end
r, x = pcall(decode, "{}")
if not r then
print ("decoding an empty object raises an error:", x)
end
r, x = pcall(decode, "[]")
if not r then
print ("decoding an empty array raises an error:", x)
end
r, x = pcall(decode, "[1e+2]")
if not r then
print ("decoding a number with exponential notation raises an error:", x)
elseif x[1] ~= 1e+2 then
print ("1e+2 decoded incorrectly:", r[1])
end
inlocale(function ()
local r, x = pcall(decode, "[0.5]")
if not r then
print("decoding 0.5 in locale raises an error:", x)
elseif not x then
print("cannot decode 0.5 in locale")
elseif x[1] ~= 0.5 then
print("decoded 0.5 incorrectly in locale:", x[1])
end
end)
-- special tests for dkjson:
if test_module == 'dkjson' then
x = dkdecode[=[ [{"x":0}] ]=]
local m = getmetatable(x)
if not m or m.__jsontype ~= 'array' then
print ("<metatable>.__jsontype ~= array")
end
local m = getmetatable(x[1])
if not m or m.__jsontype ~= 'object' then
print ("<metatable>.__jsontype ~= object")
end
local x,p,m = dkdecode" invalid "
if p ~= 2 or type(m) ~= 'string' or not m:find("at line 1, column 2$") then
print (("Invalid location: position=%d, message=%q"):format(p,m))
end
local x,p,m = dkdecode" \n invalid "
if p ~= 4 or type(m) ~= 'string' or not m:find("at line 2, column 2$") then
print (("Invalid location: position=%d, message=%q"):format(p,m))
end
end
end
if encode and opt == "refcycle" then
local a = {}
a.a = a
print ("Trying a reference cycle...")
encode(a)
end
if encode and (opt or ""):sub(1,3) == "esc" then
local strchar, strbyte, strformat = string.char, string.byte, string.format
local floor = math.floor
local function unichar (value)
if value < 0 then
return nil
elseif value <= 0x007f then
return strchar (value)
elseif value <= 0x07ff then
return strchar (0xc0 + floor(value/0x40),
0x80 + (floor(value) % 0x40))
elseif value <= 0xffff then
return strchar (0xe0 + floor(value/0x1000),
0x80 + (floor(value/0x40) % 0x40),
0x80 + (floor(value) % 0x40))
elseif value <= 0x10ffff then
return strchar (0xf0 + floor(value/0x40000),
0x80 + (floor(value/0x1000) % 0x40),
0x80 + (floor(value/0x40) % 0x40),
0x80 + (floor(value) % 0x40))
else
return nil
end
end
local escapecodes = {
["\""] = "\\\"", ["\\"] = "\\\\", ["\b"] = "\\b", ["\f"] = "\\f",
["\n"] = "\\n", ["\r"] = "\\r", ["\t"] = "\\t", ["/"] = "\\/"
}
local function escapeutf8 (uchar)
local a, b, c, d = strbyte (uchar, 1, 4)
a, b, c, d = a or 0, b or 0, c or 0, d or 0
if a <= 0x7f then
value = a
elseif 0xc0 <= a and a <= 0xdf and b >= 0x80 then
value = (a - 0xc0) * 0x40 + b - 0x80
elseif 0xe0 <= a and a <= 0xef and b >= 0x80 and c >= 0x80 then
value = ((a - 0xe0) * 0x40 + b - 0x80) * 0x40 + c - 0x80
elseif 0xf0 <= a and a <= 0xf7 and b >= 0x80 and c >= 0x80 and d >= 0x80 then
value = (((a - 0xf0) * 0x40 + b - 0x80) * 0x40 + c - 0x80) * 0x40 + d - 0x80
else
return ""
end
if value <= 0xffff then
return strformat ("\\u%.4x", value)
elseif value <= 0x10ffff then
-- encode as UTF-16 surrogate pair
value = value - 0x10000
local highsur, lowsur = 0xD800 + floor (value/0x400), 0xDC00 + (value % 0x400)
return strformat ("\\u%.4x\\u%.4x", highsur, lowsur)
else
return ""
end
end
local isspecial = {}
local unifile = io.open("UnicodeData.txt")
if unifile then
-- <http://www.unicode.org/Public/UNIDATA/UnicodeData.txt>
-- each line consists of 15 parts for each defined codepoints
local pat = {}
for i = 1,14 do
pat[i] = "[^;]*;"
end
pat[1] = "([^;]*);" -- Codepoint
pat[3] = "([^;]*);" -- Category
pat[15] = "[^;]*"
pat = table.concat(pat)
for line in unifile:lines() do
local cp, cat = line:match(pat)
if cat:match("^C[^so]") or cat:match("^Z[lp]") then
isspecial[tonumber(cp, 16)] = cat
end
end
unifile:close()
end
local x,xe
local t = {}
local esc = {}
local escerr = {}
local range
if opt == "esc_full" then range = 0x10ffff
elseif opt == "esc_asc" then range = 0x7f
else range = 0xffff end
for i = 0,range do
t[1] = unichar(i)
xe = encode(t)
x = string.match(xe, "^%s*%[%s*%\"(.*)%\"%s*%]%s*$")
if type(x) ~= 'string' then
escerr[i] = xe
elseif string.lower(x) == escapeutf8(t[1]) then
esc[i] = 'u'
elseif x == escapecodes[t[1]] then
esc[i] = 'c'
elseif x:sub(1,1) == "\\" then
escerr[i] = xe
end
end
do
local i = 0
while i <= range do
local first
while i <= range and not (esc[i] or isspecial[i]) do i = i + 1 end
if i > range then break end
first = i
local special = isspecial[i]
if esc[i] and special then
while esc[i] and isspecial[i] == special do i = i + 1 end
if i-1 > first then
print (("Escaped %s characters from U+%04X to U+%04X"):format(special,first,i-1))
else
print (("Escaped %s character U+%04X"):format(special,first))
end
elseif esc[i] then
while esc[i] and not isspecial[i] do i = i + 1 end
if i-1 > first then
print (("Escaped from U+%04X to U+%04X"):format(first,i-1))
else
if first >= 32 and first <= 127 then
print (("Escaped U+%04X (%c)"):format(first,first))
else
print (("Escaped U+%04X"):format(first))
end
end
elseif special then
while not esc[i] and isspecial[i] == special do i = i + 1 end
if i-1 > first then
print (("Unescaped %s characters from U+%04X to U+%04X"):format(special,first,i-1))
else
print (("Unescaped %s character U+%04X"):format(special,first))
end
end
end
end
do
local i = 0
while i <= range do
local first
while i <= range and not escerr[i] do i = i + 1 end
if not escerr[i] then break end
first = i
while escerr[i] do i = i + 1 end
if i-1 > first then
print (("Errors while escaping from U+%04X to U+%04X"):format(first, i-1))
else
print (("Errors while escaping U+%04X"):format(first))
end
end
end
end
-- Copyright (C) 2011 David Heiko Kolf
--
-- Permission is hereby granted, free of charge, to any person obtaining
-- a copy of this software and associated documentation files (the
-- "Software"), to deal in the Software without restriction, including
-- without limitation the rights to use, copy, modify, merge, publish,
-- distribute, sublicense, and/or sell copies of the Software, and to
-- permit persons to whom the Software is furnished to do so, subject to
-- the following conditions:
--
-- The above copyright notice and this permission notice shall be
-- included in all copies or substantial portions of the Software.
--
-- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
-- EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
-- MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
-- NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
-- BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
-- ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
-- CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
-- SOFTWARE.