json.lua 9.8 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401
  1. --
  2. -- json.lua
  3. --
  4. -- Copyright (c) 2019 rxi
  5. --
  6. -- Permission is hereby granted, free of charge, to any person obtaining a copy of
  7. -- this software and associated documentation files (the "Software"), to deal in
  8. -- the Software without restriction, including without limitation the rights to
  9. -- use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
  10. -- of the Software, and to permit persons to whom the Software is furnished to do
  11. -- so, subject to the following conditions:
  12. --
  13. -- The above copyright notice and this permission notice shall be included in all
  14. -- copies or substantial portions of the Software.
  15. --
  16. -- THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  17. -- IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  18. -- FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  19. -- AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  20. -- LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  21. -- OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  22. -- SOFTWARE.
  23. --
  -- Module table; the public encode/decode functions are attached to it below.
  -- NOTE(review): this is assigned without `local`, so loading the file also
  -- creates a global named `json` -- confirm that this is intentional.
  json = {}
  json._version = "0.1.2"
  25. -------------------------------------------------------------------------------
  26. -- Encode
  27. -------------------------------------------------------------------------------
  -- Forward declaration; the generic encoder is assigned further down so the
  -- table encoder can call it recursively.
  local encode

  -- Raw character -> JSON escape sequence, for the characters that have a
  -- short (two-character) escape.
  local escape_char_map = {}
  escape_char_map["\\"] = "\\\\"
  escape_char_map["\""] = "\\\""
  escape_char_map["\b"] = "\\b"
  escape_char_map["\f"] = "\\f"
  escape_char_map["\n"] = "\\n"
  escape_char_map["\r"] = "\\r"
  escape_char_map["\t"] = "\\t"

  -- Escape sequence -> raw character. "\/" is accepted when decoding even
  -- though "/" is never escaped when encoding.
  local escape_char_map_inv = {}
  for raw, escaped in pairs(escape_char_map) do
    escape_char_map_inv[escaped] = raw
  end
  escape_char_map_inv["\\/"] = "/"
  -- Return the JSON escape for the single character `c`: the short escape
  -- from escape_char_map when one exists, otherwise a \uXXXX sequence built
  -- from the character's byte value.
  local function escape_char(c)
    local short = escape_char_map[c]
    if short then
      return short
    end
    return string.format("\\u%04x", string.byte(c))
  end
  -- Encoder for Lua nil: always produces the JSON literal null.
  -- The argument is accepted only so the function fits the encoder signature.
  local function encode_nil(val)
    local literal = "null"
    return literal
  end
  -- Encode a Lua table as a JSON array or a JSON object.
  --
  -- A table is treated as an array when it has a value at key 1 or is empty;
  -- otherwise it is treated as an object.
  --   val   : the table to encode
  --   stack : set of tables currently being encoded (used to detect cycles);
  --           created on the outermost call
  -- Returns the JSON text for the table.
  -- Raises "circular reference" when `val` contains itself, and
  -- "invalid table: ..." when an array has non-sequence keys or an object has
  -- non-string keys.
  local function encode_table(val, stack)
    local res = {}
    stack = stack or {}

    -- Circular reference?
    if stack[val] then error("circular reference") end
    stack[val] = true

    local out
    if rawget(val, 1) ~= nil or next(val) == nil then
      -- Treat as array. The keys must be exactly 1..n. This is checked
      -- directly instead of comparing against #val, because the length
      -- operator is unspecified for tables with holes and could let a sparse
      -- table through (silently dropping elements).
      local n, max = 0, 0
      for k in pairs(val) do
        if type(k) ~= "number" or k < 1 or k % 1 ~= 0 then
          error("invalid table: mixed or invalid key types")
        end
        n = n + 1
        if k > max then max = k end
      end
      -- n distinct positive integer keys whose maximum is n are exactly 1..n
      if max ~= n then
        error("invalid table: sparse array")
      end
      -- Encode
      for i = 1, n do
        res[i] = encode(val[i], stack)
      end
      out = "[" .. table.concat(res, ",") .. "]"
    else
      -- Treat as an object
      for k, v in pairs(val) do
        if type(k) ~= "string" then
          error("invalid table: mixed or invalid key types")
        end
        res[#res + 1] = encode(k, stack) .. ":" .. encode(v, stack)
      end
      out = "{" .. table.concat(res, ",") .. "}"
    end

    -- Done with this table; the same table may legitimately appear again
    -- elsewhere as long as it is not nested inside itself.
    stack[val] = nil
    return out
  end
  -- Encode a Lua string as a JSON string literal.
  --
  -- Control characters, the double quote and the backslash are replaced via
  -- escape_char; everything else is copied through unchanged.
  -- The character class %c is used rather than the deprecated %z class so
  -- that the NUL byte is still escaped (and a literal "z" is not) on Lua
  -- versions where %z is no longer recognised. Note that %c also covers
  -- DEL (127), which is therefore emitted as a \u escape.
  local function encode_string(val)
    -- gsub returns (string, count); keep only the string
    local escaped = val:gsub('[%c"\\]', escape_char)
    return '"' .. escaped .. '"'
  end
  -- Encode a Lua number as JSON number text.
  --
  -- Raises "unexpected number value '...'" for NaN and +/- infinity, which
  -- JSON cannot represent.
  -- The short "%.14g" form is used whenever it converts back to exactly the
  -- same value. When it would lose precision (e.g. 2^53 or 0.1 + 0.2) a
  -- longer exact form is emitted instead, so encoding does not silently
  -- change the number.
  local function encode_number(val)
    -- Check for NaN, -inf and inf
    if val ~= val or val <= -math.huge or val >= math.huge then
      error("unexpected number value '" .. tostring(val) .. "'")
    end
    local text = string.format("%.14g", val)
    if tonumber(text) ~= val then
      if math.type and math.type(val) == "integer" then
        -- integer subtype (Lua 5.3+): print every digit
        text = string.format("%d", val)
      else
        -- 17 significant digits are enough to round-trip any double
        text = string.format("%.17g", val)
      end
    end
    return text
  end
  -- Dispatch table: Lua type name -> function that encodes a value of that
  -- type. Types without an entry cannot be encoded.
  local type_func_map = {
    boolean   = tostring,
    number    = encode_number,
    string    = encode_string,
    table     = encode_table,
    [ "nil" ] = encode_nil,
  }
  -- Generic encoder: picks the encoder for the value's Lua type and delegates
  -- to it, passing along the cycle-detection stack.
  -- Raises "unexpected type '<type>'" when the type has no encoder.
  encode = function(val, stack)
    local kind = type(val)
    local encoder = type_func_map[kind]
    if not encoder then
      error("unexpected type '" .. kind .. "'")
    end
    return encoder(val, stack)
  end
  -- Public entry point: encode a Lua value as JSON text.
  -- Returns exactly one value, the JSON string; errors raised by the
  -- encoders propagate to the caller.
  function json.encode(val)
    local text = encode(val)
    return text
  end
  112. -------------------------------------------------------------------------------
  113. -- Decode
  114. -------------------------------------------------------------------------------
  -- Forward declaration; the generic parser is assigned further down so the
  -- array and object parsers can call it recursively.
  local parse

  -- Build a set (value -> true) from the arguments.
  local function create_set(...)
    local set = {}
    local count = select("#", ...)
    local i = 1
    while i <= count do
      local item = (select(i, ...))
      set[item] = true
      i = i + 1
    end
    return set
  end
  -- Characters skipped as insignificant whitespace between tokens.
  local space_chars = create_set(" ", "\t", "\r", "\n")

  -- Characters that end a number or literal token.
  local delim_chars = create_set(" ", "\t", "\r", "\n", "]", "}", ",")

  -- Characters allowed directly after a backslash inside a string.
  local escape_chars = create_set("\\", "/", '"', "b", "f", "n", "r", "t", "u")

  -- The bare-word literals recognised by the parser.
  local literals = create_set("true", "false", "null")

  -- Literal word -> Lua value. "null" has no entry: looking it up yields nil,
  -- which is the value it decodes to.
  local literal_map = {
    [ "true"  ] = true,
    [ "false" ] = false,
  }
  -- Find the next position at or after `idx` whose character is in `set`
  -- (or, when `negate` is true, whose character is NOT in `set`).
  -- Returns that index, or #str + 1 when no such character exists.
  local function next_char(str, idx, set, negate)
    local len = #str
    local pos = idx
    while pos <= len do
      local ch = str:sub(pos, pos)
      -- set[ch] is true or nil and negate is true or nil, so "~=" selects
      -- members when negate is nil and non-members when negate is true
      if set[ch] ~= negate then
        return pos
      end
      pos = pos + 1
    end
    return len + 1
  end
  -- Raise a decode error for position `idx` of `str`.
  -- The message has the form "<msg> at line <L> col <C>", where line and
  -- column are 1-based and computed by walking the text before `idx`.
  -- This function never returns.
  local function decode_error(str, idx, msg)
    local line, col = 1, 1
    local pos = 1
    while pos < idx do
      if str:sub(pos, pos) == "\n" then
        -- a newline starts the next line at column 1
        line = line + 1
        col = 1
      else
        col = col + 1
      end
      pos = pos + 1
    end
    error( string.format("%s at line %d col %d", msg, line, col) )
  end
  -- Convert the code point `n` to its UTF-8 byte sequence (1 to 4 bytes).
  -- Raises "invalid unicode codepoint '<hex>'" when n is above 0x10ffff.
  -- http://scripts.sil.org/cms/scripts/page.php?site_id=nrsi&id=iws-appendixa
  local function codepoint_to_utf8(n)
    local floor = math.floor
    local char = string.char

    -- one byte: 0xxxxxxx
    if n <= 0x7f then
      return char(n)
    end

    -- two bytes: 110xxxxx 10xxxxxx
    if n <= 0x7ff then
      local lead = floor(n / 64) + 192
      return char(lead, n % 64 + 128)
    end

    -- three bytes: 1110xxxx 10xxxxxx 10xxxxxx
    if n <= 0xffff then
      local lead = floor(n / 4096) + 224
      local mid = floor(n % 4096 / 64) + 128
      return char(lead, mid, n % 64 + 128)
    end

    -- four bytes: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
    if n <= 0x10ffff then
      local lead = floor(n / 262144) + 240
      local second = floor(n % 262144 / 4096) + 128
      local third = floor(n % 4096 / 64) + 128
      return char(lead, second, third, n % 64 + 128)
    end

    error( string.format("invalid unicode codepoint '%x'", n) )
  end
  -- Decode a unicode escape to UTF-8.
  -- `s` is either a single escape ("\uXXXX") or two consecutive escapes
  -- ("\uXXXX\uXXXX"); in the second case the two values are combined as a
  -- surrogate pair into one code point.
  local function parse_unicode_escape(s)
    local first = tonumber( s:sub(3, 6), 16 )
    local second = tonumber( s:sub(9, 12), 16 )
    if not second then
      -- only one escape present
      return codepoint_to_utf8(first)
    end
    local combined = (first - 0xd800) * 0x400 + (second - 0xdc00) + 0x10000
    return codepoint_to_utf8(combined)
  end
  -- Parse the JSON string literal whose opening quote is at index `i`.
  --
  -- Returns the decoded string and the index just past the closing quote.
  -- Reports through decode_error:
  --   * "control character in string" for a raw byte below 32
  --   * "invalid unicode escape in string" when "\u" is not followed by four
  --     hex digits
  --   * "invalid escape char '<c>' in string" for an unknown escape
  --   * "expected closing quote for string" when the input ends first
  --
  -- The string is decoded in a single left-to-right pass so that every
  -- backslash is interpreted exactly once. (Decoding with separate
  -- whole-string substitutions mis-handles an escaped backslash followed by
  -- "uXXXX", and leaves a lone surrogate escape undecoded.)
  local function parse_string(str, i)
    local parts = {}   -- decoded fragments, joined once at the closing quote
    local len = #str
    local j = i + 1    -- scan position, starts just after the opening quote
    local k = j        -- start of the pending run of unescaped characters

    while j <= len do
      local x = str:byte(j)

      if x < 32 then
        decode_error(str, j, "control character in string")

      elseif x == 92 then -- "\\" (escape char)
        local c = str:sub(j + 1, j + 1)
        if c == "" then
          -- backslash is the last character: the string is unterminated
          break
        end
        if c:byte() < 32 then
          decode_error(str, j + 1, "control character in string")
        end
        -- flush the literal text that precedes the escape
        parts[#parts + 1] = str:sub(k, j - 1)
        if c == "u" then -- unicode escape sequence
          -- Prefer a high surrogate followed by a low surrogate; otherwise
          -- take a single \uXXXX. Both patterns are anchored at j.
          local esc = str:match("^\\u[dD][89aAbB]%x%x\\u[dD][c-fC-F]%x%x", j)
                   or str:match("^\\u%x%x%x%x", j)
          if not esc then
            decode_error(str, j + 1, "invalid unicode escape in string")
          end
          parts[#parts + 1] = parse_unicode_escape(esc)
          j = j + #esc
        else
          if not escape_chars[c] then
            decode_error(str, j + 1, "invalid escape char '" .. c .. "' in string")
          end
          -- escape_char_map_inv is keyed by the full two-character escape
          parts[#parts + 1] = escape_char_map_inv["\\" .. c]
          j = j + 2
        end
        k = j

      elseif x == 34 then -- '"' (end of string)
        parts[#parts + 1] = str:sub(k, j - 1)
        return table.concat(parts), j + 1

      else
        j = j + 1
      end
    end

    decode_error(str, i, "expected closing quote for string")
  end
  -- Parse the number token starting at index `i`.
  -- The token runs up to the next delimiter character (or the end of input)
  -- and is converted with tonumber.
  -- Returns the number and the index of the delimiter; reports
  -- "invalid number '<text>'" through decode_error when conversion fails.
  local function parse_number(str, i)
    local stop = next_char(str, i, delim_chars)
    local text = string.sub(str, i, stop - 1)
    local value = tonumber(text)
    if value == nil then
      decode_error(str, i, "invalid number '" .. text .. "'")
    end
    return value, stop
  end
  -- Parse the bare-word literal (true / false / null) starting at index `i`.
  -- The word runs up to the next delimiter character (or the end of input).
  -- Returns the Lua value for the literal (nil for null) and the index of
  -- the delimiter; reports "invalid literal '<word>'" through decode_error
  -- for any other word.
  local function parse_literal(str, i)
    local stop = next_char(str, i, delim_chars)
    local word = string.sub(str, i, stop - 1)
    local known = literals[word]
    if not known then
      decode_error(str, i, "invalid literal '" .. word .. "'")
    end
    local value = literal_map[word]
    return value, stop
  end
  -- Parse the JSON array whose "[" is at index `i`.
  --
  -- Returns a Lua table holding the elements at consecutive integer keys
  -- (a null element leaves its slot nil) and the index just past the "]".
  -- Reports "expected ']' or ','" through decode_error when an element is
  -- followed by anything else; the reported position is that of the
  -- offending character itself.
  local function parse_array(str, i)
    local res = {}
    local n = 1   -- key for the next element
    i = i + 1     -- step over "["
    while true do
      local x
      i = next_char(str, i, space_chars, true)
      -- Empty / end of array?
      if str:sub(i, i) == "]" then
        i = i + 1
        break
      end
      -- Read token
      x, i = parse(str, i)
      res[n] = x
      n = n + 1
      -- Next token
      i = next_char(str, i, space_chars, true)
      local chr = str:sub(i, i)
      if chr == "]" then
        i = i + 1
        break
      end
      -- Check before advancing so the error points at the bad character
      if chr ~= "," then decode_error(str, i, "expected ']' or ','") end
      i = i + 1
    end
    return res, i
  end
  -- Parse the JSON object whose "{" is at index `i`.
  --
  -- Returns a Lua table mapping each key to its value and the index just
  -- past the "}". When a key occurs more than once the last value wins.
  -- Reports through decode_error:
  --   * "expected string for key" when a key does not start with a quote
  --   * "expected ':' after key"
  --   * "expected '}' or ','" when a value is followed by anything else
  -- Each error position is that of the offending character itself.
  local function parse_object(str, i)
    local res = {}
    i = i + 1   -- step over "{"
    while true do
      local key, val
      i = next_char(str, i, space_chars, true)
      -- Empty / end of object?
      if str:sub(i, i) == "}" then
        i = i + 1
        break
      end
      -- Read key
      if str:sub(i, i) ~= '"' then
        decode_error(str, i, "expected string for key")
      end
      key, i = parse(str, i)
      -- Read ':' delimiter
      i = next_char(str, i, space_chars, true)
      if str:sub(i, i) ~= ":" then
        decode_error(str, i, "expected ':' after key")
      end
      i = next_char(str, i + 1, space_chars, true)
      -- Read value
      val, i = parse(str, i)
      -- Set
      res[key] = val
      -- Next token
      i = next_char(str, i, space_chars, true)
      local chr = str:sub(i, i)
      if chr == "}" then
        i = i + 1
        break
      end
      -- Check before advancing so the error points at the bad character
      if chr ~= "," then decode_error(str, i, "expected '}' or ','") end
      i = i + 1
    end
    return res, i
  end
  -- Dispatch table: first character of a JSON value -> parser for that kind
  -- of value.
  local char_func_map = {
    [ '"' ] = parse_string,
    [ "-" ] = parse_number,
    [ "t" ] = parse_literal,
    [ "f" ] = parse_literal,
    [ "n" ] = parse_literal,
    [ "[" ] = parse_array,
    [ "{" ] = parse_object,
  }
  -- every decimal digit starts a number
  for digit in ("0123456789"):gmatch(".") do
    char_func_map[digit] = parse_number
  end
  -- Generic parser: looks at the character at `idx` and delegates to the
  -- parser registered for it in char_func_map, returning whatever that
  -- parser returns (the value and the index following it).
  -- Reports "unexpected character '<c>'" through decode_error when no parser
  -- is registered for the character.
  parse = function(str, idx)
    local first = str:sub(idx, idx)
    local handler = char_func_map[first]
    if not handler then
      decode_error(str, idx, "unexpected character '" .. first .. "'")
      return
    end
    return handler(str, idx)
  end
  -- Public entry point: decode JSON text into a Lua value.
  -- Raises "expected argument of type string, got <type>" for a non-string
  -- argument, and reports "trailing garbage" through decode_error when
  -- anything other than whitespace follows the first value.
  function json.decode(str)
    local arg_type = type(str)
    if arg_type ~= "string" then
      error("expected argument of type string, got " .. arg_type)
    end
    -- skip leading whitespace, then parse exactly one value
    local start = next_char(str, 1, space_chars, true)
    local res, idx = parse(str, start)
    -- only whitespace may remain after the value
    local rest = next_char(str, idx, space_chars, true)
    if rest <= #str then
      decode_error(str, rest, "trailing garbage")
    end
    return res
  end
  339. return json