基於lua 5.2.3 封裝實現一個可供其他lua腳本使用的功能模塊,具體要求爲: 一、實現一個標準的lua功能模塊 二、封裝json格式的數據與lua value間的互相轉換功能 三、遵循json格式定義確保相同的數據源彼此轉換後數據仍然一致 四、只容許使用lua內建基礎庫,不容許使用任何第三方開發庫 五、有合理的註釋和單元測試代碼 六、獨立完成此作業,對任何代碼抄襲現象零容忍 基本要求: 提交lua代碼文件名爲json.lua,測試代碼和文檔(如果有)可以打一個包作爲第二個附件提交 json.lua中需要實現如下接口: function Marshal(json_str) return lua_val end function Unmarshal(lua_val) return "json_str" end 對基本要求的說明: 一、lua版本要求5.2.3 二、lua的空table統一轉化成json的空object,而不是空array 三、test case中的json_str符合ECMA-404 json格式標準 四、Unmarshal傳入的lua_val如果是table的話,不會有循環嵌套 五、table如果是以array方式使用,轉換如下:{[2]=1,[4]=1} == {nil,1,nil,1} <-> [null,1,null,1] 六、table中有string key時,統一處理成hash table的格式,如:{1,2;a=3} -> {"1":1,"2":2,"a":3} 七、不會出現類似 {1,2;["2"]="same key 2 in json"} 造成轉換有歧義的table 八、Unicode轉成lua字符串時,按lua的字符串格式 \xXX\xYY... 九、能成功轉換的話,只需要return單個值 進階要求: 對test case的錯誤進行檢查,返回相應錯誤 function Marshal(json_str) return nil, "error_type" end 基本測試方法: local json = require 'json' local test_result1 = json.Marshal('{"a":1}') local test_result2 = json.Unmarshal{ b="cd" } -- validate test_result1 & test_result2
首先這個問題是實現一個模塊。從lua 5.1版開始,lua已經爲模塊和包定義了一系列的規則,我們需要使用table、函數、元表和環境來實現這些規則。其中lua提供了兩個重要的函數實現這些規則,分別是require(使用模塊的函數)和module(創建模塊的函數)。
require "<模塊名>"。其實這裏require的功能感覺和dofile比較像,但是還是存在區別的,require詳細的內容我目前也不是很理解,這裏先略去。
-- Module bootstrap template: creates the module table and registers it.
-- The chunk's first vararg is taken as the module name
-- (presumably supplied by require -- confirm against the Lua manual).
local modname = ...
-- Table that will hold everything the module defines.
local M = {}
-- Publish the module table as a global named after the module.
_G[modname] = M
-- Record it in package.loaded under the module name.
package.loaded[modname] = M
-- The next line is a placeholder, not Lua code: it stands for whatever
-- locals the module needs to keep reaching the outside world.
<setup for external access>
-- Make M the environment of this chunk so later global definitions land in M.
-- NOTE(review): setfenv is Lua 5.1 only; it was removed in Lua 5.2.
setfenv(1,M)
-- Skeleton of the json module.
-- Uses the table-return idiom instead of the deprecated
-- module(..., package.seeall) call: the functions live in a local table that
-- is returned to require, and nothing is written to the global environment.
local M = {}

--- Placeholder for the JSON -> Lua conversion; currently only echoes its input.
-- @param json_str the JSON text
function M.Marshal(json_str)
  print(json_str)
end

--- Placeholder for the Lua -> JSON conversion; currently only echoes its input.
-- @param lua_content the Lua value
function M.Unmarshal(lua_content)
  print(lua_content)
end

return M
json的語法很是的簡單,數據在 名稱/值 對中,數據由逗號分隔,花括號保存對象,方括號保存數組;
首先json數據是由對象 or 數組組成的基本結構;
因此會有兩個dict進行轉換; 關於unicode碼的轉換後面進行解釋;
-- Lookup tables for the two-character JSON escape sequences.
-- (The original snippet did not compile: the first key was missing its closing
-- quote and one entry was missing its trailing comma.)

-- json_to_lua: escape as written in JSON text (backslash + letter) -> the
-- character it denotes.
json_to_lua = {
  ['\\"'] = '"',
  ['\\/'] = '/',
  ['\\\\'] = '\\',
  ["\\t"] = "\t",
  ["\\f"] = "\f",
  ["\\r"] = "\r",
  ["\\n"] = "\n",
  ["\\b"] = "\b"
}

-- lua_json: the inverse mapping, character -> escape to emit in JSON text.
lua_json = {
  ['"'] = '\\"',
  ['\\'] = '\\\\',
  ['/'] = '\\/',
  ['\b'] = '\\b',
  ['\f'] = '\\f',
  ['\n'] = '\\n',
  ['\r'] = '\\r',
  ['\t'] = '\\t'
}
a. Marshal是解析json字符串的接口,從第一個字符開始遍歷json字符串,position設置爲1。
b. skipBlank函數跳過空格,tab,換行等空白字符;
c. 找到第一個有效字符,'{' 或者 '[',分別繼續調用decodeObject和decodeArray函數返回相應的內部lua table即可。如果不是這兩個符號,則此json字符串存在格式錯誤。
--two interface encode json or decode json

--- Parse a JSON document (top level must be an object or an array).
--params
--[in] json_str : json string
--[out] the decoded lua table on success; nil plus an error message on failure
-- Side effect: adds the elapsed wall-clock seconds (os.time resolution) to
-- M.MarshalTime, treating a missing counter as 0.
function M.Marshal(json_str)
  local nowTime = os.time()
  local json_len = string.len(json_str)

  --null json string case: nothing but blanks
  local position = M.skipBlank(json_str,1)
  if position > json_len then
    return nil,[[null json string]]
  end

  --change to json object or json array, otherwise invalid.
  --Both decoders return (value, next position) on success and
  --(nil, error message) on failure, so the second result is kept as well.
  local c = string.sub(json_str,position,position)
  local res,next_position
  if c == [[{]] then
    res,next_position = M.decodeObject(json_str,position)
  elseif c == [[[]] then
    res,next_position = M.decodeArray(json_str,position)
  else
    next_position = [[error that json no an object or array,invalid]]
  end

  M.MarshalTime = (M.MarshalTime or 0) + os.time() - nowTime

  if res == nil then
    --on failure the second slot carries the error message
    return nil,next_position
  end

  --only blanks may follow the top-level value
  if M.skipBlank(json_str,next_position) <= json_len then
    return nil,[[error that json has trailing characters after the top-level value]]
  end
  return res
end
--skip the blank character
--blank character include space,\n \r \t
--params
--[in] json_str : json string
--[in] position : current position of the string
--[out] the position of the first non-blank character at or after position
--      (string length + 1 when only blanks remain; position itself when it is
--      already past the end)
function skipBlank(json_str,position)
  local json_len = string.len(json_str)
  while position <= json_len do
    -- Compare byte values instead of using the character as a search pattern:
    -- as a pattern, '.', '^' and '$' would match and be skipped as blanks,
    -- and '%' or '(' would raise a "malformed pattern" error.
    local b = string.byte(json_str,position)
    if b == 32 or b == 9 or b == 13 or b == 10 then
      position = position + 1
    else
      break
    end
  end
  return position
end
解析json object
json object開始於 '{',結束於 '}',由key:value對組成,由 ',' 分隔;
不斷的讀取key , ':' , value 而後填入相應的lua table,返回lua table便可;
其中利用計數的方法保證 ',' 的語法正確;
-- Print a diagnostic and build the (nil, message) failure result.
local function objectError(printed,returned)
  base.print(printed)
  return nil,returned
end

--decode from json object
--begin with '{'
--params
--[in] json_str : json string
--[in] position : current position of the string (must point at '{')
--[out] lua table , the next of the end position of the object;
--      nil plus an error message when the text is malformed
--
--Grammar handled: { "key" : value , "key" : value , ... }
--value is a string, number, object, array, true, false or null.
--A null value leaves the key absent because a lua table cannot store nil.
function decodeObject(json_str,position)
  local lua_object = {}
  --check case
  if string.sub(json_str,position,position) ~= [[{]] then
    return objectError([[error that object not start with { ]],[[error in decodeObject begin]])
  end
  position = skipBlank(json_str,position + 1)
  if string.sub(json_str,position,position) == [[}]] then
    return lua_object,position + 1
  end

  local json_len = string.len(json_str)
  local paircount = 0
  while position <= json_len do
    --key: every iteration must start at a string
    position = skipBlank(json_str,position)
    local c = string.sub(json_str,position,position)
    if c ~= [["]] then
      if c == [[,]] and paircount == 0 then
        return objectError([[error that , in key:value is the first]],[[error that , in key:value is the first]])
      elseif c == [[,]] then
        return objectError([[error that , in key:value is more than one]],[[error that , in key:value is more than one]])
      elseif c == [[}]] then
        return objectError("error that , is adjace to }","error that , is adjace to }")
      end
      return objectError([[error json format]],[[error json format,in decodeObject end]])
    end
    local key
    key,position = decodeString(json_str,position)

    --:
    position = skipBlank(json_str,position)
    if string.sub(json_str,position,position) ~= [[:]] then
      return objectError([[error,that object not key:value format]],[[error in decodeObject,format error]])
    end

    --value: dispatch on its first character
    position = skipBlank(json_str,position + 1)
    c = string.sub(json_str,position,position)
    local value,next_position
    if c == '[' then
      value,next_position = decodeArray(json_str,position)
    elseif c == '{' then
      value,next_position = decodeObject(json_str,position)
    elseif c == [["]] then
      value,next_position = decodeString(json_str,position)
    elseif c ~= '' and string.find([[+-0123456789.e]],c,1,true) then
      --plain find: c must not be interpreted as a pattern
      value,next_position = decodeNumber(json_str,position)
    else
      value,next_position = decodeOther(json_str,position)
    end
    --Every decoder returns a numeric position on success and an error string
    --on failure. Testing the position (not the value) lets false and null
    --through as legitimate values.
    if base.type(next_position) ~= "number" then
      return objectError([[error in json object key:value --> value,can't get value]],[[error in decodeObject value]])
    end
    lua_object[key] = value
    paircount = paircount + 1

    --after a pair only ',' (another pair follows) or '}' (done) is legal
    position = skipBlank(json_str,next_position)
    c = string.sub(json_str,position,position)
    if c == [[}]] then
      return lua_object,position + 1
    end
    if c ~= [[,]] then
      return objectError([[error json format]],[[error json format,in decodeObject end]])
    end
    position = position + 1
  end
  --input ended before the closing }
  return objectError([[error json format]],[[error json format,in decodeObject end]])
end
解析json array
json array的解析開始於 '[' 符號,結束於 ']' 符號,value值之間利用 ',' 隔開;
建立一個lua table,針對value值利用 t[#t+1] = value插入新的值,新的值根據符號調用相應的decode方法便可,
其中爲了確保json語法錯誤被檢測出來,利用計數的方法保證 ',' 語法的正確;
-- Print a diagnostic and build the (nil, message) failure result.
local function arrayError(printed,returned)
  base.print(printed)
  return nil,returned
end

--decode from json array
--begin with '['
--params
--[in] json_str : json string
--[in] position : current position of the string (must point at '[')
--[out] lua table , the next of the end position of the array;
--      nil plus an error message when the text is malformed
--
--Grammar handled: [ value , value , ... ]
--value is a string, number, object, array, true, false or null.
--Elements are stored by their ordinal index, so a null leaves a hole at its
--position ([null,1,null,1] -> {nil,1,nil,1}) instead of being dropped.
function decodeArray(json_str,position)
  local lua_array = {}
  --check case
  if string.sub(json_str,position,position) ~= '[' then
    return arrayError([[error that array not start with [ ]],[[error in decodeArray begin]])
  end
  position = skipBlank(json_str,position + 1)
  if string.sub(json_str,position,position) == ']' then
    return lua_array,position + 1
  end

  local json_len = string.len(json_str)
  --number of elements read so far; also the index of the last element.
  --An explicit counter is used because # is unreliable on tables with holes.
  local count = 0
  while position <= json_len do
    position = skipBlank(json_str,position)
    local c = string.sub(json_str,position,position)

    --a value is required here: [,] ["hello",] [,"hello"] ["hello",,"world"]
    if c == ',' then
      if count == 0 then
        return arrayError([[error that , is the first]],[[error that , is the first]])
      end
      return arrayError([[error that , is more than one]],[[error that , is more than one]])
    elseif c == ']' then
      return arrayError("error that , is adjace to ]","error that , is adjace to ]")
    end

    local value,next_position
    if c == '[' then
      value,next_position = decodeArray(json_str,position)
    elseif c == '{' then
      value,next_position = decodeObject(json_str,position)
    elseif c == [["]] then
      value,next_position = decodeString(json_str,position)
    elseif c ~= '' and string.find([[+-0123456789.e]],c,1,true) then
      --plain find: c must not be interpreted as a pattern
      value,next_position = decodeNumber(json_str,position)
    else
      value,next_position = decodeOther(json_str,position)
    end
    --decoders return a numeric position on success, an error string on failure
    if base.type(next_position) ~= "number" then
      return nil,next_position
    end
    count = count + 1
    lua_array[count] = value

    --after a value only ',' (another value follows) or ']' (done) is legal
    position = skipBlank(json_str,next_position)
    c = string.sub(json_str,position,position)
    if c == ']' then
      return lua_array,position + 1
    end
    if c ~= ',' then
      return arrayError('error that array not end with ]',[[error in decodeArray end]])
    end
    position = position + 1
  end
  --input ended before the closing ]
  return arrayError('error that array not end with ]',[[error in decodeArray end]])
end
解析json string
-- Single-letter escapes; any other escaped character stands for itself
-- (covers \" \\ \/ and keeps the lenient "strip the backslash" fallback).
local simpleEscapes = { b = "\b", f = "\f", n = "\n", r = "\r", t = "\t" }

-- Encode one Unicode code point (0 .. 0x10FFFF) as a UTF-8 byte string.
local function encodeUtf8(n)
  if n < 0x80 then
    return string.char(n)
  elseif n < 0x800 then
    -- [110x xxxx] [10xx xxxx]
    return string.char(0xC0 + math.floor(n/64), 0x80 + (n % 0x40))
  elseif n < 0x10000 then
    -- [1110 xxxx] [10xx xxxx] [10xx xxxx]
    return string.char(0xE0 + math.floor(n/4096), 0x80 + (math.floor(n/64) % 0x40), 0x80 + (n % 0x40))
  end
  -- [1111 0xxx] [10xx xxxx] [10xx xxxx] [10xx xxxx]
  return string.char(0xF0 + math.floor(n/262144), 0x80 + (math.floor(n/4096) % 0x40),
    0x80 + (math.floor(n/64) % 0x40), 0x80 + (n % 0x40))
end

--decode json string,include json key of key/value and the string value
--begin with ' " '
--params
--[in] json_str : json string
--[in] position : current position of the string (points at the opening quote)
--[out] lua string , the next of the end position of the string
--
--The text is scanned once, left to right, so an escaped backslash directly
--before the closing quote ("a\\") ends the string correctly and "\\u0041"
--stays a backslash followed by the text u0041. A \uD8xx\uDCxx surrogate pair
--becomes one 4-byte UTF-8 sequence. This function never reports an error: an
--unterminated string yields the remaining text and a position past the end
--of the input, and a \u not followed by four hex digits is kept as 'u'.
function M.decodeString(json_str,position)
  local json_len = string.len(json_str)
  local pieces = {}
  local cursor = position + 1
  while cursor <= json_len do
    --copy everything up to the next quote or backslash verbatim
    local stop = string.find(json_str,'["\\]',cursor)
    if not stop then
      pieces[#pieces+1] = string.sub(json_str,cursor)
      break
    end
    if stop > cursor then
      pieces[#pieces+1] = string.sub(json_str,cursor,stop - 1)
    end
    if string.sub(json_str,stop,stop) == [["]] then
      return table.concat(pieces),stop + 1
    end

    --escape sequence
    local esc = string.sub(json_str,stop + 1,stop + 1)
    local hex = esc == 'u' and string.match(json_str,'^%x%x%x%x',stop + 2)
    if hex then
      local code = tonumber(hex,16)
      cursor = stop + 6
      if code >= 0xD800 and code <= 0xDBFF then
        --high surrogate: combine with a following low surrogate if present
        local lowhex = string.match(json_str,'^\\u(%x%x%x%x)',cursor)
        local low = lowhex and tonumber(lowhex,16)
        if low and low >= 0xDC00 and low <= 0xDFFF then
          code = 0x10000 + (code - 0xD800) * 0x400 + (low - 0xDC00)
          cursor = cursor + 6
        end
      end
      pieces[#pieces+1] = encodeUtf8(code)
    else
      pieces[#pieces+1] = simpleEscapes[esc] or esc
      cursor = stop + 2
    end
  end
  --no closing quote found
  return table.concat(pieces),json_len + 2
end
-- Characters that have a dedicated two-character escape in JSON text.
local ecapses = {
  ['"'] = '\\"',
  ['\\'] = '\\\\',
  ['/'] = '\\/',
  ['\b'] = '\\b',
  ['\f'] = '\\f',
  ['\n'] = '\\n',
  ['\r'] = '\\r',
  ['\t'] = '\\t'
}

--- Escape a lua string so it can be placed between double quotes in JSON.
-- Characters with a short escape use it; every other control character below
-- 0x20 is written as \u00XX, as JSON requires. All other bytes pass through.
--[in] s : lua string
--[out] the escaped string (exactly one return value)
function encodeString(s)
  -- Only visit the characters that may need escaping.
  local escaped = string.gsub(s,'[%c"\\/]',function(c)
    local short = ecapses[c]
    if short then
      return short
    end
    local byte = string.byte(c)
    if byte < 0x20 then
      return string.format('\\u%04x',byte)
    end
    -- returning nothing keeps the character (e.g. DEL, 0x7F) unchanged
  end)
  -- gsub also returns the substitution count; do not leak it to callers.
  return escaped
end

-- Reverse mapping used while decoding: escape text (backslash + letter) to
-- the character it denotes.
local escapeSequences = {
  ["\\t"] = "\t",
  ["\\f"] = "\f",
  ["\\r"] = "\r",
  ["\\n"] = "\n",
  ["\\b"] = "\b"
}
setmetatable(escapeSequences, {__index = function(t,k)
  -- skip "\" aka strip escape: any other escaped character stands for itself
  return string.sub(k,2)
end})
解析json number
--decode json number
--Accepts exactly the JSON number grammar:
--  [-] int [. digits] [(e|E) [+|-] digits]
--where int is 0 or a digit sequence without a leading zero.
--[in] json_str : json string
--[in] position : current position of the string
--[out] lua number , the next of the end position of the number;
--      nil plus an error message when no valid number starts at position
function decodeNumber(json_str,position)
  local function malformed()
    base.print [[error in number format]]
    return nil,[[error in decodeNumber end]]
  end

  --integer part; '^' anchors the match at position, () captures the position
  --just past it
  local digits,cursor = string.match(json_str,'^%-?(%d+)()',position)
  if not digits then
    base.print [[error that number not start with - or a digit]]
    return nil,[[error in decodeNumber begin]]
  end
  if string.len(digits) > 1 and string.sub(digits,1,1) == '0' then
    --leading zeros such as 01 are not JSON
    return malformed()
  end

  --optional fraction: a '.' must be followed by at least one digit
  local c = string.sub(json_str,cursor,cursor)
  if c == '.' then
    cursor = string.match(json_str,'^%.%d+()',cursor)
    if not cursor then
      return malformed()
    end
    c = string.sub(json_str,cursor,cursor)
  end

  --optional exponent, lower or upper case, with an optional sign
  if c == 'e' or c == 'E' then
    cursor = string.match(json_str,'^[eE][+-]?%d+()',cursor)
    if not cursor then
      return malformed()
    end
  end

  --string to number,lua have this function - tonumber
  local number = base.tonumber(string.sub(json_str,position,cursor - 1))
  if not number then
    return malformed()
  end
  return number,cursor
end
-- The three JSON literals, in the order they are tried, and the lua value
-- each one maps to. "null" is deliberately absent from the value table:
-- looking it up yields nil, which is its lua counterpart.
-- Kept as locals so no global names are created and the tables are built once.
local literalNames = {"true","false","null"}
local literalValues = { ["true"] = true,["false"] = false }

--decode other json value
--include boolean value(true,false) or null
--[in] json_str : json string
--[in] position : current position of the string
--[out] lua boolean or nil , the next of the end position of the literal.
--      On failure returns nil plus an error message, so callers must tell
--      null from failure by the type of the second result
--      (number = position, string = error).
function decodeOther(json_str,position)
  for i = 1,#literalNames do
    local name = literalNames[i]
    local stop = position + string.len(name) - 1
    if string.sub(json_str,position,stop) == name then
      return literalValues[name],stop + 1
    end
  end
  base.print [[error,invalid json other,not true,false,null]]
  return nil,[[error in decodeOther end]]
end
這部分比較簡單,也存在一種可能是我考慮得比較簡單,目前感覺實現還是正確的,因爲我在debug的時候實現了一個printLuaTable函數,打印json轉換爲lua table的內部結構;
--this function check lua_table is array or is an object
--compare to json
--A table counts as an array when every key is a positive integer; any other
--key (string, fraction, zero, negative) makes it a key/value object.
--[in] lua_table : table type in lua
--[out] boolean and maxnumber of array : true indicate that the lua table is
--      an array,false indicate that the lua table is an key/value table.
--      The second result is the largest index seen before the scan stopped.
--      An empty table yields true,0.
function LuaArray(lua_table)
  local isarray = true
  local maxindex = 0
  for k,_ in base.pairs(lua_table) do
    if base.type(k) ~= [[number]] or math.floor(k) ~= k or k < 1 then
      isarray = false
      break
    end
    maxindex = math.max(maxindex,k)
  end
  return isarray,maxindex
end

-- Write one value followed by a newline; tables are printed recursively
-- with a deeper indent.
local function printLuaValue(value,space)
  local kind = base.type(value)
  if kind == "boolean" then
    if value then
      io.write('true\n')
    else
      io.write('false\n')
    end
  elseif kind == "number" or kind == "string" then
    io.write(value .. '\n')
  elseif kind == "nil" then
    io.write('nil\n')
  else
    printLuaTable(value,space + 4)
  end
end

--for test lua Table
--output lua table
--format output table
--[in] luaT : table to print
--[in] space : number of indentation characters for this nesting level
--Arrays are printed between [ and ], key/value tables between { and }.
--(The original wrote the closing } after the if/else, so arrays ended with
--both ] and }.)
function printLuaTable(luaT,space)
  local ss = string.rep([[ ]],space)
  local isarray,alen = LuaArray(luaT)
  if isarray then
    io.write(ss .. '[\n')
    for i = 1,alen do
      io.write(ss .. [[ ]])
      printLuaValue(luaT[i],space)
    end
    io.write(ss .. ']\n')
  else
    io.write(ss .. '{\n')
    for k,v in base.pairs(luaT) do
      local str = [[ ]] .. k .. ':'
      io.write(ss .. str)
      printLuaValue(v,space)
    end
    io.write(ss .. '}\n')
  end
end
--- Convert a lua table to JSON text.
--[in] lua_content : lua table (no cycles)
--[out] json string; nil plus an error message when the value cannot be encoded
function Unmarshal(lua_content)
  --the pieces are collected in a local table and joined once at the end
  local result = {}
  local ok,err = Unmarsha1Helper(lua_content,result)
  if not ok then
    return nil,err
  end
  return table.concat(result)
end

-- Append the JSON text of a single value to result.
-- Returns true on success, nil plus an error message otherwise.
local function appendJsonValue(value,result)
  local kind = base.type(value)
  if kind == "boolean" then
    result[#result+1] = value and [[true]] or [[false]]
  elseif kind == "number" then
    result[#result+1] = '' .. value
  elseif kind == "string" then
    --escape quotes, backslashes and control characters;
    --the parentheses keep only encodeString's first result
    result[#result+1] = [["]] .. (encodeString(value)) .. [["]]
  elseif kind == "nil" then
    result[#result+1] = "null"
  else
    return Unmarsha1Helper(value,result)
  end
  return true
end

--[in] lua_content:lua table to encode
--[in] result:table that collects the pieces of the json string
--[out] true on success; nil plus an error message on failure
--A table whose keys are all positive integers (and which is not empty) becomes
--a json array with null in the holes; every other table, including the empty
--one, becomes a json object whose keys are written as strings.
function Unmarsha1Helper(lua_content,result)
  if base.type(lua_content) ~= "table" then
    base.print [[error that lua_content is not table]]
    return nil,[[error in Unmarsha1Helper end]]
  end
  local isarray,arraylen = LuaArray(lua_content)
  if isarray and arraylen >= 1 then
    --array
    result[#result+1] = '['
    for i = 1,arraylen do
      if i > 1 then
        result[#result+1] = ','
      end
      local ok,err = appendJsonValue(lua_content[i],result)
      if not ok then
        return nil,err
      end
    end
    result[#result+1] = ']'
  else
    --object
    result[#result+1] = [[{]]
    local first = true
    for k,v in base.pairs(lua_content) do
      local keykind = base.type(k)
      if keykind ~= "string" and keykind ~= "number" then
        base.print [[error that table key is not string or number]]
        return nil,[[error that table key is not string or number]]
      end
      if not first then
        result[#result+1] = ','
      end
      first = false
      --'' .. k turns a numeric key into its text form before escaping
      result[#result+1] = '"' .. (encodeString('' .. k)) .. '"' .. ':'
      local ok,err = appendJsonValue(v,result)
      if not ok then
        return nil,err
      end
    end
    result[#result+1] = [[}]]
  end
  return true
end
Unicode符號範圍 | UTF-8編碼方式
(十六進制) | (二進制)
0000 0000-0000 007F | 0xxxxxxx
0000 0080-0000 07FF | 110xxxxx 10xxxxxx
0000 0800-0000 FFFF | 1110xxxx 10xxxxxx 10xxxxxx
0001 0000-0010 FFFF | 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx