Advertisement
immibis

decompress

Feb 25th, 2013
140
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Lua 4.03 KB | None | 0 0
  1. local inFN, outFN
  2.  
  3. local args = {...}
  4. if #args ~= 2 then
  5.     error("Usage: "..shell.getRunningProgram().." <input file> <output file>")
  6. end
  7. inFN = args[1]
  8. outFN = args[2]
  9.  
  10. local f = fs.open(inFN, "r")
  11. local inText = f.readAll()
  12. f.close()
  13.  
  14. local inPos = 1
  15.  
  16. local huffmanCompression = true
  17.  
  18. if huffmanCompression then
  19.     -- convert characters to bits
  20.     local inBits = {}
  21.     for k = 1, #inText do
  22.         local byte = inText:sub(k, k):byte() - 32
  23.         for i = 0, 5 do
  24.             local testBit = 2 ^ i
  25.             inBits[#inBits + 1] = (byte % (2 * testBit)) >= testBit
  26.         end
  27.     end
  28.    
  29.     -- remove padding
  30.     local padbit = inBits[#inBits]
  31.     while inBits[#inBits] == padbit do
  32.         inBits[#inBits] = nil
  33.     end
  34.    
  35.     local pos = 1
  36.     local function readBit()
  37.         if pos > #inBits then error("end of stream", 2) end
  38.         pos = pos + 1
  39.         return inBits[pos - 1]
  40.     end
  41.    
  42.     -- read huffman tree
  43.     local function readTree()
  44.         if readBit() then
  45.             local byte = 0
  46.             for i = 0, 7 do
  47.                 if readBit() then
  48.                     byte = byte + 2 ^ i
  49.                 end
  50.             end
  51.             --write(string.char(byte))
  52.             return string.char(byte)
  53.         else
  54.             local subtree_0 = readTree()
  55.             local subtree_1 = readTree()
  56.             return {[false]=subtree_0, [true]=subtree_1}
  57.         end
  58.     end
  59.     local tree = readTree()
  60.    
  61.     inText = ""
  62.    
  63.     local treePos = tree
  64.     while pos <= #inBits do
  65.         local bit = readBit()
  66.         treePos = treePos[bit]
  67.         if type(treePos) ~= "table" then
  68.             inText = inText .. treePos
  69.             treePos = tree
  70.         end
  71.     end
  72.     if treePos ~= tree then
  73.         error("unexpected end of stream")
  74.     end
  75. end
  76.  
  77. local function readTo(delim)
  78.     local start = inPos
  79.     local nextCaret = inText:find(delim, inPos, true)
  80.     if not nextCaret then
  81.         inPos = #inText + 1
  82.         return inText:sub(start)
  83.     end
  84.     inPos = nextCaret + 1
  85.     return inText:sub(start, nextCaret - 1)
  86. end
  87.  
  88. -- returns iterator
  89. local function splitString(str, delim)
  90.     local pos = 1
  91.     return function()
  92.         if pos > #str then return end
  93.         local start = pos
  94.         local nextDelim = str:find(delim, pos, true)
  95.         if not nextDelim then
  96.             pos = #str + 1
  97.             return str:sub(start)
  98.         end
  99.         pos = nextDelim + 1
  100.         return str:sub(start, nextDelim - 1)
  101.     end
  102. end
  103.  
  104. local nameTable = {}
  105.  
  106. local idents = "abcdefghijklmnopqrstvuwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789_"
  107. local nextCompressed
  108. do
  109.     local validchars = idents:gsub("_","")
  110.    
  111.     local function encode(n)
  112.         local s = ""
  113.         while n > 0 do
  114.             local digit = (n % #validchars) + 1
  115.             s = s .. validchars:sub(digit, digit)
  116.             n = math.floor(n / #validchars)
  117.         end
  118.         return s
  119.     end
  120.    
  121.     local next = 0
  122.     function nextCompressed()
  123.         next = next + 1
  124.         return encode(next)
  125.     end
  126. end
  127.  
  128. for k = 1, tonumber(readTo("^")) do
  129.     local key = nextCompressed()
  130.     local value = readTo("^")
  131.     --print(key," -> ",value)
  132.     nameTable[key] = value
  133.     --assert(readTo("^") == tostring(k), "mismatch at "..k)
  134. end
  135.  
  136. local out = ""
  137.  
  138. local function onFinishSegment(isIdent, segment)
  139.     if isIdent then
  140.         if segment:sub(1, 1) == "_" then
  141.             out = out .. segment:sub(2)
  142.         else
  143.             out = out .. tostring(nameTable[segment])
  144.         end
  145.     else
  146.         out = out .. segment
  147.     end
  148. end
  149.  
  150. local parsed = {}
  151. local idents = "abcdefghijklmnopqrstvuwxyzABCDEFGHIJKLMNOPQRSTUVWXYZ0123456789_"
  152. local lastIdent = nil
  153.  
  154. for k = inPos, #inText do
  155.     local ch = inText:sub(k, k)
  156.     local isIdent = idents:find(ch, 1, true) ~= nil
  157.     if isIdent ~= lastIdent then
  158.         if #parsed > 0 then
  159.             onFinishSegment(lastIdent, parsed[#parsed])
  160.         end
  161.         parsed[#parsed+1] = ""
  162.     end
  163.     lastIdent = isIdent
  164.     parsed[#parsed] = parsed[#parsed]..ch
  165. end
  166. if #parsed > 0 then
  167.     onFinishSegment(isIdent, parsed[#parsed])
  168. end
  169.  
  170. -- convert indentation back
  171. local out2 = ""
  172. local lastIndent = ""
  173. for line in splitString(out, "\n") do
  174.     while line:sub(1,2) == "&+" do
  175.         lastIndent = lastIndent .. "\t"
  176.         line = line:sub(3)
  177.     end
  178.     while line:sub(1,2) == "&-" do
  179.         lastIndent = lastIndent:sub(1, #lastIndent - 1)
  180.         line = line:sub(3)
  181.     end
  182.     if line:sub(1,2) == "&&" then
  183.         line = line:sub(2)
  184.     end
  185.    
  186.     out2 = out2 .. lastIndent .. line .. "\n"
  187. end
  188.  
  189. --print(out2)
  190.  
  191. local f = fs.open(outFN, "w")
  192. f.write(out2)
  193. f.close()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement