From 03f685eff7d8d5338da1e12251253180b5f38309 Mon Sep 17 00:00:00 2001 From: gloryknight Date: Wed, 19 Sep 2018 21:52:12 +0200 Subject: [PATCH] Selective node splitting. Nodes are split on defined code. By default breakCode is 44 which is comma symbol. Using setBreakCode it is possible to change the value. It may be a good idea to set breakCode to some obscure value (say 0) and ask users to change it to 44 or other value if needed. --- libs/lz-string.js | 25 +++++++++++++++++++++---- 1 file changed, 21 insertions(+), 4 deletions(-) diff --git a/libs/lz-string.js b/libs/lz-string.js index 7697d31..690a0e5 100644 --- a/libs/lz-string.js +++ b/libs/lz-string.js @@ -16,6 +16,7 @@ var LZString = (function () { streamDataPosition, streamBitsPerChar, streamGetCharFromInt, + breakCode=44, reverseDict = {}, base = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+", Base64CharArray = (base + "/=").split(''), @@ -61,7 +62,8 @@ var LZString = (function () { node = _node(3), // first node will always be initialised like this. nextNode, dictSize = 3, - numBitsMask = 0b100; + numBitsMask = 0b100, + forceBreak=true; if (uncompressed.length) { // If there is a string, the first charCode is guaranteed to @@ -87,8 +89,16 @@ var LZString = (function () { for (j = 1; j < uncompressed.length; j++) { c = uncompressed.charCodeAt(j); - // does the new charCode match an existing prefix? - nextNode = node.d[c]; + + // split Node at defined split symbol (do not split if the node starts with the symbol) + if (c===breakCode && forceBreak) { + nextNode=false; + forceBreak=false; + } else { + // does the new charCode match an existing prefix? + nextNode = node.d[c]; + } + if (nextNode) { // continue with next prefix node = nextNode; @@ -100,6 +110,11 @@ var LZString = (function () { // Then we set node to the root node matching // the charCode. + // mark the node if it starts not with the split symbol + if (c!==breakCode) { + forceBreak=true; + } + if (freshNode) { // Prefix is a freshly added character token, // which was already written to the bitstream @@ -369,7 +384,9 @@ var LZString = (function () { return _decompress(compressed.length, 16, function (index) { return compressed.charCodeAt(index); }); }, - decompressFromArray: _decompressFromArray + decompressFromArray: _decompressFromArray, + setBreakCode: function (a) { breakCode=a; }, + getBreakCode: function () { return breakCode; } }; })();