|
| 1 | +/*! bz2 (C) 2019-present SheetJS LLC */ |
| 2 | + |
| 3 | +'use strict'; |
| 4 | + |
| 5 | +(function bz2() { |
// CRC-32 lookup table indexed by the top byte of the running CRC (MSB-first,
// polynomial 0x04c11db7). Generated rather than listed; the values are the same
// as the reference table at
// https://www.ncbi.nlm.nih.gov/IEB/ToolBox/CPP_DOC/lxr/source/src/util/compress/bzip2/crctable.c
const crc32Table = Array.from({ length: 256 }, (_, byte) => {
  let remainder = byte << 24;
  for (let bit = 0; bit < 8; bit += 1) {
    // A negative int32 means the top bit is set, so the polynomial is folded
    // in after shifting that bit out.
    remainder = remainder < 0 ? (remainder << 1) ^ 0x04c11db7 : remainder << 1;
  }
  // Store as an unsigned 32-bit value, matching the hex literals of the reference.
  return remainder >>> 0;
});
| 41 | + |
// masks[n] has the n low-order bits set, i.e. (2 ** n) - 1, for n = 0..31.
// It is used to keep only the low n bits of the 32-bit bit buffer.
// Entry 31 is written out as 0x7fffffff because `(1 << 31) - 1` does not fit
// the int32 arithmetic used by the shift operators.
const masks = [
  0x00000000, 0x00000001, 0x00000003, 0x00000007,
  0x0000000f, 0x0000001f, 0x0000003f, 0x0000007f,
  0x000000ff, 0x000001ff, 0x000003ff, 0x000007ff,
  0x00000fff, 0x00001fff, 0x00003fff, 0x00007fff,
  0x0000ffff, 0x0001ffff, 0x0003ffff, 0x0007ffff,
  0x000fffff, 0x001fffff, 0x003fffff, 0x007fffff,
  0x00ffffff, 0x01ffffff, 0x03ffffff, 0x07ffffff,
  0x0fffffff, 0x1fffffff, 0x3fffffff, 0x7fffffff,
];
| 53 | + |
/**
 * Build canonical Huffman lookup structures from a list of code lengths.
 *
 * Note the field naming: in each entry `code` is the INDEX of the length in
 * `lengths` (the decoded value) and `symbol` is the canonical bit pattern
 * assigned to it.
 *
 * @param {number[]} lengths - code length in bits for each index; falsy
 *   lengths (e.g. 0) get no entry, and a length of exactly -1 ends the list
 *   (that index and everything after it is ignored).
 * @returns {{table: Array<{code: number, bits: number, symbol: number}>,
 *   fastAccess: Array<Object<number, Object>>}} `table` is sorted by
 *   (bits, code); `fastAccess[bits][symbol]` is the same entry object.
 */
function createOrderedHuffmanTable(lengths) {
  // Collect one entry per index that actually has a code length.
  const table = [];
  for (let code = 0; code < lengths.length && lengths[code] !== -1; code += 1) {
    const bits = lengths[code];
    if (bits) {
      table.push({ code, bits, symbol: undefined });
    }
  }

  // Canonical order: shorter codes first, ties broken by index.
  table.sort((left, right) => (left.bits - right.bits) || (left.code - right.code));

  const fastAccess = [];
  let width = 0; // bit length of the previously assigned pattern
  let pattern = -1; // previously assigned bit pattern
  let bucket; // fastAccess slot for the current width
  for (const entry of table) {
    pattern += 1;
    if (entry.bits !== width) {
      // Moving to a longer code: extend the pattern with zero bits.
      pattern <<= entry.bits - width;
      width = entry.bits;
      bucket = {};
      fastAccess[width] = bucket;
    }
    entry.symbol = pattern;
    bucket[pattern] = entry;
  }

  return { table, fastAccess };
}
| 98 | + |
/**
 * Invert a Burrows-Wheeler transform.
 *
 * @param {Array<number|undefined>} src - last column of the sorted rotation
 *   matrix. An `undefined` element is treated as the byte 255 everywhere
 *   (previously the first output element was left as `undefined`). The array
 *   is not modified.
 * @param {number} primary - row index of the original data in the sorted
 *   rotation matrix.
 * @returns {number[]} the original sequence, same length as `src`.
 * @throws {RangeError} when `primary` is not a valid index into `src`.
 */
function bwtReverse(src, primary) {
  if (primary < 0 || primary >= src.length) {
    throw new RangeError('Out of bound');
  }
  const size = src.length;

  // Normalise placeholders up front so every later step sees plain numbers.
  const lastColumn = Array.from(src, (value) => (value === undefined ? 255 : value));
  // Sort a copy: the caller's array must stay untouched.
  const firstColumn = lastColumn.slice().sort((a, b) => a - b);

  // start[v] = first row of the sorted column holding value v. Walking
  // backwards makes the lowest index win.
  const start = {};
  for (let row = size - 1; row >= 0; row -= 1) {
    start[firstColumn[row]] = row;
  }

  // links[k] = row of the sorted column that corresponds to lastColumn[k];
  // equal values are matched in order of appearance.
  const links = lastColumn.map((value) => {
    const row = start[value];
    start[value] = row + 1;
    return row;
  });

  // Follow the links from the primary row. The walk yields the data from the
  // end towards the front, so fill the result backwards.
  const ret = new Array(size);
  let row = primary;
  ret[0] = firstColumn[row];
  for (let pos = size - 1; pos > 0; pos -= 1) {
    row = links[row];
    ret[pos] = firstColumn[row];
  }
  return ret;
}
| 128 | + |
/**
 * Decompress a complete bzip2 stream held in memory.
 *
 * @param {Uint8Array|number[]} bytes - the compressed stream, starting with
 *   the `BZh1`..`BZh9` header.
 * @param {boolean} [checkCRC=false] - when true, compute the CRC-32 of every
 *   decoded block and compare it with the value stored in the block header.
 * @returns {Uint8Array} view over the decompressed bytes.
 * @throws {Error} on a bad header, an unknown block type, a randomised block,
 *   malformed Huffman/selector data, truncated input, a block larger than the
 *   declared block size, or (with `checkCRC`) a CRC mismatch.
 * @throws {RangeError} from `bwtReverse` when the block's origin pointer is
 *   outside the decoded block.
 */
function decompress(bytes, checkCRC = false) {
  let index = 0; // next unread byte of `bytes`
  let bitfield = 0; // unread bits, right-aligned
  let bits = 0; // number of valid bits in `bitfield`

  // Shift the next input byte into the bit buffer. Reading past the end used
  // to inject `undefined` (NaN) and decode garbage; now it fails explicitly.
  const fill = () => {
    if (index >= bytes.length) {
      throw new Error('Unexpected end of input');
    }
    bitfield = (bitfield << 8) + bytes[index];
    index += 1;
    bits += 8;
  };

  // Read an n-bit big-endian unsigned integer.
  const read = (n) => {
    if (n > 24) {
      // Up to 7 bits may be left over, so more than 24 fresh bits could
      // overflow the 32-bit buffer: read wide values as two halves. The high
      // half is weighted by the width of the LOW half.
      const high = n >> 1;
      const low = n - high;
      return read(high) * Math.pow(2, low) + read(low);
    }
    while (bits < n) {
      fill();
    }
    const m = masks[n];
    const r = (bitfield >> (bits - n)) & m;
    bits -= n;
    bitfield &= ~(m << bits); // drop the bits just consumed
    return r;
  };

  if (read(16) !== 0x425A) { // 'BZ'
    throw new Error('Invalid magic');
  }
  if (read(8) !== 0x68) { // h for huffman
    throw new Error('Invalid method');
  }
  const level = read(8) - 48; // ASCII '1'..'9'
  if (level < 1 || level > 9) {
    throw new Error('Invalid blocksize');
  }
  // A block holds at most level * 100000 bytes before the final run-length
  // expansion; used to reject absurd run lengths in corrupt input.
  const maxBlockSize = level * 100000;

  let out = new Uint8Array(bytes.length * 1.5);
  let outIndex = 0;
  let newCRC = -1;

  while (true) { // eslint-disable-line no-constant-condition
    const blocktype = read(48);
    const crc = read(32) | 0; // as int32, to compare with the bitwise CRC below
    if (blocktype === 0x177245385090) { // end-of-stream marker
      read(bits & 0x07); // pad align
      break;
    }
    if (blocktype !== 0x314159265359) { // compressed-block marker
      throw new Error('Invalid bz2 blocktype');
    }
    if (read(1)) {
      throw new Error('do not support randomised');
    }
    const pointer = read(24);

    // Two-level bitmap of the byte values that occur in this block:
    // 16 group bits, then 16 bits for every group that is present.
    const used = [];
    const usedGroups = read(16);
    for (let i = 1 << 15; i > 0; i >>= 1) {
      if (!(usedGroups & i)) {
        for (let j = 0; j < 16; j += 1) {
          used.push(false);
        }
        continue; // eslint-disable-line no-continue
      }
      const usedChars = read(16);
      for (let j = 1 << 15; j > 0; j >>= 1) {
        used.push(!!(usedChars & j));
      }
    }

    // Move-to-front list of the byte values in use. All 256 slots are
    // scanned; stopping one short used to drop byte 0xFF.
    const favourites = [];
    for (let i = 0; i < used.length; i += 1) {
      if (used[i]) {
        favourites.push(i);
      }
    }
    // Two run symbols (0 and 1), one symbol per remaining MTF position, and
    // the end-of-block symbol.
    const symbolsInUse = favourites.length + 2;

    const groups = read(3);
    if (groups < 2 || groups > 6) {
      throw new Error('Invalid number of huffman groups');
    }

    // Selectors are MTF-coded, unary-encoded table indices; one selector
    // covers 50 symbols.
    const selectorsUsed = read(15);
    const selectors = [];
    const mtf = Array.from({ length: groups }, (_, i) => i);
    for (let i = 0; i < selectorsUsed; i += 1) {
      let c = 0;
      while (read(1)) {
        c += 1;
        if (c >= groups) {
          throw new Error('MTF table out of range');
        }
      }
      const v = mtf[c];
      for (let j = c; j > 0; j -= 1) {
        mtf[j] = mtf[j - 1];
      }
      mtf[0] = v;
      selectors.push(v);
    }

    // Delta-coded code lengths, one table per group.
    const tables = [];
    for (let i = 0; i < groups; i += 1) {
      let length = read(5);
      const lengths = [];
      for (let j = 0; j < symbolsInUse; j += 1) {
        for (;;) {
          // Checked at every step so the last symbol's length is validated too.
          if (length < 0 || length > 20) {
            throw new Error('Huffman group length outside range');
          }
          if (!read(1)) {
            break;
          }
          length -= (read(1) * 2) - 1;
        }
        lengths.push(length);
      }
      tables.push(createOrderedHuffmanTable(lengths));
    }

    let decoded = 0; // symbols left before switching to the next selector
    let selectorPointer = 0;
    let t;
    let repeat = 0; // pending run length
    let repeatPower = 0; // weight of the next run symbol
    const buffer = [];
    while (true) { // eslint-disable-line no-constant-condition
      decoded -= 1;
      if (decoded <= 0) {
        decoded = 50;
        if (selectorPointer >= selectors.length) {
          throw new Error('Huffman selectors exhausted');
        }
        t = tables[selectors[selectorPointer]];
        selectorPointer += 1;
      }

      // Try each code width in ascending order until the leading bits match.
      let entry;
      for (let width = 1; width < t.fastAccess.length && !entry; width += 1) {
        const level2 = t.fastAccess[width];
        if (level2) {
          while (bits < width) {
            fill();
          }
          entry = level2[bitfield >> (bits - width)];
          if (entry) {
            bits -= width;
            bitfield &= masks[bits];
          }
        }
      }
      if (!entry) {
        throw new Error('Invalid Huffman code');
      }
      const r = entry.code;

      if (r === 0 || r === 1) {
        // Run symbols encode a repeat count in bijective base 2.
        if (repeat === 0) {
          repeatPower = 1;
        }
        repeat += repeatPower << r;
        repeatPower <<= 1;
        if (repeat > maxBlockSize - buffer.length) {
          throw new Error('Block exceeds declared blocksize');
        }
        continue; // eslint-disable-line no-continue
      }

      // Any other symbol first flushes the pending run of the front byte.
      const runByte = favourites[0];
      for (; repeat > 0; repeat -= 1) {
        buffer.push(runByte);
      }
      if (r === symbolsInUse - 1) { // end of block
        break;
      }
      if (buffer.length >= maxBlockSize) {
        throw new Error('Block exceeds declared blocksize');
      }
      // Symbol r selects MTF position r - 1; move that byte to the front.
      const v = favourites[r - 1];
      for (let j = r - 1; j > 0; j -= 1) {
        favourites[j] = favourites[j - 1];
      }
      favourites[0] = v;
      buffer.push(v);
    }

    const nt = bwtReverse(buffer, pointer);

    // Undo the initial run-length coding: four equal bytes are followed by a
    // count of additional repeats.
    let i = 0;
    while (i < nt.length) {
      const c = nt[i];
      let count = 1;
      if ((i < nt.length - 4)
        && nt[i + 1] === c
        && nt[i + 2] === c
        && nt[i + 3] === c) {
        count = nt[i + 4] + 4;
        i += 5;
      } else {
        i += 1;
      }
      if (outIndex + count > out.length) {
        // Grow until the whole run fits. A single doubling is not enough for
        // small inputs, and out-of-range typed-array writes are silently lost.
        let capacity = Math.max(out.length, 1);
        while (capacity < outIndex + count) {
          capacity *= 2;
        }
        const grown = new Uint8Array(capacity);
        grown.set(out);
        out = grown;
      }
      for (let j = 0; j < count; j += 1) {
        if (checkCRC) {
          newCRC = (newCRC << 8) ^ crc32Table[((newCRC >> 24) ^ c) & 0xff];
        }
        out[outIndex] = c;
        outIndex += 1;
      }
    }

    if (checkCRC) {
      const calculatedCRC = newCRC ^ -1;
      if (calculatedCRC !== crc) {
        throw new Error(`CRC mismatch: ${calculatedCRC} !== ${crc}`);
      }
      newCRC = -1;
    }
  }
  return out.subarray(0, outIndex);
}
| 335 | + |
// Publish the API: as the `bz2` global when `window` exists, through CommonJS
// when `module` exists, otherwise on `self` (e.g. a web worker, where neither
// `window` nor `module` is defined and `module.exports` would throw).
const exports = { decompress };

if (typeof window !== 'undefined') {
  window.bz2 = exports; // eslint-disable-line no-undef
} else if (typeof module !== 'undefined') {
  module.exports = exports;
} else if (typeof self !== 'undefined') {
  self.bz2 = exports; // eslint-disable-line no-undef, no-restricted-globals
}
| 343 | +}()); |
0 commit comments