-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathlibsldc.c
172 lines (147 loc) · 6.3 KB
/
libsldc.c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
/* https://www.ecma-international.org/wp-content/uploads/ECMA-321_1st_edition_june_2001.pdf */
#include "sldc.h"
#define VERSION(major,minor,release) (((major)<<16)|((minor)<<8)|(release))
#define HBUFFER_SIZE 1024
#define CTRLSYMB_FLUSH 0x1FF0 /*0b1111111110000*/
#define CTRLSYMB_SCHEME_1 0x1FF1 /*0b1111111110001*/
#define CTRLSYMB_SCHEME_2 0x1FF2 /*0b1111111110010*/
#define CTRLSYMB_FILE_MARK 0x1FF3 /*0b1111111110011*/
#define CTRLSYMB_END_OF_RECORD 0x1FF4 /*0b1111111110100*/
#define CTRLSYMB_RESET_1 0x1FF5 /*0b1111111110101*/
#define CTRLSYMB_RESET_2 0x1FF6 /*0b1111111110110*/
#define CTRLSYMB_END_MARKER 0x1FFF /*0b1111111111111*/
#define REALLOC(buffer,current,limit) \
if (current >= limit) { limit <<= 1; buffer = realloc(buffer, limit); }
const guint32 sldc_version = VERSION(1,0,0);
guint16 bin2int(guchar* buf, goffset off, guint8 sz)
{
guint16 v = 0;
for (guint8 i = 0; i < sz; i++)
v |= buf[off + i] << (sz - 1 - i);
return v;
}
guchar* sldc_compress(guchar* buffer, gsize len, gsize* outlen)
{
/* if buffer is NULL, there is absolutely nothing to compress */
if (!buffer) return NULL;
gsize cindex = 0, outsize = 1024; guchar* binbuffer = malloc(outsize);
guchar c; /* general variables */
/* for simplicity reasons this compression implementation only
yields scheme 2 literal data symbols. the major downside of
this technique is that it almost always guarantees that the
compressed data is bigger than the uncompressed data. */
/* yield a RESET_2 control symbol */
for (guint8 i = 0; i < 13; i++)
{
REALLOC(binbuffer,cindex,outsize);
binbuffer[cindex++] = (CTRLSYMB_RESET_2 >> (12 - i)) & 1;
}
/* yield scheme 2 literal bytes */
for (gsize k = 0; k < len; k++)
{
c = buffer[k];
for (guint8 i = 0; i < 8; i++)
{
REALLOC(binbuffer,cindex,outsize);
binbuffer[cindex++] = (c >> (7 - i)) & 1;
}
if (c == 0xFF)
{
REALLOC(binbuffer,cindex,outsize);
binbuffer[cindex++] = 0;
}
}
/* yield an END_OF_RECORD control symbol */
for (guint8 i = 0; i < 13; i++)
{
REALLOC(binbuffer,cindex,outsize);
binbuffer[cindex++] = (CTRLSYMB_END_OF_RECORD >> (12 - i)) & 1;
}
/* add zero-padding to align data on 32 bits boundary */
while (cindex % 32)
{
REALLOC(binbuffer,cindex,outsize);
binbuffer[cindex++] = 0;
}
/* create and populate the output compressed buffer */
*outlen = cindex / 8;
guchar* cbuffer = malloc(*outlen);
for (gsize k = 0; k < *outlen; k++)
cbuffer[k] = bin2int(binbuffer, k << 3, 8);
/* free memory resources */
free(binbuffer);
return cbuffer;
}
guchar* sldc_decompress(guchar* buffer, gsize len, gsize* outlen)
{
/* if buffer is NULL there's absolutely nothing to decompress */
if (!buffer) return NULL;
/* general variables used by the compression algorithm itself */
guchar hbuffer[HBUFFER_SIZE]; gsize hindex = 0; guint8 scheme = 0;
guchar c; guint16 MCF, DF; gboolean breakloop = FALSE;
/* build binary representation of the compressed input buffer */
guchar* binbuffer = malloc(len << 3); goffset off = 0;
for (gsize i = 0; i < len << 3; i++)
binbuffer[i] = (buffer[i / 8] & (1 << (7 - i % 8))) ? 1 : 0;
/* primary allocation of the uncompressed data output buffer */
gsize uindex = 0, outsize = 1024; guchar* ubuffer = malloc(outsize);
/* decoding loop */
while (off < len << 3)
{
/* control symbol */
if (bin2int(binbuffer, off, 9) == 0x1FF /*0b111111111*/)
{
guint16 ctrlsymb = bin2int(binbuffer, off, 13); off += 13;
switch (ctrlsymb)
{
case CTRLSYMB_FLUSH: break;
case CTRLSYMB_SCHEME_1: scheme = 1; break;
case CTRLSYMB_SCHEME_2: scheme = 2; break;
case CTRLSYMB_FILE_MARK: break;
case CTRLSYMB_END_OF_RECORD: breakloop = TRUE; break;
case CTRLSYMB_RESET_1: hindex = 0; scheme = 1; break;
case CTRLSYMB_RESET_2: hindex = 0; scheme = 2; break;
case CTRLSYMB_END_MARKER: break;
default: return NULL;
}
if (breakloop) break;
}
else if (scheme == 1) /* scheme 1 */
{
gboolean literal = binbuffer[off++] == 0 ? TRUE : FALSE;
if (literal) /* literal data */
{
c = bin2int(binbuffer, off, 8); off += 8;
REALLOC(ubuffer,uindex,outsize);
ubuffer[uindex++] = c;
hbuffer[hindex++] = c; hindex %= HBUFFER_SIZE;
}
else /* copy pointer data */
{
if (bin2int(binbuffer, off, 1) == 0x0 /*0b0*/ ) { MCF = (1<<1) + bin2int(binbuffer, off + 1, 1); off += 1 + 1; }
else if (bin2int(binbuffer, off, 2) == 0x2 /*0b10*/ ) { MCF = (1<<2) + bin2int(binbuffer, off + 2, 2); off += 2 + 2; }
else if (bin2int(binbuffer, off, 3) == 0x6 /*0b110*/ ) { MCF = (1<<3) + bin2int(binbuffer, off + 3, 3); off += 3 + 3; }
else if (bin2int(binbuffer, off, 4) == 0xE /*0b1110*/) { MCF = (1<<4) + bin2int(binbuffer, off + 4, 4); off += 4 + 4; }
else if (bin2int(binbuffer, off, 4) == 0xF /*0b1111*/) { MCF = (1<<5) + bin2int(binbuffer, off + 4, 8); off += 4 + 8; }
DF = bin2int(binbuffer, off, 10); off += 10;
for (int k = DF; k < DF + MCF; k++)
{
c = hbuffer[k % HBUFFER_SIZE];
REALLOC(ubuffer,uindex,outsize);
ubuffer[uindex++] = c;
hbuffer[hindex++] = c; hindex %= HBUFFER_SIZE;
}
}
}
else if (scheme == 2) /* scheme 2 */
{
c = bin2int(binbuffer, off, 8); off += 8 + (c == 0xFF ? 1 : 0);
REALLOC(ubuffer,uindex,outsize);
ubuffer[uindex++] = c;
}
}
*outlen = uindex;
/* free memory resources */
free(binbuffer);
return ubuffer;
}