diff options
author | yann.collet.73@gmail.com <yann.collet.73@gmail.com@650e7d94-2a16-8b24-b05c-7c0b3f6821cd> | 2011-06-04 17:15:43 (GMT) |
---|---|---|
committer | yann.collet.73@gmail.com <yann.collet.73@gmail.com@650e7d94-2a16-8b24-b05c-7c0b3f6821cd> | 2011-06-04 17:15:43 (GMT) |
commit | 6b798d5e40e4c0788f7c51f6e9b0e9c4e966d068 (patch) | |
tree | f21ae23e1e95dffeee7f5b47c37dc93656ce26a3 /lz4.c | |
parent | 0121f47e00e44a40a41d7b49852129b12f5e1d43 (diff) | |
download | lz4-6b798d5e40e4c0788f7c51f6e9b0e9c4e966d068.zip lz4-6b798d5e40e4c0788f7c51f6e9b0e9c4e966d068.tar.gz lz4-6b798d5e40e4c0788f7c51f6e9b0e9c4e966d068.tar.bz2 |
New function : LZ4_uncompress : secure version which is safe against buffer overflow attacks
New function : LZ4_uncompress_unknownOutputSize : secure but slower version which also guess the size of data to be decoded
The demo file compression program (main.c) is updated to use these new functions
LZ4_decode is still supported but in deprecated status, due to its vulnerability to malicious buffer overflow scenario
git-svn-id: https://lz4.googlecode.com/svn/trunk@9 650e7d94-2a16-8b24-b05c-7c0b3f6821cd
Diffstat (limited to 'lz4.c')
-rw-r--r-- | lz4.c | 215 |
1 files changed, 181 insertions, 34 deletions
@@ -36,6 +36,16 @@ //**************************************
+// Performance parameter <---------------------------------------------------------
+//**************************************
+// Lowering this value reduce memory usage
+// It may also improve speed, especially if you reach L1 cache size (32KB for Intel, 64KB for AMD)
+// Expanding memory usage typically improves compression ratio
+// Memory usage formula : N->2^(N+2) Bytes (examples : 17 -> 512KB ; 12 -> 16KB)
+#define HASH_LOG 17
+
+
+//**************************************
// Basic Types
//**************************************
#if defined(_MSC_VER) || defined(_WIN32) || defined(__WIN32__)
@@ -61,7 +71,6 @@ #define MAXD_LOG 16
#define MAX_DISTANCE ((1 << MAXD_LOG) - 1)
-#define HASH_LOG 17 // <--- Lower this value to lower memory usage. N->2^(N+2) Bytes (ex : 17 -> 512KB)
#define HASHTABLESIZE (1 << HASH_LOG)
#define HASH_MASK (HASHTABLESIZE - 1)
@@ -145,27 +154,21 @@ int LZ4_compressCtx(void** ctx, ref = HashTable[h];
HashTable[h] = ip;
- // Min Match
+ // Check Min Match
if (( ((ip-ref) >> MAXD_LOG) != 0) || (*(U32*)ref != sequence))
{
- if (ip-anchor>limit) { limit<<=1; step += 1 + (step>>2); }
- ip+=step;
+ if (ip-anchor>limit) { limit <<= 1; step += 1 + (step>>2); }
+ ip += step;
continue;
}
// catch up
- if (step>1)
- {
- HashTable[h] = ref;
- ip -= (step-1);
- step=1;
- continue;
- }
- limit=INCOMPRESSIBLE;
+ if (step>1) { HashTable[h] = ref; ip -= (step-1); step=1; continue; }
+ limit = INCOMPRESSIBLE;
// Encode Literal length
len = length = ip - anchor;
- orun=op++;
+ orun = op++;
if (len>(RUN_MASK-1)) { *orun=(RUN_MASK<<ML_BITS); len-=RUN_MASK; for(; len > 254 ; len-=255) *op++ = 255; *op++ = (BYTE)len; }
else *orun = (len<<ML_BITS);
@@ -191,14 +194,16 @@ int LZ4_compressCtx(void** ctx, anchor = ip;
}
-
// Encode Last Literals
len = length = iend - anchor;
- orun=op++;
- if (len>(RUN_MASK-1)) { *orun=(RUN_MASK<<ML_BITS); len-=RUN_MASK; for(; len > 254 ; len-=255) *op++ = 255; *op++ = (BYTE) len; }
- else *orun = (len<<ML_BITS);
- for(;length>0;length-=4) { *(U32*)op = *(U32*)anchor; op+=4; anchor+=4; }
- op += length; // correction
+ if (length)
+ {
+ orun=op++;
+ if (len>(RUN_MASK-1)) { *orun=(RUN_MASK<<ML_BITS); len-=RUN_MASK; for(; len > 254 ; len-=255) *op++ = 255; *op++ = (BYTE) len; }
+ else *orun = (len<<ML_BITS);
+ for(;length>0;length-=4) { *(U32*)op = *(U32*)anchor; op+=4; anchor+=4; }
+ op += length; // correction
+ }
// End
return (int) (((char*)op)-dest);
@@ -209,15 +214,15 @@ int LZ4_compressCtx(void** ctx, //****************************
// Decompression CODE
//****************************
-int LZ4_decode ( char* source,
+int LZ4_uncompress(char* source,
char* dest,
- int isize)
+ int osize)
{
// Local Variables
- BYTE *ip = (BYTE*) source,
- *iend = (BYTE*) source + isize;
+ BYTE *ip = (BYTE*) source;
BYTE *op = (BYTE*) dest,
+ *oend=(BYTE*) dest + osize,
*ref, *cpy,
runcode;
@@ -226,7 +231,7 @@ int LZ4_decode ( char* source, // Main Loop
- while (ip < iend)
+ while (1)
{
// get runlength
runcode = *ip++;
@@ -234,19 +239,21 @@ int LZ4_decode ( char* source, // copy literals
ref = op+length;
-#ifdef SAFEWRITEBUFFER
- if (ref>iend-4) { while(op<iend-3) { *(U32*)op=*(U32*)ip; op+=4; ip+=4; } while(op<ref) *op++=*ip++; }
- else
-#endif
+ if (ref>oend-4)
+ {
+ if (ref > oend) goto _output_error;
+ while(op<oend-3) { *(U32*)op=*(U32*)ip; op+=4; ip+=4; }
+ while(op<ref) *op++=*ip++;
+ break; // Necessarily EOF
+ }
while (op<ref) { *(U32*)op = *(U32*)ip; op+=4; ip+=4; }
ip-=(op-ref); op=ref; // correction
- if (ip>=iend) break; // Check EOF
// get offset
ref -= *(U16*)ip; ip+=2;
// get matchlength
- if ((length=(runcode&ML_MASK)) == ML_MASK) { for (;(len=*ip++)==255;length+=255){} length += len; }
+ if ((length=(runcode&ML_MASK)) == ML_MASK) { for (;(len=*ip++)==255;length+=255){} length += len; }
length += MINMATCH;
// copy repeated sequence
@@ -259,17 +266,157 @@ int LZ4_decode ( char* source, *op++ = *ref++;
ref -= dec[op-ref];
}
-#ifdef SAFEWRITEBUFFER
- if (cpy>iend-4) { while(op<iend-3) { *(U32*)op=*(U32*)ref; op+=4; ref+=4; } while(op<cpy) *op++=*ref++; }
- else
-#endif
+ if (cpy>oend-4)
+ {
+ if (cpy > oend) goto _output_error;
+ while(op<cpy-3) { *(U32*)op=*(U32*)ref; op+=4; ref+=4; }
+ while(op<cpy) *op++=*ref++;
+ if (op>=oend) break; // Check EOF
+ continue;
+ }
+ while(op<cpy) { *(U32*)op=*(U32*)ref; op+=4; ref+=4; }
+ op=cpy; // correction
+ }
+
+ // end of decoding
+ return (int) (((char*)ip)-source);
+
+ // write overflow error detected
+_output_error:
+ return (int) (-(((char*)ip)-source));
+}
+
+
+int LZ4_uncompress_unknownOutputSize(
+ char* source,
+ char* dest,
+ int isize,
+ int maxOutputSize)
+{
+ // Local Variables
+ BYTE *ip = (BYTE*) source,
+ *iend = ip + isize;
+
+ BYTE *op = (BYTE*) dest,
+ *oend = op + maxOutputSize,
+ *ref, *cpy,
+ runcode;
+
+ U32 dec[4]={0, 3, 2, 3};
+ int len, length;
+
+
+ // Main Loop
+ while (ip<iend)
+ {
+ // get runlength
+ runcode = *ip++;
+ if ((length=(runcode>>ML_BITS)) == RUN_MASK) { for (;(len=*ip++)==255;length+=255){} length += len; }
+
+ // copy literals
+ ref = op+length;
+ if (ref>oend-4)
+ {
+ if (ref > oend) goto _output_error;
+ while(op<oend-3) { *(U32*)op=*(U32*)ip; op+=4; ip+=4; }
+ while(op<ref) *op++=*ip++;
+ break; // Necessarily EOF
+ }
+ while (op<ref) { *(U32*)op = *(U32*)ip; op+=4; ip+=4; }
+ ip-=(op-ref); op=ref; // correction
+ if (ip>=iend) break; // check EOF
+
+ // get offset
+ ref -= *(U16*)ip; ip+=2;
+
+ // get matchlength
+ if ((length=(runcode&ML_MASK)) == ML_MASK) { for (;(len=*ip++)==255;length+=255){} length += len; }
+ length += MINMATCH;
+
+ // copy repeated sequence
+ cpy = op + length;
+ if (op-ref<4)
+ {
+ *op++ = *ref++;
+ *op++ = *ref++;
+ *op++ = *ref++;
+ *op++ = *ref++;
+ ref -= dec[op-ref];
+ }
+ if (cpy>oend-4)
+ {
+ if (cpy > oend) goto _output_error;
+ while(op<cpy-3) { *(U32*)op=*(U32*)ref; op+=4; ref+=4; }
+ while(op<cpy) *op++=*ref++;
+ if (op>=oend) break; // Check EOF
+ continue;
+ }
while(op<cpy) { *(U32*)op=*(U32*)ref; op+=4; ref+=4; }
op=cpy; // correction
}
// end of decoding
return (int) (((char*)op)-dest);
+
+ // write overflow error detected
+_output_error:
+ return (int) (-(((char*)ip)-source));
}
+//****************************
+// Deprecated functions
+//****************************
+int LZ4_decode ( char* source,
+ char* dest,
+ int isize)
+{
+ // Local Variables
+ BYTE *ip = (BYTE*)source,
+ *iend = ip + isize;
+
+ BYTE *op = (BYTE*)dest,
+ *ref, *cpy,
+ runcode;
+
+ U32 dec[4]={0, 3, 2, 3};
+ int len, length;
+
+
+ // Main Loop
+ while (ip < iend)
+ {
+ // get runlength
+ runcode = *ip++;
+ if ((length=(runcode>>ML_BITS)) == RUN_MASK) { for (;(len=*ip++)==255;length+=255){} length += len; }
+
+ // copy literals
+ ref=op+length;
+ while (op<ref) { *(U32*)op = *(U32*)ip; op+=4; ip+=4; }
+ ip-=(op-ref); op=ref; // correction
+ if (ip>=iend) break; // Check EOF
+
+ // get offset
+ ref -= *(U16*)ip; ip+=2;
+
+ // get matchlength
+ if ((length=(runcode&ML_MASK)) == ML_MASK) { for (;(len=*ip++)==255;length+=255){} length += len; }
+ length += MINMATCH;
+
+ // copy repeated sequence
+ cpy = op + length;
+ if (op-ref<4)
+ {
+ *op++ = *ref++;
+ *op++ = *ref++;
+ *op++ = *ref++;
+ *op++ = *ref++;
+ ref -= dec[op-ref];
+ }
+ while(op<cpy) { *(U32*)op=*(U32*)ref; op+=4; ref+=4; }
+ op=cpy; // correction
+ }
+ // end of decoding
+ return (int) (((char*)op)-dest);
+}
|