2025-01-29 10:55:49 +01:00

705 lines
14 KiB
C

/*
LZ4X - An optimized LZ4 compressor
Written and placed in the public domain by Ilya Muravyov
*/
#ifndef _CRT_SECURE_NO_WARNINGS
#define _CRT_SECURE_NO_WARNINGS
#endif
#define _CRT_DISABLE_PERFCRIT_LOCKS
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <time.h>
#define NO_UTIME
#ifndef NO_UTIME
# include <sys/types.h>
# include <sys/stat.h>
# ifdef _MSC_VER
# include <sys/utime.h>
# else
# include <utime.h>
# endif
#endif
#ifndef _MSC_VER
# define _ftelli64 ftello64
#endif
typedef unsigned char U8;
typedef unsigned short U16;
typedef unsigned int U32;
//FILE* g_in;
//FILE* g_out;
#define LZ4_MAGIC 0x184C2102
#define BLOCK_SIZE (8<<20) // 8 MB
#define PADDING_LITERALS 5
#define WINDOW_BITS 16
#define WINDOW_SIZE (1<<WINDOW_BITS)
#define WINDOW_MASK (WINDOW_SIZE-1)
#define MIN_MATCH 4
#define EXCESS (16+(BLOCK_SIZE/255))
static U8 g_buf[BLOCK_SIZE+BLOCK_SIZE+EXCESS];
#define MIN(a, b) (((a)<(b))?(a):(b))
#define MAX(a, b) (((a)>(b))?(a):(b))
#define LOAD_16(p) (*(const U16*)(&g_buf[p]))
#define LOAD_32(p) (*(const U32*)(&g_buf[p]))
#define STORE_16(p, x) (*(U16*)(&g_buf[p])=(x))
#define COPY_32(d, s) (*(U32*)(&g_buf[d])=LOAD_32(s))
#define HASH_BITS 18
#define HASH_SIZE (1<<HASH_BITS)
#define NIL (-1)
#define HASH_32(p) ((LOAD_32(p)*0x9E3779B9)>>(32-HASH_BITS))
static inline void wild_copy(int d, int s, int n)
{
COPY_32(d, s);
COPY_32(d+4, s+4);
for (int i=8; i<n; i+=8)
{
COPY_32(d+i, s+i);
COPY_32(d+4+i, s+4+i);
}
}
#if 0
void compress(const int max_chain)
{
static int head[HASH_SIZE];
static int tail[WINDOW_SIZE];
int n;
while ((n=fread(g_buf, 1, BLOCK_SIZE, g_in))>0)
{
for (int i=0; i<HASH_SIZE; ++i)
head[i]=NIL;
int op=BLOCK_SIZE;
int pp=0;
int p=0;
while (p<n)
{
int best_len=0;
int dist=0;
const int max_match=(n-PADDING_LITERALS)-p;
if (max_match>=MAX(12-PADDING_LITERALS, MIN_MATCH))
{
const int limit=MAX(p-WINDOW_SIZE, NIL);
int chain_len=max_chain;
int s=head[HASH_32(p)];
while (s>limit)
{
if (g_buf[s+best_len]==g_buf[p+best_len] && LOAD_32(s)==LOAD_32(p))
{
int len=MIN_MATCH;
while (len<max_match && g_buf[s+len]==g_buf[p+len])
++len;
if (len>best_len)
{
best_len=len;
dist=p-s;
if (len==max_match)
break;
}
}
if (--chain_len==0)
break;
s=tail[s&WINDOW_MASK];
}
}
if (best_len>=MIN_MATCH)
{
int len=best_len-MIN_MATCH;
const int nib=MIN(len, 15);
if (pp!=p)
{
const int run=p-pp;
if (run>=15)
{
g_buf[op++]=(15<<4)+nib;
int j=run-15;
for (; j>=255; j-=255)
g_buf[op++]=255;
g_buf[op++]=j;
}
else
g_buf[op++]=(run<<4)+nib;
wild_copy(op, pp, run);
op+=run;
}
else
g_buf[op++]=nib;
STORE_16(op, dist);
op+=2;
if (len>=15)
{
len-=15;
for (; len>=255; len-=255)
g_buf[op++]=255;
g_buf[op++]=len;
}
pp=p+best_len;
while (p<pp)
{
const U32 h=HASH_32(p);
tail[p&WINDOW_MASK]=head[h];
head[h]=p++;
}
}
else
{
const U32 h=HASH_32(p);
tail[p&WINDOW_MASK]=head[h];
head[h]=p++;
}
}
if (pp!=p)
{
const int run=p-pp;
if (run>=15)
{
g_buf[op++]=15<<4;
int j=run-15;
for (; j>=255; j-=255)
g_buf[op++]=255;
g_buf[op++]=j;
}
else
g_buf[op++]=run<<4;
wild_copy(op, pp, run);
op+=run;
}
const int comp_len=op-BLOCK_SIZE;
fwrite(&comp_len, 1, sizeof(comp_len), g_out);
fwrite(&g_buf[BLOCK_SIZE], 1, comp_len, g_out);
fprintf(stderr, "%lld -> %lld\r", _ftelli64(g_in), _ftelli64(g_out));
}
}
void compress_optimal()
{
static int head[HASH_SIZE];
static int nodes[WINDOW_SIZE][2];
static struct
{
int cum;
int len;
int dist;
} path[BLOCK_SIZE+1];
int n;
while ((n=fread(g_buf, 1, BLOCK_SIZE, g_in))>0)
{
// Pass 1: Find all matches
for (int i=0; i<HASH_SIZE; ++i)
head[i]=NIL;
for (int p=0; p<n; ++p)
{
int best_len=0;
int dist=0;
const int max_match=(n-PADDING_LITERALS)-p;
if (max_match>=MAX(12-PADDING_LITERALS, MIN_MATCH))
{
const int limit=MAX(p-WINDOW_SIZE, NIL);
int* left=&nodes[p&WINDOW_MASK][1];
int* right=&nodes[p&WINDOW_MASK][0];
int left_len=0;
int right_len=0;
const U32 h=HASH_32(p);
int s=head[h];
head[h]=p;
while (s>limit)
{
int len=MIN(left_len, right_len);
if (g_buf[s+len]==g_buf[p+len])
{
while (++len<max_match && g_buf[s+len]==g_buf[p+len]);
if (len>best_len)
{
best_len=len;
dist=p-s;
if (len==max_match || len>=(1<<16))
break;
}
}
if (g_buf[s+len]<g_buf[p+len])
{
*right=s;
right=&nodes[s&WINDOW_MASK][1];
s=*right;
right_len=len;
}
else
{
*left=s;
left=&nodes[s&WINDOW_MASK][0];
s=*left;
left_len=len;
}
}
*left=NIL;
*right=NIL;
}
path[p].len=best_len;
path[p].dist=dist;
}
// Pass 2: Build the shortest path
path[n].cum=0;
int count=15;
for (int p=n-1; p>0; --p)
{
int c0=path[p+1].cum+1;
if (--count==0)
{
count=255;
++c0;
}
int len=path[p].len;
if (len>=MIN_MATCH)
{
int c1=1<<30;
const int j=MAX(len-255, MIN_MATCH);
for (int i=len; i>=j; --i)
{
int tmp=path[p+i].cum+3;
if (i>=(15+MIN_MATCH))
tmp+=1+((i-(15+MIN_MATCH))/255);
if (tmp<c1)
{
c1=tmp;
len=i;
}
}
if (c1<=c0)
{
path[p].cum=c1;
path[p].len=len;
count=15;
}
else
{
path[p].cum=c0;
path[p].len=0;
}
}
else
path[p].cum=c0;
}
// Pass 3: Output the codes
int op=BLOCK_SIZE;
int pp=0;
int p=0;
while (p<n)
{
if (path[p].len>=MIN_MATCH)
{
int len=path[p].len-MIN_MATCH;
const int nib=MIN(len, 15);
if (pp!=p)
{
const int run=p-pp;
if (run>=15)
{
g_buf[op++]=(15<<4)+nib;
int j=run-15;
for (; j>=255; j-=255)
g_buf[op++]=255;
g_buf[op++]=j;
}
else
g_buf[op++]=(run<<4)+nib;
wild_copy(op, pp, run);
op+=run;
}
else
g_buf[op++]=nib;
STORE_16(op, path[p].dist);
op+=2;
if (len>=15)
{
len-=15;
for (; len>=255; len-=255)
g_buf[op++]=255;
g_buf[op++]=len;
}
p+=path[p].len;
pp=p;
}
else
++p;
}
if (pp!=p)
{
const int run=p-pp;
if (run>=15)
{
g_buf[op++]=15<<4;
int j=run-15;
for (; j>=255; j-=255)
g_buf[op++]=255;
g_buf[op++]=j;
}
else
g_buf[op++]=run<<4;
wild_copy(op, pp, run);
op+=run;
}
const int comp_len=op-BLOCK_SIZE;
fwrite(&comp_len, 1, sizeof(comp_len), g_out);
fwrite(&g_buf[BLOCK_SIZE], 1, comp_len, g_out);
fprintf(stderr, "%lld -> %lld\r", _ftelli64(g_in), _ftelli64(g_out));
}
}
#endif
static size_t kread(void* dst, size_t size, const char* src, size_t* offset, size_t compressedSize) {
size_t realSize = MIN(size, compressedSize - *offset);
memcpy(dst, &src[*offset], realSize);
*offset += realSize;
return realSize;
}
static size_t kwrite(void* src, size_t size, char* dst, size_t* offset, int maxOutputSize) {
size_t realSize = MIN(size, maxOutputSize - *offset);
memcpy(&dst[*offset], src, size);
*offset += realSize;
return realSize;
}
//int decompress()
#ifdef KORE_LZ4X
int LZ4_decompress_safe(const char *source, char *buf, int compressedSize, int maxOutputSize)
{
size_t read_offset = 0;
size_t write_offset = 0;
int comp_len;
while (kread(&comp_len, sizeof(comp_len), source, &read_offset, compressedSize)>0)
{
if (comp_len<2 || comp_len>(BLOCK_SIZE+EXCESS)
|| kread(&g_buf[BLOCK_SIZE], comp_len, source, &read_offset, compressedSize)!=comp_len)
return -1;
int p=0;
int ip=BLOCK_SIZE;
const int ip_end=ip+comp_len;
for (;;)
{
const int token=g_buf[ip++];
if (token>=16)
{
int run=token>>4;
if (run==15)
{
for (;;)
{
const int c=g_buf[ip++];
run+=c;
if (c!=255)
break;
}
}
if ((p+run)>BLOCK_SIZE)
return -1;
wild_copy(p, ip, run);
p+=run;
ip+=run;
if (ip>=ip_end)
break;
}
int s=p-LOAD_16(ip);
ip+=2;
if (s<0)
return -1;
int len=(token&15)+MIN_MATCH;
if (len==(15+MIN_MATCH))
{
for (;;)
{
const int c=g_buf[ip++];
len+=c;
if (c!=255)
break;
}
}
if ((p+len)>BLOCK_SIZE)
return -1;
if ((p-s)>=4)
{
wild_copy(p, s, len);
p+=len;
}
else
{
while (len--!=0)
g_buf[p++]=g_buf[s++];
}
}
if (kwrite(g_buf, p, buf, &write_offset, maxOutputSize)!=p)
{
kinc_error_message("Fwrite() failed");
return -1;
}
}
return 0;
}
#endif
#if 0
int main(int argc, char** argv)
{
const clock_t start=clock();
int level=4;
bool do_decomp=false;
bool overwrite=false;
while (argc>1 && *argv[1]=='-')
{
for (int i=1; argv[1][i]!='\0'; ++i)
{
switch (argv[1][i])
{
case '1':
case '2':
case '3':
case '4':
case '5':
case '6':
case '7':
case '8':
case '9':
level=argv[1][i]-'0';
break;
case 'd':
do_decomp=true;
break;
case 'f':
overwrite=true;
break;
default:
fprintf(stderr, "Unknown option: -%c\n", argv[1][i]);
exit(1);
}
}
--argc;
++argv;
}
if (argc<2)
{
fprintf(stderr,
"LZ4X - An optimized LZ4 compressor, v1.60\n"
"Written and placed in the public domain by Ilya Muravyov\n"
"\n"
"Usage: LZ4X [options] infile [outfile]\n"
"\n"
"Options:\n"
" -1 Compress faster\n"
" -9 Compress better\n"
" -d Decompress\n"
" -f Force overwrite of output file\n");
exit(1);
}
g_in=fopen(argv[1], "rb");
if (!g_in)
{
perror(argv[1]);
exit(1);
}
char out_name[FILENAME_MAX];
if (argc<3)
{
strcpy(out_name, argv[1]);
if (do_decomp)
{
const int p=strlen(out_name)-4;
if (p>0 && strcmp(&out_name[p], ".lz4")==0)
out_name[p]='\0';
else
strcat(out_name, ".out");
}
else
strcat(out_name, ".lz4");
}
else
strcpy(out_name, argv[2]);
if (!overwrite)
{
FILE* f=fopen(out_name, "rb");
if (f)
{
fclose(f);
fprintf(stderr, "%s already exists. Overwrite (y/n)? ", out_name);
fflush(stderr);
if (getchar()!='y')
{
fprintf(stderr, "Not overwritten\n");
exit(1);
}
}
}
if (do_decomp)
{
int magic;
fread(&magic, 1, sizeof(magic), g_in);
if (magic!=LZ4_MAGIC)
{
fprintf(stderr, "%s: Not in Legacy format\n", argv[1]);
exit(1);
}
g_out=fopen(out_name, "wb");
if (!g_out)
{
perror(out_name);
exit(1);
}
fprintf(stderr, "Decompressing %s:\n", argv[1]);
if (decompress()!=0)
{
fprintf(stderr, "%s: Corrupt input\n", argv[1]);
exit(1);
}
}
else
{
g_out=fopen(out_name, "wb");
if (!g_out)
{
perror(out_name);
exit(1);
}
const int magic=LZ4_MAGIC;
fwrite(&magic, 1, sizeof(magic), g_out);
fprintf(stderr, "Compressing %s:\n", argv[1]);
if (level==9)
compress_optimal();
else
compress((level<8)?1<<level:WINDOW_SIZE);
}
fprintf(stderr, "%lld -> %lld in %1.3f sec\n", _ftelli64(g_in),
_ftelli64(g_out), double(clock()-start)/CLOCKS_PER_SEC);
fclose(g_in);
fclose(g_out);
#ifndef NO_UTIME
struct _stati64 sb;
if (_stati64(argv[1], &sb)!=0)
{
perror("Stat() failed");
exit(1);
}
struct utimbuf ub;
ub.actime=sb.st_atime;
ub.modtime=sb.st_mtime;
if (utime(out_name, &ub)!=0)
{
perror("Utime() failed");
exit(1);
}
#endif
return 0;
}
#endif