mirror of
https://github.com/ckolivas/lrzip.git
synced 2025-12-06 07:12:00 +01:00
Display the actual amount of ram detected, and then decrease the value for calculating what the calculated window will be. Move the variables to where they're only used locally.
1042 lines
33 KiB
C
1042 lines
33 KiB
C
/*
|
|
Copyright (C) 2006-2011 Con Kolivas
|
|
Copyright (C) 2011 Peter Hyman
|
|
Copyright (C) 1998-2003 Andrew Tridgell
|
|
|
|
This program is free software; you can redistribute it and/or modify
|
|
it under the terms of the GNU General Public License as published by
|
|
the Free Software Foundation; either version 2 of the License, or
|
|
(at your option) any later version.
|
|
|
|
This program is distributed in the hope that it will be useful,
|
|
but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
GNU General Public License for more details.
|
|
|
|
You should have received a copy of the GNU General Public License
|
|
along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
*/
|
|
/* lrzip compression - main program */
|
|
#include "rzip.h"
|
|
|
|
struct rzip_control control;
|
|
|
|
static void usage(void)
|
|
{
|
|
print_output("lrzip version %d.%d%d\n", LRZIP_MAJOR_VERSION, LRZIP_MINOR_VERSION, LRZIP_MINOR_SUBVERSION);
|
|
print_output("Copyright (C) Con Kolivas 2006-2011\n");
|
|
print_output("Based on rzip ");
|
|
print_output("Copyright (C) Andrew Tridgell 1998-2003\n\n");
|
|
print_output("Usage: lrzip [options] <file...>\n");
|
|
print_output("General options:\n");
|
|
print_output(" -c check integrity of file written on decompression\n");
|
|
print_output(" -d decompress\n");
|
|
print_output(" -H display md5 hash integrity information\n");
|
|
print_output(" -i show compressed file information\n");
|
|
print_output(" -q don't show compression progress\n");
|
|
print_output(" -t test compressed file integrity\n");
|
|
print_output(" -v[v] Increase verbosity\n");
|
|
print_output(" -V show version\n");
|
|
print_output("Options affecting output:\n");
|
|
print_output(" -D delete existing files\n");
|
|
print_output(" -f force overwrite of any existing files\n");
|
|
print_output(" -k keep broken or damaged output files\n");
|
|
print_output(" -o filename specify the output file name and/or path\n");
|
|
print_output(" -O directory specify the output directory when -o is not used\n");
|
|
print_output(" -S suffix specify compressed suffix (default '.lrz')\n");
|
|
print_output("Options affecting compression:\n");
|
|
print_output(" -b bzip2 compression\n");
|
|
print_output(" -g gzip compression using zlib\n");
|
|
print_output(" -l lzo compression (ultra fast)\n");
|
|
print_output(" -n no backend compression - prepare for other compressor\n");
|
|
print_output(" -z zpaq compression (best, extreme compression, extremely slow)\n");
|
|
print_output("Low level options:\n");
|
|
print_output(" -L level set lzma/bzip2/gzip compression level (1-9, default 7)\n");
|
|
print_output(" -N value Set nice value to value (default 19)\n");
|
|
print_output(" -p value Set processor count to override number of threads\n");
|
|
print_output(" -T Disable LZO compressibility testing\n");
|
|
print_output(" -U Use unlimited window size beyond ramsize (potentially much slower)\n");
|
|
print_output(" -w size maximum compression window in hundreds of MB\n");
|
|
print_output(" default chosen by heuristic dependent on ram and chosen compression\n");
|
|
print_output("\nLRZIP=NOCONFIG environment variable setting can be used to bypass lrzip.conf.\n");
|
|
print_output("TMP environment variable will be used for storage of temporary files when needed.\n");
|
|
print_output("TMPDIR may also be stored in lrzip.conf file.\n");
|
|
print_output("\nIf no filenames or \"-\" is specified, stdin/out will be used.\n");
|
|
|
|
}
|
|
|
|
static void write_magic(int fd_in, int fd_out)
|
|
{
|
|
struct stat st;
|
|
char magic[24];
|
|
int i;
|
|
|
|
memset(magic, 0, sizeof(magic));
|
|
strcpy(magic, "LRZI");
|
|
magic[4] = LRZIP_MAJOR_VERSION;
|
|
magic[5] = LRZIP_MINOR_VERSION;
|
|
|
|
if (unlikely(fstat(fd_in, &st)))
|
|
fatal("bad magic file descriptor!?\n");
|
|
|
|
memcpy(&magic[6], &control.st_size, 8);
|
|
|
|
/* save LZMA compression flags */
|
|
if (LZMA_COMPRESS) {
|
|
for (i = 0; i < 5; i++)
|
|
magic[i + 16] = (char)control.lzma_properties[i];
|
|
}
|
|
|
|
/* This is a flag that the archive contains an md5 sum at the end
|
|
* which can be used as an integrity check instead of crc check.
|
|
* crc is still stored for compatibility with 0.5 versions.
|
|
*/
|
|
magic[21] = 1;
|
|
|
|
if (unlikely(lseek(fd_out, 0, SEEK_SET)))
|
|
fatal("Failed to seek to BOF to write Magic Header\n");
|
|
|
|
if (unlikely(write(fd_out, magic, sizeof(magic)) != sizeof(magic)))
|
|
fatal("Failed to write magic header\n");
|
|
}
|
|
|
|
static void read_magic(int fd_in, i64 *expected_size)
|
|
{
|
|
char magic[24];
|
|
uint32_t v;
|
|
int md5, i;
|
|
|
|
if (unlikely(read(fd_in, magic, sizeof(magic)) != sizeof(magic)))
|
|
fatal("Failed to read magic header\n");
|
|
|
|
*expected_size = 0;
|
|
|
|
if (unlikely(strncmp(magic, "LRZI", 4)))
|
|
failure("Not an lrzip file\n");
|
|
|
|
memcpy(&control.major_version, &magic[4], 1);
|
|
memcpy(&control.minor_version, &magic[5], 1);
|
|
|
|
/* Support the convoluted way we described size in versions < 0.40 */
|
|
if (control.major_version == 0 && control.minor_version < 4) {
|
|
memcpy(&v, &magic[6], 4);
|
|
*expected_size = ntohl(v);
|
|
memcpy(&v, &magic[10], 4);
|
|
*expected_size |= ((i64)ntohl(v)) << 32;
|
|
} else
|
|
memcpy(expected_size, &magic[6], 8);
|
|
|
|
/* restore LZMA compression flags only if stored */
|
|
if ((int) magic[16]) {
|
|
for (i = 0; i < 5; i++)
|
|
control.lzma_properties[i] = magic[i + 16];
|
|
}
|
|
|
|
/* Whether this archive contains md5 data at the end or not */
|
|
md5 = magic[21];
|
|
if (md5 == 1)
|
|
control.flags |= FLAG_MD5;
|
|
|
|
print_verbose("Detected lrzip version %d.%d file.\n", control.major_version, control.minor_version);
|
|
if (control.major_version > LRZIP_MAJOR_VERSION ||
|
|
(control.major_version == LRZIP_MAJOR_VERSION && control.minor_version > LRZIP_MINOR_VERSION))
|
|
print_output("Attempting to work with file produced by newer lrzip version %d.%d file.\n", control.major_version, control.minor_version);
|
|
}
|
|
|
|
/* preserve ownership and permissions where possible */
|
|
static void preserve_perms(int fd_in, int fd_out)
|
|
{
|
|
struct stat st;
|
|
|
|
if (unlikely(fstat(fd_in, &st)))
|
|
fatal("Failed to fstat input file\n");
|
|
if (unlikely(fchmod(fd_out, (st.st_mode & 0777))))
|
|
print_err("Warning, unable to set permissions on %s\n", control.outfile);
|
|
|
|
/* chown fail is not fatal */
|
|
if (unlikely(fchown(fd_out, st.st_uid, st.st_gid)))
|
|
print_err("Warning, unable to set owner on %s\n", control.outfile);
|
|
}
|
|
|
|
/* Open a temporary outputfile to emulate stdout */
|
|
static int open_tmpoutfile(void)
|
|
{
|
|
int fd_out;
|
|
|
|
if (STDOUT)
|
|
print_verbose("Outputting to stdout.\n");
|
|
if (control.tmpdir) {
|
|
control.outfile = realloc(NULL, strlen(control.tmpdir)+16);
|
|
if (unlikely(!control.outfile))
|
|
fatal("Failed to allocate outfile name\n");
|
|
strcpy(control.outfile, control.tmpdir);
|
|
strcat(control.outfile, "lrzipout.XXXXXX");
|
|
} else {
|
|
control.outfile = realloc(NULL, 16);
|
|
if (unlikely(!control.outfile))
|
|
fatal("Failed to allocate outfile name\n");
|
|
strcpy(control.outfile, "lrzipout.XXXXXX");
|
|
}
|
|
|
|
fd_out = mkstemp(control.outfile);
|
|
if (unlikely(fd_out == -1))
|
|
fatal("Failed to create out tmpfile: %s\n", strerror(errno));
|
|
return fd_out;
|
|
}
|
|
|
|
/* Dump temporary outputfile to perform stdout */
|
|
static void dump_tmpoutfile(int fd_out)
|
|
{
|
|
FILE *tmpoutfp;
|
|
int tmpchar;
|
|
|
|
print_progress("Dumping to stdout.\n");
|
|
/* flush anything not yet in the temporary file */
|
|
fsync(fd_out);
|
|
tmpoutfp = fdopen(fd_out, "r");
|
|
if (unlikely(tmpoutfp == NULL))
|
|
fatal("Failed to fdopen out tmpfile: %s\n", strerror(errno));
|
|
rewind(tmpoutfp);
|
|
|
|
while ((tmpchar = fgetc(tmpoutfp)) != EOF)
|
|
putchar(tmpchar);
|
|
|
|
fflush(control.msgout);
|
|
}
|
|
|
|
/* Open a temporary inputfile to perform stdin decompression */
|
|
static int open_tmpinfile(void)
|
|
{
|
|
int fd_in;
|
|
|
|
if (control.tmpdir) {
|
|
control.infile = malloc(strlen(control.tmpdir)+15);
|
|
if (unlikely(!control.infile))
|
|
fatal("Failed to allocate infile name\n");
|
|
strcpy(control.infile, control.tmpdir);
|
|
strcat(control.infile, "lrzipin.XXXXXX");
|
|
} else {
|
|
control.infile = malloc(15);
|
|
if (unlikely(!control.infile))
|
|
fatal("Failed to allocate infile name\n");
|
|
strcpy(control.infile, "lrzipin.XXXXXX");
|
|
}
|
|
|
|
fd_in = mkstemp(control.infile);
|
|
if (unlikely(fd_in == -1))
|
|
fatal("Failed to create in tmpfile: %s\n", strerror(errno));
|
|
return fd_in;
|
|
}
|
|
|
|
/* Read data from stdin into temporary inputfile */
|
|
static void read_tmpinfile(int fd_in)
|
|
{
|
|
FILE *tmpinfp;
|
|
int tmpchar;
|
|
|
|
if (control.flags & FLAG_SHOW_PROGRESS)
|
|
fprintf(control.msgout, "Copying from stdin.\n");
|
|
tmpinfp = fdopen(fd_in, "w+");
|
|
if (unlikely(tmpinfp == NULL))
|
|
fatal("Failed to fdopen in tmpfile: %s\n", strerror(errno));
|
|
|
|
while ((tmpchar = getchar()) != EOF)
|
|
fputc(tmpchar, tmpinfp);
|
|
|
|
fflush(tmpinfp);
|
|
rewind(tmpinfp);
|
|
}
|
|
|
|
/*
|
|
decompress one file from the command line
|
|
*/
|
|
static void decompress_file(void)
|
|
{
|
|
char *tmp, *tmpoutfile, *infilecopy = NULL;
|
|
int fd_in, fd_out = -1, fd_hist = -1;
|
|
i64 expected_size;
|
|
|
|
if (!STDIN) {
|
|
if ((tmp = strrchr(control.infile, '.')) && strcmp(tmp,control.suffix)) {
|
|
/* make sure infile has an extension. If not, add it
|
|
* because manipulations may be made to input filename, set local ptr
|
|
*/
|
|
infilecopy = malloc(strlen(control.infile) + strlen(control.suffix) + 1);
|
|
if (unlikely(infilecopy == NULL))
|
|
fatal("Failed to allocate memory for infile suffix\n");
|
|
else {
|
|
strcpy(infilecopy, control.infile);
|
|
strcat(infilecopy, control.suffix);
|
|
}
|
|
} else
|
|
infilecopy = strdup(control.infile);
|
|
/* regardless, infilecopy has the input filename */
|
|
}
|
|
|
|
if (!STDOUT && !TEST_ONLY) {
|
|
/* if output name already set, use it */
|
|
if (control.outname) {
|
|
control.outfile = strdup(control.outname);
|
|
} else {
|
|
/* default output name from infilecopy
|
|
* test if outdir specified. If so, strip path from filename of
|
|
* infilecopy, then remove suffix.
|
|
*/
|
|
if (control.outdir && (tmp = strrchr(infilecopy, '/')))
|
|
tmpoutfile = strdup(tmp + 1);
|
|
else
|
|
tmpoutfile = strdup(infilecopy);
|
|
|
|
/* remove suffix to make outfile name */
|
|
if ((tmp = strrchr(tmpoutfile, '.')) && !strcmp(tmp, control.suffix))
|
|
*tmp='\0';
|
|
|
|
control.outfile = malloc((control.outdir == NULL? 0: strlen(control.outdir)) + strlen(tmpoutfile) + 1);
|
|
if (unlikely(!control.outfile))
|
|
fatal("Failed to allocate outfile name\n");
|
|
|
|
if (control.outdir) { /* prepend control.outdir */
|
|
strcpy(control.outfile, control.outdir);
|
|
strcat(control.outfile, tmpoutfile);
|
|
} else
|
|
strcpy(control.outfile, tmpoutfile);
|
|
free(tmpoutfile);
|
|
}
|
|
|
|
if (!STDOUT)
|
|
print_progress("Output filename is: %s...Decompressing...\n", control.outfile);
|
|
}
|
|
|
|
if (STDIN) {
|
|
fd_in = open_tmpinfile();
|
|
read_tmpinfile(fd_in);
|
|
} else {
|
|
fd_in = open(infilecopy, O_RDONLY);
|
|
if (unlikely(fd_in == -1)) {
|
|
fatal("Failed to open %s: %s\n",
|
|
infilecopy,
|
|
strerror(errno));
|
|
}
|
|
}
|
|
|
|
if (!(TEST_ONLY | STDOUT)) {
|
|
if (FORCE_REPLACE)
|
|
fd_out = open(control.outfile, O_WRONLY | O_CREAT | O_TRUNC, 0666);
|
|
else
|
|
fd_out = open(control.outfile, O_WRONLY | O_CREAT | O_EXCL, 0666);
|
|
if (unlikely(fd_out == -1)) {
|
|
/* We must ensure we don't delete a file that already
|
|
* exists just because we tried to create a new one */
|
|
control.flags |= FLAG_KEEP_BROKEN;
|
|
fatal("Failed to create %s: %s\n", control.outfile, strerror(errno));
|
|
}
|
|
|
|
preserve_perms(fd_in, fd_out);
|
|
} else
|
|
fd_out = open_tmpoutfile();
|
|
control.fd_out = fd_out;
|
|
|
|
fd_hist = open(control.outfile, O_RDONLY);
|
|
if (unlikely(fd_hist == -1))
|
|
fatal("Failed to open history file %s\n", control.outfile);
|
|
|
|
read_magic(fd_in, &expected_size);
|
|
if (NO_MD5)
|
|
print_verbose("Not performing MD5 hash check\n");
|
|
if (HAS_MD5)
|
|
print_verbose("MD5 ");
|
|
else
|
|
print_verbose("CRC32 ");
|
|
print_verbose("being used for integrity testing.\n");
|
|
|
|
print_progress("Decompressing...");
|
|
|
|
runzip_fd(fd_in, fd_out, fd_hist, expected_size);
|
|
|
|
if (STDOUT)
|
|
dump_tmpoutfile(fd_out);
|
|
|
|
/* if we get here, no fatal errors during decompression */
|
|
print_progress("\r");
|
|
if (!(STDOUT | TEST_ONLY))
|
|
print_output("Output filename is: %s: ", control.outfile);
|
|
print_progress("[OK] - %lld bytes \n", expected_size);
|
|
|
|
if (unlikely(close(fd_hist) || close(fd_out)))
|
|
fatal("Failed to close files\n");
|
|
|
|
if (TEST_ONLY | STDOUT) {
|
|
/* Delete temporary files generated for testing or faking stdout */
|
|
if (unlikely(unlink(control.outfile)))
|
|
fatal("Failed to unlink tmpfile: %s\n", strerror(errno));
|
|
}
|
|
|
|
close(fd_in);
|
|
|
|
if (!(KEEP_FILES | TEST_ONLY) || STDIN) {
|
|
if (unlikely(unlink(control.infile)))
|
|
fatal("Failed to unlink %s: %s\n", infilecopy, strerror(errno));
|
|
}
|
|
|
|
free(control.outfile);
|
|
free(infilecopy);
|
|
}
|
|
|
|
static void get_header_info(int fd_in, uchar *ctype, i64 *c_len, i64 *u_len, i64 *last_head)
|
|
{
|
|
if (unlikely(read(fd_in, ctype, 1) != 1))
|
|
fatal("Failed to read in get_header_info\n");
|
|
|
|
if (control.major_version == 0 && control.minor_version < 4) {
|
|
u32 c_len32, u_len32, last_head32;
|
|
|
|
if (unlikely(read(fd_in, &c_len32, 4) != 4))
|
|
fatal("Failed to read in get_header_info");
|
|
if (unlikely(read(fd_in, &u_len32, 4) != 4))
|
|
fatal("Failed to read in get_header_info");
|
|
if (unlikely(read(fd_in, &last_head32, 4) != 4))
|
|
fatal("Failed to read in get_header_info");
|
|
*c_len = c_len32;
|
|
*u_len = u_len32;
|
|
*last_head = last_head32;
|
|
} else {
|
|
if (unlikely(read(fd_in, c_len, 8) != 8))
|
|
fatal("Failed to read in get_header_info");
|
|
if (unlikely(read(fd_in, u_len, 8) != 8))
|
|
fatal("Failed to read in get_header_info");
|
|
if (unlikely(read(fd_in, last_head, 8) != 8))
|
|
fatal("Failed to read_i64 in get_header_info");
|
|
}
|
|
}
|
|
|
|
static void get_fileinfo(void)
|
|
{
|
|
i64 expected_size, infile_size;
|
|
int seekspot, fd_in;
|
|
long double cratio;
|
|
uchar ctype = 0;
|
|
struct stat st;
|
|
|
|
char *tmp, *infilecopy = NULL;
|
|
|
|
if (!STDIN) {
|
|
if ((tmp = strrchr(control.infile, '.')) && strcmp(tmp,control.suffix)) {
|
|
infilecopy = malloc(strlen(control.infile) + strlen(control.suffix) + 1);
|
|
if (unlikely(infilecopy == NULL))
|
|
fatal("Failed to allocate memory for infile suffix\n");
|
|
else {
|
|
strcpy(infilecopy, control.infile);
|
|
strcat(infilecopy, control.suffix);
|
|
}
|
|
} else
|
|
infilecopy = strdup(control.infile);
|
|
}
|
|
|
|
if (STDIN)
|
|
fd_in = 0;
|
|
else {
|
|
fd_in = open(infilecopy, O_RDONLY);
|
|
if (unlikely(fd_in == -1))
|
|
fatal("Failed to open %s: %s\n", infilecopy, strerror(errno));
|
|
}
|
|
|
|
/* Get file size */
|
|
if (unlikely(fstat(fd_in, &st)))
|
|
fatal("bad magic file descriptor!?\n");
|
|
memcpy(&infile_size, &st.st_size, 8);
|
|
|
|
/* Get decompressed size */
|
|
read_magic(fd_in, &expected_size);
|
|
|
|
/* Version < 0.4 had different file format */
|
|
if (control.major_version == 0 && control.minor_version < 4)
|
|
seekspot = 50;
|
|
else if (control.major_version == 0 && control.minor_version == 4)
|
|
seekspot = 74;
|
|
else
|
|
seekspot = 75;
|
|
if (unlikely(lseek(fd_in, seekspot, SEEK_SET) == -1))
|
|
fatal("Failed to lseek in get_fileinfo: %s\n", strerror(errno));
|
|
|
|
/* Read the compression type of the first block. It's possible that
|
|
not all blocks are compressed so this may not be accurate.
|
|
*/
|
|
if (unlikely(read(fd_in, &ctype, 1) != 1))
|
|
fatal("Failed to read in get_fileinfo\n");
|
|
|
|
cratio = (long double)expected_size / (long double)infile_size;
|
|
|
|
print_output("%s:\nlrzip version: %d.%d file\n", infilecopy, control.major_version, control.minor_version);
|
|
print_output("Compression: ");
|
|
if (ctype == CTYPE_NONE)
|
|
print_output("rzip alone\n");
|
|
else if (ctype == CTYPE_BZIP2)
|
|
print_output("rzip + bzip2\n");
|
|
else if (ctype == CTYPE_LZO)
|
|
print_output("rzip + lzo\n");
|
|
else if (ctype == CTYPE_LZMA)
|
|
print_output("rzip + lzma\n");
|
|
else if (ctype == CTYPE_GZIP)
|
|
print_output("rzip + gzip\n");
|
|
else if (ctype == CTYPE_ZPAQ)
|
|
print_output("rzip + zpaq\n");
|
|
else
|
|
print_output("Dunno wtf\n");
|
|
print_output("Decompressed file size: %llu\n", expected_size);
|
|
print_output("Compressed file size: %llu\n", infile_size);
|
|
print_output("Compression ratio: %.3Lf\n", cratio);
|
|
|
|
if (HAS_MD5) {
|
|
char md5_stored[MD5_DIGEST_SIZE];
|
|
int i;
|
|
|
|
print_output("MD5 used for integrity testing\n");
|
|
if (unlikely(lseek(fd_in, -MD5_DIGEST_SIZE, SEEK_END)) == -1)
|
|
fatal("Failed to seek to md5 data in runzip_fd\n");
|
|
if (unlikely(read(fd_in, md5_stored, MD5_DIGEST_SIZE) != MD5_DIGEST_SIZE))
|
|
fatal("Failed to read md5 data in runzip_fd\n");
|
|
print_output("MD5: ");
|
|
for (i = 0; i < MD5_DIGEST_SIZE; i++)
|
|
print_output("%02x", md5_stored[i] & 0xFF);
|
|
print_output("\n");
|
|
} else
|
|
print_output("CRC32 used for integrity testing\n");
|
|
|
|
if (VERBOSE || MAX_VERBOSE) {
|
|
i64 u_len, c_len, last_head, utotal = 0, ctotal = 0, ofs = 25,
|
|
stream_head[2];
|
|
int header_length = 25, stream = 0, chunk = 0;
|
|
|
|
if (control.major_version == 0 && control.minor_version < 4)
|
|
header_length = 13;
|
|
next_chunk:
|
|
stream = 0;
|
|
stream_head[0] = 0;
|
|
stream_head[1] = stream_head[0] + header_length;
|
|
|
|
print_output("Rzip chunk %d:\n", ++chunk);
|
|
while (stream < NUM_STREAMS) {
|
|
int block = 1;
|
|
|
|
if (unlikely(lseek(fd_in, stream_head[stream] + ofs, SEEK_SET)) == -1)
|
|
fatal("Failed to seek to header data in get_fileinfo\n");
|
|
get_header_info(fd_in, &ctype, &c_len, &u_len, &last_head);
|
|
|
|
print_output("Stream: %d\n", stream);
|
|
print_maxverbose("Offset: %lld\n", ofs);
|
|
print_output("Block\tComp\tPercent\tSize\n");
|
|
do {
|
|
if (unlikely(lseek(fd_in, last_head + ofs, SEEK_SET)) == -1)
|
|
fatal("Failed to seek to header data in get_fileinfo\n");
|
|
get_header_info(fd_in, &ctype, &c_len, &u_len, &last_head);
|
|
print_output("%d\t", block);
|
|
if (ctype == CTYPE_NONE)
|
|
print_output("none");
|
|
else if (ctype == CTYPE_BZIP2)
|
|
print_output("bzip2");
|
|
else if (ctype == CTYPE_LZO)
|
|
print_output("lzo");
|
|
else if (ctype == CTYPE_LZMA)
|
|
print_output("lzma");
|
|
else if (ctype == CTYPE_GZIP)
|
|
print_output("gzip");
|
|
else if (ctype == CTYPE_ZPAQ)
|
|
print_output("zpaq");
|
|
else
|
|
print_output("Dunno wtf");
|
|
utotal += u_len;
|
|
ctotal += c_len;
|
|
print_output("\t%.1f%%\t%lld / %lld", (double)c_len / (double)(u_len / 100), c_len, u_len);
|
|
print_maxverbose("\tHead: %lld", last_head);
|
|
print_output("\n");
|
|
block++;
|
|
} while (last_head);
|
|
++stream;
|
|
}
|
|
ofs = lseek(fd_in, 0, SEEK_CUR) + c_len;
|
|
/* Chunk byte entry */
|
|
if (control.major_version == 0 && control.minor_version > 4)
|
|
ofs++;
|
|
if (ofs < infile_size - MD5_DIGEST_SIZE)
|
|
goto next_chunk;
|
|
print_output("Rzip compression: %.1f%% %lld / %lld\n",
|
|
(double)utotal / (double)(expected_size / 100),
|
|
utotal, expected_size);
|
|
print_output("Back end compression: %.1f%% %lld / %lld\n",
|
|
(double)ctotal / (double)(utotal / 100),
|
|
ctotal, utotal);
|
|
print_output("Overall compression: %.1f%% %lld / %lld\n",
|
|
(double)ctotal / (double)(expected_size / 100),
|
|
ctotal, expected_size);
|
|
}
|
|
|
|
if (STDIN) {
|
|
if (unlikely(unlink(control.infile)))
|
|
fatal("Failed to unlink %s: %s\n", infilecopy, strerror(errno));
|
|
} else
|
|
if (unlikely(close(fd_in)))
|
|
fatal("Failed to close fd_in in get_fileinfo\n");
|
|
|
|
free(control.outfile);
|
|
free(infilecopy);
|
|
}
|
|
|
|
/*
|
|
compress one file from the command line
|
|
*/
|
|
static void compress_file(void)
|
|
{
|
|
const char *tmp, *tmpinfile; /* we're just using this as a proxy for control.infile.
|
|
* Spares a compiler warning
|
|
*/
|
|
int fd_in, fd_out;
|
|
char header[24];
|
|
|
|
memset(header, 0, sizeof(header));
|
|
|
|
if (!STDIN) {
|
|
/* is extension at end of infile? */
|
|
if ((tmp = strrchr(control.infile, '.')) && !strcmp(tmp, control.suffix)) {
|
|
print_err("%s: already has %s suffix. Skipping...\n", control.infile, control.suffix);
|
|
return;
|
|
}
|
|
|
|
fd_in = open(control.infile, O_RDONLY);
|
|
if (unlikely(fd_in == -1))
|
|
fatal("Failed to open %s: %s\n", control.infile, strerror(errno));
|
|
} else
|
|
fd_in = 0;
|
|
|
|
if (!STDOUT) {
|
|
if (control.outname) {
|
|
/* check if outname has control.suffix */
|
|
if (*(control.suffix) == '\0') /* suffix is empty string */
|
|
control.outfile = strdup(control.outname);
|
|
else if ((tmp=strrchr(control.outname, '.')) && strcmp(tmp, control.suffix)) {
|
|
control.outfile = malloc(strlen(control.outname) + strlen(control.suffix) + 1);
|
|
if (unlikely(!control.outfile))
|
|
fatal("Failed to allocate outfile name\n");
|
|
strcpy(control.outfile, control.outname);
|
|
strcat(control.outfile, control.suffix);
|
|
print_output("Suffix added to %s.\nFull pathname is: %s\n", control.outname, control.outfile);
|
|
} else /* no, already has suffix */
|
|
control.outfile = strdup(control.outname);
|
|
} else {
|
|
/* default output name from control.infile
|
|
* test if outdir specified. If so, strip path from filename of
|
|
* control.infile
|
|
*/
|
|
if (control.outdir && (tmp = strrchr(control.infile, '/')))
|
|
tmpinfile = tmp + 1;
|
|
else
|
|
tmpinfile = control.infile;
|
|
|
|
control.outfile = malloc((control.outdir == NULL? 0: strlen(control.outdir)) + strlen(tmpinfile) + strlen(control.suffix) + 1);
|
|
if (unlikely(!control.outfile))
|
|
fatal("Failed to allocate outfile name\n");
|
|
|
|
if (control.outdir) { /* prepend control.outdir */
|
|
strcpy(control.outfile, control.outdir);
|
|
strcat(control.outfile, tmpinfile);
|
|
} else
|
|
strcpy(control.outfile, tmpinfile);
|
|
strcat(control.outfile, control.suffix);
|
|
print_progress("Output filename is: %s\n", control.outfile);
|
|
}
|
|
|
|
if (FORCE_REPLACE)
|
|
fd_out = open(control.outfile, O_WRONLY | O_CREAT | O_TRUNC, 0666);
|
|
else
|
|
fd_out = open(control.outfile, O_WRONLY | O_CREAT | O_EXCL, 0666);
|
|
if (unlikely(fd_out == -1)) {
|
|
/* We must ensure we don't delete a file that already
|
|
* exists just because we tried to create a new one */
|
|
control.flags |= FLAG_KEEP_BROKEN;
|
|
fatal("Failed to create %s: %s\n", control.outfile, strerror(errno));
|
|
}
|
|
} else
|
|
fd_out = open_tmpoutfile();
|
|
control.fd_out = fd_out;
|
|
|
|
preserve_perms(fd_in, fd_out);
|
|
|
|
/* write zeroes to 24 bytes at beginning of file */
|
|
if (unlikely(write(fd_out, header, sizeof(header)) != sizeof(header)))
|
|
fatal("Cannot write file header\n");
|
|
|
|
rzip_fd(fd_in, fd_out);
|
|
|
|
/* write magic at end b/c lzma does not tell us properties until it is done */
|
|
write_magic(fd_in, fd_out);
|
|
|
|
if (STDOUT)
|
|
dump_tmpoutfile(fd_out);
|
|
|
|
if (unlikely(close(fd_in) || close(fd_out)))
|
|
fatal("Failed to close files\n");
|
|
|
|
if (STDOUT) {
|
|
/* Delete temporary files generated for testing or faking stdout */
|
|
if (unlikely(unlink(control.outfile)))
|
|
fatal("Failed to unlink tmpfile: %s\n", strerror(errno));
|
|
}
|
|
|
|
if (!KEEP_FILES) {
|
|
if (unlikely(unlink(control.infile)))
|
|
fatal("Failed to unlink %s: %s\n", control.infile, strerror(errno));
|
|
}
|
|
|
|
free(control.outfile);
|
|
}
|
|
|
|
int main(int argc, char *argv[])
|
|
{
|
|
struct timeval start_time, end_time;
|
|
struct sigaction handler;
|
|
double seconds,total_time; // for timers
|
|
int c, i;
|
|
int hours,minutes;
|
|
extern int optind;
|
|
char *eptr; /* for environment */
|
|
|
|
memset(&control, 0, sizeof(control));
|
|
|
|
control.msgout = stderr;
|
|
control.flags = FLAG_SHOW_PROGRESS | FLAG_KEEP_FILES | FLAG_THRESHOLD;
|
|
control.suffix = ".lrz";
|
|
control.outdir = NULL;
|
|
control.tmpdir = NULL;
|
|
|
|
if (strstr(argv[0], "lrunzip"))
|
|
control.flags |= FLAG_DECOMPRESS;
|
|
|
|
control.compression_level = 7;
|
|
control.ramsize = get_ram();
|
|
control.window = 0;
|
|
/* for testing single CPU */
|
|
control.threads = PROCESSORS; /* get CPUs for LZMA */
|
|
control.page_size = PAGE_SIZE;
|
|
control.md5_read = 0;
|
|
|
|
control.nice_val = 19;
|
|
|
|
/* generate crc table */
|
|
CrcGenerateTable();
|
|
|
|
/* Get Temp Dir */
|
|
eptr = getenv("TMP");
|
|
if (eptr != NULL) {
|
|
control.tmpdir = malloc(strlen(eptr)+2);
|
|
if (control.tmpdir == NULL)
|
|
fatal("Failed to allocate for tmpdir\n");
|
|
strcpy(control.tmpdir, eptr);
|
|
if (strcmp(eptr+strlen(eptr) - 1, "/")) /* need a trailing slash */
|
|
strcat(control.tmpdir, "/");
|
|
}
|
|
|
|
/* Get Preloaded Defaults from lrzip.conf
|
|
* Look in ., $HOME/.lrzip/, /etc/lrzip.
|
|
* If LRZIP=NOCONFIG is set, then ignore config
|
|
*/
|
|
eptr = getenv("LRZIP");
|
|
if (eptr == NULL)
|
|
read_config(&control);
|
|
else if (!strstr(eptr,"NOCONFIG"))
|
|
read_config(&control);
|
|
|
|
while ((c = getopt(argc, argv, "L:h?dS:tVvDfqo:w:nlbUO:TN:p:gziHck")) != -1) {
|
|
switch (c) {
|
|
case 'b':
|
|
if (control.flags & FLAG_NOT_LZMA)
|
|
failure("Can only use one of -l, -b, -g, -z or -n\n");
|
|
control.flags |= FLAG_BZIP2_COMPRESS;
|
|
break;
|
|
case 'c':
|
|
control.flags |= FLAG_CHECK;
|
|
control.flags |= FLAG_HASH;
|
|
break;
|
|
case 'd':
|
|
control.flags |= FLAG_DECOMPRESS;
|
|
break;
|
|
case 'D':
|
|
control.flags &= ~FLAG_KEEP_FILES;
|
|
break;
|
|
case 'f':
|
|
control.flags |= FLAG_FORCE_REPLACE;
|
|
break;
|
|
case 'g':
|
|
if (control.flags & FLAG_NOT_LZMA)
|
|
failure("Can only use one of -l, -b, -g, -z or -n\n");
|
|
control.flags |= FLAG_ZLIB_COMPRESS;
|
|
break;
|
|
case 'h':
|
|
case '?':
|
|
usage();
|
|
return -1;
|
|
case 'H':
|
|
control.flags |= FLAG_HASH;
|
|
break;
|
|
case 'i':
|
|
control.flags |= FLAG_INFO;
|
|
break;
|
|
case 'k':
|
|
control.flags |= FLAG_KEEP_BROKEN;
|
|
break;
|
|
case 'l':
|
|
if (control.flags & FLAG_NOT_LZMA)
|
|
failure("Can only use one of -l, -b, -g, -z or -n\n");
|
|
control.flags |= FLAG_LZO_COMPRESS;
|
|
break;
|
|
case 'L':
|
|
control.compression_level = atoi(optarg);
|
|
if (control.compression_level < 1 || control.compression_level > 9)
|
|
failure("Invalid compression level (must be 1-9)\n");
|
|
break;
|
|
case 'n':
|
|
if (control.flags & FLAG_NOT_LZMA)
|
|
failure("Can only use one of -l, -b, -g, -z or -n\n");
|
|
control.flags |= FLAG_NO_COMPRESS;
|
|
break;
|
|
case 'N':
|
|
control.nice_val = atoi(optarg);
|
|
if (control.nice_val < -20 || control.nice_val > 19)
|
|
failure("Invalid nice value (must be -20..19)\n");
|
|
break;
|
|
case 'o':
|
|
if (control.outdir)
|
|
failure("Cannot have -o and -O together\n");
|
|
control.outname = optarg;
|
|
break;
|
|
case 'O':
|
|
if (control.outname) /* can't mix -o and -O */
|
|
failure("Cannot have options -o and -O together\n");
|
|
control.outdir = malloc(strlen(optarg) + 2);
|
|
if (control.outdir == NULL)
|
|
fatal("Failed to allocate for outdir\n");
|
|
strcpy(control.outdir,optarg);
|
|
if (strcmp(optarg+strlen(optarg) - 1, "/")) /* need a trailing slash */
|
|
strcat(control.outdir, "/");
|
|
break;
|
|
case 'p':
|
|
control.threads = atoi(optarg);
|
|
if (control.threads < 1)
|
|
failure("Must have at least one thread\n");
|
|
break;
|
|
case 'q':
|
|
control.flags &= ~FLAG_SHOW_PROGRESS;
|
|
break;
|
|
case 'S':
|
|
control.suffix = optarg;
|
|
break;
|
|
case 't':
|
|
if (control.outname)
|
|
failure("Cannot specify an output file name when just testing.\n");
|
|
if (!KEEP_FILES)
|
|
failure("Doubt that you want to delete a file when just testing.\n");
|
|
control.flags |= FLAG_TEST_ONLY;
|
|
break;
|
|
case 'T':
|
|
control.flags &= ~FLAG_THRESHOLD;
|
|
break;
|
|
case 'U':
|
|
control.flags |= FLAG_UNLIMITED;
|
|
break;
|
|
case 'v':
|
|
/* set verbosity flag */
|
|
if (!(control.flags & FLAG_VERBOSITY) && !(control.flags & FLAG_VERBOSITY_MAX))
|
|
control.flags |= FLAG_VERBOSITY;
|
|
else if ((control.flags & FLAG_VERBOSITY)) {
|
|
control.flags &= ~FLAG_VERBOSITY;
|
|
control.flags |= FLAG_VERBOSITY_MAX;
|
|
}
|
|
break;
|
|
case 'V':
|
|
print_output("lrzip version %d.%d%d\n",
|
|
LRZIP_MAJOR_VERSION, LRZIP_MINOR_VERSION, LRZIP_MINOR_SUBVERSION);
|
|
exit(0);
|
|
break;
|
|
case 'w':
|
|
control.window = atol(optarg);
|
|
break;
|
|
case 'z':
|
|
if (control.flags & FLAG_NOT_LZMA)
|
|
failure("Can only use one of -l, -b, -g, -z or -n\n");
|
|
control.flags |= FLAG_ZPAQ_COMPRESS;
|
|
break;
|
|
}
|
|
}
|
|
|
|
argc -= optind;
|
|
argv += optind;
|
|
|
|
if (control.outname && argc > 1)
|
|
failure("Cannot specify output filename with more than 1 file\n");
|
|
|
|
if (VERBOSE && !SHOW_PROGRESS) {
|
|
print_err("Cannot have -v and -q options. -v wins.\n");
|
|
control.flags |= FLAG_SHOW_PROGRESS;
|
|
}
|
|
|
|
if (UNLIMITED && control.window) {
|
|
print_err("If -U used, cannot specify a window size with -w.\n");
|
|
control.window = 0;
|
|
}
|
|
|
|
if (argc < 1)
|
|
control.flags |= FLAG_STDIN;
|
|
|
|
if (UNLIMITED && STDIN) {
|
|
print_err("Cannot have -U and stdin, unlimited mode disabled.\n");
|
|
control.flags &= ~ FLAG_UNLIMITED;
|
|
}
|
|
|
|
if (CHECK_FILE && (!DECOMPRESS || !TEST_ONLY))
|
|
print_err("Can only check file written on decompression or testing.\n");
|
|
|
|
/* Work out the compression overhead per compression thread for the
|
|
* compression back-ends that need a lot of ram */
|
|
if (LZMA_COMPRESS) {
|
|
int level = control.compression_level * 7 / 9 ? : 1;
|
|
i64 dictsize = (level <= 5 ? (1 << (level * 2 + 14)) :
|
|
(level == 6 ? (1 << 25) : (1 << 26)));
|
|
|
|
control.overhead = (dictsize * 23 / 2) + (4 * 1024 * 1024);
|
|
} else if (ZPAQ_COMPRESS)
|
|
control.overhead = 112 * 1024 * 1024;
|
|
|
|
/* OK, if verbosity set, print summary of options selected */
|
|
if (!INFO) {
|
|
i64 temp_chunk, temp_window, temp_ramsize; /* to show heurisitic computed values */
|
|
|
|
if (!TEST_ONLY)
|
|
print_verbose("The following options are in effect for this %s.\n",
|
|
DECOMPRESS ? "DECOMPRESSION" : "COMPRESSION");
|
|
print_verbose("Threading is %s. Number of CPUs detected: %d\n", control.threads > 1? "ENABLED" : "DISABLED",
|
|
control.threads);
|
|
print_verbose("Detected %lld bytes ram\n", control.ramsize);
|
|
print_verbose("Compression level %d\n", control.compression_level);
|
|
print_verbose("Nice Value: %d\n", control.nice_val);
|
|
print_verbose("Show Progress\n");
|
|
print_maxverbose("Max ");
|
|
print_verbose("Verbose\n");
|
|
if (FORCE_REPLACE)
|
|
print_verbose("Overwrite Files\n");
|
|
if (!KEEP_FILES)
|
|
print_verbose("Remove input files on completion\n");
|
|
if (control.outdir)
|
|
print_verbose("Output Directory Specified: %s\n", control.outdir);
|
|
else if (control.outname)
|
|
print_verbose("Output Filename Specified: %s\n", control.outname);
|
|
if (TEST_ONLY)
|
|
print_verbose("Test file integrity\n");
|
|
if (control.tmpdir)
|
|
print_verbose("Temporary Directory set as: %s\n", control.tmpdir);
|
|
|
|
/* show compression options */
|
|
if (!DECOMPRESS && !TEST_ONLY) {
|
|
print_verbose("Compression mode is: ");
|
|
if (LZMA_COMPRESS)
|
|
print_verbose("LZMA. LZO Compressibility testing %s\n", (LZO_TEST? "enabled" : "disabled"));
|
|
else if (LZO_COMPRESS)
|
|
print_verbose("LZO\n");
|
|
else if (BZIP2_COMPRESS)
|
|
print_verbose("BZIP2. LZO Compressibility testing %s\n", (LZO_TEST? "enabled" : "disabled"));
|
|
else if (ZLIB_COMPRESS)
|
|
print_verbose("GZIP\n");
|
|
else if (ZPAQ_COMPRESS)
|
|
print_verbose("ZPAQ. LZO Compressibility testing %s\n", (LZO_TEST? "enabled" : "disabled"));
|
|
else if (NO_COMPRESS)
|
|
print_verbose("RZIP pre-processing only\n");
|
|
if (control.window)
|
|
print_verbose("Compression Window: %lld = %lldMB\n", control.window, control.window * 100ull);
|
|
/* show heuristically computed window size */
|
|
if (!control.window && !UNLIMITED) {
|
|
temp_ramsize = control.ramsize;
|
|
if (BITS32)
|
|
temp_ramsize = MAX(temp_ramsize - 900000000ll, 900000000ll);
|
|
temp_chunk = temp_ramsize / 3 * 2;
|
|
temp_window = temp_chunk / (100 * 1024 * 1024);
|
|
print_verbose("Heuristically Computed Compression Window: %lld = %lldMB\n", temp_window, temp_window * 100ull);
|
|
}
|
|
if (UNLIMITED)
|
|
print_verbose("Using Unlimited Window size\n");
|
|
}
|
|
}
|
|
|
|
/* Decrease usable ram size on 32 bits due to kernel/userspace split */
|
|
if (BITS32)
|
|
control.ramsize = MAX(control.ramsize - 900000000ll, 900000000ll);
|
|
|
|
/* Set the main nice value to half that of the backend threads since
|
|
* the rzip stage is usually the rate limiting step */
|
|
if (control.nice_val > 0 && !NO_COMPRESS) {
|
|
if (unlikely(setpriority(PRIO_PROCESS, 0, control.nice_val / 2) == -1))
|
|
print_err("Warning, unable to set nice value\n");
|
|
} else {
|
|
if (unlikely(setpriority(PRIO_PROCESS, 0, control.nice_val) == -1))
|
|
print_err("Warning, unable to set nice value\n");
|
|
}
|
|
|
|
/* One extra iteration for the case of no parameters means we will default to stdin/out */
|
|
for (i = 0; i <= argc; i++) {
|
|
if (i < argc)
|
|
control.infile = argv[i];
|
|
else if (!(i == 0 && STDIN))
|
|
break;
|
|
if (control.infile && (strcmp(control.infile, "-") == 0))
|
|
control.flags |= FLAG_STDIN;
|
|
|
|
if (control.outname && (strcmp(control.outname, "-") == 0)) {
|
|
control.flags |= FLAG_STDOUT;
|
|
control.msgout = stderr;
|
|
}
|
|
|
|
/* If we're using stdin and no output filename, use stdout */
|
|
if (STDIN && !control.outname) {
|
|
control.flags |= FLAG_STDOUT;
|
|
control.msgout = stderr;
|
|
}
|
|
|
|
if (!STDOUT)
|
|
control.msgout = stdout;
|
|
/* Implement signal handler only once flags are set */
|
|
handler.sa_handler = &sighandler;
|
|
sigaction(SIGTERM, &handler, 0);
|
|
sigaction(SIGINT, &handler, 0);
|
|
|
|
if (!FORCE_REPLACE) {
|
|
if (STDIN && isatty(fileno((FILE *)stdin))) {
|
|
print_err("Will not read stdin from a terminal. Use -f to override.\n");
|
|
usage();
|
|
exit (1);
|
|
}
|
|
if (STDIN && isatty(fileno((FILE *)stdout))) {
|
|
print_err("Will not write stdout to a terminal. Use -f to override.\n");
|
|
usage();
|
|
exit (1);
|
|
}
|
|
}
|
|
|
|
gettimeofday(&start_time, NULL);
|
|
|
|
if (control.flags & (FLAG_DECOMPRESS | FLAG_TEST_ONLY))
|
|
decompress_file();
|
|
else if (INFO)
|
|
get_fileinfo();
|
|
else
|
|
compress_file();
|
|
|
|
/* compute total time */
|
|
gettimeofday(&end_time, NULL);
|
|
total_time = (end_time.tv_sec + (double)end_time.tv_usec / 1000000) -
|
|
(start_time.tv_sec + (double)start_time.tv_usec / 1000000);
|
|
hours = (int)total_time / 3600;
|
|
minutes = (int)(total_time - hours * 3600) / 60;
|
|
seconds = total_time - hours * 60 - minutes * 60;
|
|
if (!INFO)
|
|
print_progress("Total time: %02d:%02d:%06.3f\n", hours, minutes, seconds);
|
|
}
|
|
|
|
return 0;
|
|
}
|