mirror of
https://github.com/ckolivas/lrzip.git
synced 2025-12-06 07:12:00 +01:00
Do real stdin without the stupid temporary files by mmapping into anonymous ram.
This commit is contained in:
parent
49336a5e87
commit
43dd72b9e1
49
main.c
49
main.c
|
|
@ -174,40 +174,6 @@ static void dump_tmpoutfile(int fd_out)
|
||||||
fflush(control.msgout);
|
fflush(control.msgout);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* Open a temporary inputfile to perform stdin */
|
|
||||||
static int open_tmpinfile(void)
|
|
||||||
{
|
|
||||||
int fd_in;
|
|
||||||
|
|
||||||
control.infile = malloc(15);
|
|
||||||
strcpy(control.infile, "lrzipin.XXXXXX");
|
|
||||||
if (!control.infile)
|
|
||||||
fatal("Failed to allocate infile name\n");
|
|
||||||
|
|
||||||
fd_in = mkstemp(control.infile);
|
|
||||||
if (fd_in == -1)
|
|
||||||
fatal("Failed to create in tmpfile: %s\n", strerror(errno));
|
|
||||||
return fd_in;
|
|
||||||
}
|
|
||||||
|
|
||||||
/* Read data from stdin into temporary inputfile */
|
|
||||||
static void read_tmpinfile(int fd_in)
|
|
||||||
{
|
|
||||||
FILE *tmpinfp;
|
|
||||||
int tmpchar;
|
|
||||||
|
|
||||||
print_progress("Copying from stdin.\n");
|
|
||||||
tmpinfp = fdopen(fd_in, "w+");
|
|
||||||
if (tmpinfp == NULL)
|
|
||||||
fatal("Failed to fdopen in tmpfile: %s\n", strerror(errno));
|
|
||||||
|
|
||||||
while ((tmpchar = getchar()) != EOF)
|
|
||||||
fputc(tmpchar, tmpinfp);
|
|
||||||
|
|
||||||
fflush(tmpinfp);
|
|
||||||
rewind(tmpinfp);
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
decompress one file from the command line
|
decompress one file from the command line
|
||||||
*/
|
*/
|
||||||
|
|
@ -352,10 +318,9 @@ static void get_fileinfo(void)
|
||||||
infilecopy = strdup(control.infile);
|
infilecopy = strdup(control.infile);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (STDIN) {
|
if (STDIN)
|
||||||
fd_in = open_tmpinfile();
|
fd_in = 0;
|
||||||
read_tmpinfile(fd_in);
|
else {
|
||||||
} else {
|
|
||||||
fd_in = open(infilecopy, O_RDONLY);
|
fd_in = open(infilecopy, O_RDONLY);
|
||||||
if (fd_in == -1)
|
if (fd_in == -1)
|
||||||
fatal("Failed to open %s: %s\n", infilecopy, strerror(errno));
|
fatal("Failed to open %s: %s\n", infilecopy, strerror(errno));
|
||||||
|
|
@ -434,10 +399,8 @@ static void compress_file(void)
|
||||||
fd_in = open(control.infile, O_RDONLY);
|
fd_in = open(control.infile, O_RDONLY);
|
||||||
if (fd_in == -1)
|
if (fd_in == -1)
|
||||||
fatal("Failed to open %s: %s\n", control.infile, strerror(errno));
|
fatal("Failed to open %s: %s\n", control.infile, strerror(errno));
|
||||||
} else {
|
} else
|
||||||
fd_in = open_tmpinfile();
|
fd_in = 0;
|
||||||
read_tmpinfile(fd_in);
|
|
||||||
}
|
|
||||||
|
|
||||||
if (!STDOUT) {
|
if (!STDOUT) {
|
||||||
if (control.outname) {
|
if (control.outname) {
|
||||||
|
|
@ -509,7 +472,7 @@ static void compress_file(void)
|
||||||
fatal("Failed to unlink tmpfile: %s\n", strerror(errno));
|
fatal("Failed to unlink tmpfile: %s\n", strerror(errno));
|
||||||
}
|
}
|
||||||
|
|
||||||
if (!KEEP_FILES || STDIN) {
|
if (!KEEP_FILES) {
|
||||||
if (unlink(control.infile) != 0)
|
if (unlink(control.infile) != 0)
|
||||||
fatal("Failed to unlink %s: %s\n", control.infile, strerror(errno));
|
fatal("Failed to unlink %s: %s\n", control.infile, strerror(errno));
|
||||||
}
|
}
|
||||||
|
|
|
||||||
62
rzip.c
62
rzip.c
|
|
@ -74,6 +74,7 @@ struct rzip_state {
|
||||||
char chunk_bytes;
|
char chunk_bytes;
|
||||||
uint32_t cksum;
|
uint32_t cksum;
|
||||||
int fd_in, fd_out;
|
int fd_in, fd_out;
|
||||||
|
int stdin_eof;
|
||||||
struct {
|
struct {
|
||||||
i64 inserts;
|
i64 inserts;
|
||||||
i64 literals;
|
i64 literals;
|
||||||
|
|
@ -519,6 +520,43 @@ static void init_hash_indexes(struct rzip_state *st)
|
||||||
st->hash_index[i] = ((random() << 16) ^ random());
|
st->hash_index[i] = ((random() << 16) ^ random());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
extern const i64 one_g;
|
||||||
|
|
||||||
|
/* stdin is not file backed so we have to emulate the mmap by mapping
|
||||||
|
* anonymous ram and reading stdin into it. It means the maximum ram
|
||||||
|
* we can use will be less but we will already have determined this in
|
||||||
|
* rzip_chunk */
|
||||||
|
static void mmap_stdin(uchar *buf, struct rzip_state *st)
|
||||||
|
{
|
||||||
|
i64 len = st->chunk_size;
|
||||||
|
uchar *offset_buf = buf;
|
||||||
|
ssize_t ret;
|
||||||
|
i64 total;
|
||||||
|
|
||||||
|
total = 0;
|
||||||
|
print_verbose("Reading stdin into mmapped ram...\n");
|
||||||
|
while (len > 0) {
|
||||||
|
if (len > one_g)
|
||||||
|
ret = one_g;
|
||||||
|
else
|
||||||
|
ret = len;
|
||||||
|
ret = read(0, offset_buf, (size_t)ret);
|
||||||
|
if (ret < 0)
|
||||||
|
fatal("Failed to read in mmap_stdin\n");
|
||||||
|
total += ret;
|
||||||
|
if (ret == 0) {
|
||||||
|
/* Should be EOF */
|
||||||
|
print_maxverbose("Shrinking chunk to %lld\n", total);
|
||||||
|
buf = mremap(buf, st->chunk_size, total, 0);
|
||||||
|
st->chunk_size = total;
|
||||||
|
st->stdin_eof = 1;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
offset_buf += ret;
|
||||||
|
len -= ret;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
/* compress a chunk of an open file. Assumes that the file is able to
|
/* compress a chunk of an open file. Assumes that the file is able to
|
||||||
be mmap'd and is seekable */
|
be mmap'd and is seekable */
|
||||||
static void rzip_chunk(struct rzip_state *st, int fd_in, int fd_out, i64 offset,
|
static void rzip_chunk(struct rzip_state *st, int fd_in, int fd_out, i64 offset,
|
||||||
|
|
@ -545,13 +583,20 @@ static void rzip_chunk(struct rzip_state *st, int fd_in, int fd_out, i64 offset,
|
||||||
print_maxverbose("Preallocated %lld ram...\n", prealloc_size);
|
print_maxverbose("Preallocated %lld ram...\n", prealloc_size);
|
||||||
if (!memset(buf, 0, prealloc_size))
|
if (!memset(buf, 0, prealloc_size))
|
||||||
fatal("Failed to memset in rzip_chunk\n");
|
fatal("Failed to memset in rzip_chunk\n");
|
||||||
if (munmap(buf, prealloc_size) != 0)
|
if (!STDIN) {
|
||||||
fatal("Failed to munmap in rzip_chunk\n");
|
if (munmap(buf, prealloc_size) != 0)
|
||||||
|
fatal("Failed to munmap in rzip_chunk\n");
|
||||||
|
} else
|
||||||
|
st->chunk_size = prealloc_size;
|
||||||
|
}
|
||||||
|
if (!STDIN) {
|
||||||
|
print_verbose("Reading file into mmapped ram...\n");
|
||||||
|
buf = (uchar *)mmap(buf, st->chunk_size, PROT_READ, MAP_SHARED, fd_in, offset);
|
||||||
}
|
}
|
||||||
print_verbose("Reading file into mmapped ram...\n");
|
|
||||||
buf = (uchar *)mmap(buf, st->chunk_size, PROT_READ, MAP_SHARED, fd_in, offset);
|
|
||||||
if (buf == (uchar *)-1)
|
if (buf == (uchar *)-1)
|
||||||
fatal("Failed to map buffer in rzip_chunk\n");
|
fatal("Failed to map buffer in rzip_chunk\n");
|
||||||
|
if (STDIN)
|
||||||
|
mmap_stdin(buf, st);
|
||||||
|
|
||||||
st->ss = open_stream_out(fd_out, NUM_STREAMS, limit);
|
st->ss = open_stream_out(fd_out, NUM_STREAMS, limit);
|
||||||
if (!st->ss)
|
if (!st->ss)
|
||||||
|
|
@ -603,6 +648,7 @@ void rzip_fd(int fd_in, int fd_out)
|
||||||
st->level = &levels[MIN(9, control.window)];
|
st->level = &levels[MIN(9, control.window)];
|
||||||
st->fd_in = fd_in;
|
st->fd_in = fd_in;
|
||||||
st->fd_out = fd_out;
|
st->fd_out = fd_out;
|
||||||
|
st->stdin_eof = 0;
|
||||||
|
|
||||||
init_hash_indexes(st);
|
init_hash_indexes(st);
|
||||||
|
|
||||||
|
|
@ -612,7 +658,7 @@ void rzip_fd(int fd_in, int fd_out)
|
||||||
last.tv_sec = last.tv_usec = 0;
|
last.tv_sec = last.tv_usec = 0;
|
||||||
gettimeofday(&start, NULL);
|
gettimeofday(&start, NULL);
|
||||||
|
|
||||||
while (len) {
|
while (len > 0 || (STDIN && !st->stdin_eof)) {
|
||||||
double pct_base, pct_multiple;
|
double pct_base, pct_multiple;
|
||||||
i64 chunk, limit = 0;
|
i64 chunk, limit = 0;
|
||||||
int bits = 8;
|
int bits = 8;
|
||||||
|
|
@ -625,7 +671,7 @@ void rzip_fd(int fd_in, int fd_out)
|
||||||
print_verbose("Flushing data to disk.\n");
|
print_verbose("Flushing data to disk.\n");
|
||||||
fsync(fd_out);
|
fsync(fd_out);
|
||||||
chunk = chunk_window;
|
chunk = chunk_window;
|
||||||
if (chunk > len)
|
if (chunk > len && !STDIN)
|
||||||
chunk = len;
|
chunk = len;
|
||||||
limit = chunk;
|
limit = chunk;
|
||||||
st->chunk_size = chunk;
|
st->chunk_size = chunk;
|
||||||
|
|
@ -633,7 +679,9 @@ void rzip_fd(int fd_in, int fd_out)
|
||||||
|
|
||||||
/* Determine the chunk byte width and write it to the file
|
/* Determine the chunk byte width and write it to the file
|
||||||
* This allows archives of different chunk sizes to have
|
* This allows archives of different chunk sizes to have
|
||||||
* optimal byte width entries. */
|
* optimal byte width entries. When working with stdin we
|
||||||
|
* won't know in advance how big it is so it will always be
|
||||||
|
* rounded up to the window size. */
|
||||||
while (chunk >> bits > 0)
|
while (chunk >> bits > 0)
|
||||||
bits++;
|
bits++;
|
||||||
st->chunk_bytes = bits / 8;
|
st->chunk_bytes = bits / 8;
|
||||||
|
|
|
||||||
Loading…
Reference in a new issue