Begin massive read changes to support using temporary file for STDIN.

This commit is contained in:
Con Kolivas 2011-03-14 20:22:45 +11:00
parent 91b8382214
commit 36e09f206e
4 changed files with 105 additions and 35 deletions

25
lrzip.c
View file

@ -327,6 +327,24 @@ void dump_tmpoutfile(rzip_control *control, int fd_out)
fatal("Failed to ftruncate fd_out in dump_tmpoutfile\n"); fatal("Failed to ftruncate fd_out in dump_tmpoutfile\n");
} }
/* Fallback for when STDIN cannot be read into the temporary input buffer:
 * shunts the in_len bytes held in tmp_inbuf out to the temporary file fd_in.
 * Data is written in pieces of at most one_g bytes; a write that fails or
 * makes no progress is fatal. */
void write_fdin(struct rzip_control *control)
{
	uchar *src = control->tmp_inbuf;
	i64 remaining;

	for (remaining = control->in_len; remaining > 0; ) {
		/* Cap each request at one_g, then continue from wherever the
		 * previous (possibly short) write stopped */
		size_t chunk = (size_t)MIN(remaining, one_g);
		ssize_t written = write(control->fd_in, src, chunk);

		if (unlikely(written <= 0))
			fatal("Failed to write to fd_in in write_fdin\n");
		src += written;
		remaining -= written;
	}
}
/* Open a temporary inputfile to perform stdin decompression */ /* Open a temporary inputfile to perform stdin decompression */
int open_tmpinfile(rzip_control *control) int open_tmpinfile(rzip_control *control)
{ {
@ -497,9 +515,14 @@ void decompress_file(rzip_control *control)
if (STDIN) { if (STDIN) {
fd_in = open_tmpinfile(control); fd_in = open_tmpinfile(control);
open_tmpinbuf(control);
read_tmpinmagic(control); read_tmpinmagic(control);
expected_size = control->st_size; expected_size = control->st_size;
/* Version 0.6+ files we can tell how much to read for each
* chunk in advance and decide if we can do it using a
* temporary buffer instead of a temporary file */
if (control->major_version == 0 && control->minor_version > 5)
open_tmpinbuf(control);
else
read_tmpinfile(control, fd_in); read_tmpinfile(control, fd_in);
} else { } else {
fd_in = open(infilecopy, O_RDONLY); fd_in = open(infilecopy, O_RDONLY);

View file

@ -88,8 +88,6 @@ static i64 seekto_fdout(rzip_control *control, i64 pos)
if (control->out_ofs > control->out_len) if (control->out_ofs > control->out_len)
control->out_len = control->out_ofs; control->out_len = control->out_ofs;
if (unlikely(control->out_ofs < 0 || control->out_ofs > control->out_maxlen)) { if (unlikely(control->out_ofs < 0 || control->out_ofs > control->out_maxlen)) {
print_err("out_ofs %lld out_len %lld hist_ofs %lld out_relofs %lld\n",
control->out_ofs, control->out_len, control->hist_ofs, control->out_relofs);
print_err("Trying to seek outside tmpoutbuf to %lld in seekto_fdout\n", control->out_ofs); print_err("Trying to seek outside tmpoutbuf to %lld in seekto_fdout\n", control->out_ofs);
return -1; return -1;
} }
@ -104,14 +102,19 @@ static i64 seekto_fdhist(rzip_control *control, i64 pos)
if (control->hist_ofs > control->out_len) if (control->hist_ofs > control->out_len)
control->out_len = control->hist_ofs; control->out_len = control->hist_ofs;
if (unlikely(control->hist_ofs < 0 || control->hist_ofs > control->out_maxlen)) { if (unlikely(control->hist_ofs < 0 || control->hist_ofs > control->out_maxlen)) {
print_err("out_ofs %lld out_len %lld hist_ofs %lld out_relofs %lld\n",
control->out_ofs, control->out_len, control->hist_ofs, control->out_relofs);
print_err("Trying to seek outside tmpoutbuf to %lld in seekto_fdhist\n", control->hist_ofs); print_err("Trying to seek outside tmpoutbuf to %lld in seekto_fdhist\n", control->hist_ofs);
return -1; return -1;
} }
return pos; return pos;
} }
/* Report the current read position of the input. Without the temporary
 * input buffer this is whatever lseek reports for fd_in (including -1 on
 * error); with it, the position is in_relofs plus in_ofs. */
static i64 seekcur_fdin(struct rzip_control *control)
{
	i64 cur;

	if (!TMP_INBUF) {
		cur = lseek(control->fd_in, 0, SEEK_CUR);
		return cur;
	}

	cur = control->in_relofs + control->in_ofs;
	return cur;
}
static i64 read_header(rzip_control *control, void *ss, uchar *head) static i64 read_header(rzip_control *control, void *ss, uchar *head)
{ {
int chunk_bytes = 2; int chunk_bytes = 2;
@ -154,7 +157,7 @@ static i64 unzip_literal(rzip_control *control, void *ss, i64 len, int fd_out, u
static i64 read_fdhist(struct rzip_control *control, void *buf, i64 len) static i64 read_fdhist(struct rzip_control *control, void *buf, i64 len)
{ {
if (!TMP_OUTBUF) if (!TMP_OUTBUF)
return read_1g(control->fd_hist, buf, len); return read_1g(control, control->fd_hist, buf, len);
if (unlikely(len + control->hist_ofs > control->out_maxlen)) { if (unlikely(len + control->hist_ofs > control->out_maxlen)) {
print_err("Trying to read beyond end of tmpoutbuf in read_fdhist\n"); print_err("Trying to read beyond end of tmpoutbuf in read_fdhist\n");
return -1; return -1;
@ -257,7 +260,7 @@ static i64 runzip_chunk(rzip_control *control, int fd_in, int fd_out, int fd_his
print_maxverbose("Expected size: %lld\n", expected_size); print_maxverbose("Expected size: %lld\n", expected_size);
print_maxverbose("Chunk byte width: %d\n", chunk_bytes); print_maxverbose("Chunk byte width: %d\n", chunk_bytes);
ofs = lseek(fd_in, 0, SEEK_CUR); ofs = seekcur_fdin(control);
if (unlikely(ofs == -1)) if (unlikely(ofs == -1))
fatal("Failed to seek input file in runzip_fd\n"); fatal("Failed to seek input file in runzip_fd\n");

View file

@ -680,13 +680,57 @@ ssize_t write_1g(rzip_control *control, void *buf, i64 len)
return total; return total;
} }
/* Pull len more bytes from STDIN into the temporary input buffer.
 *
 * The new bytes are appended directly after the in_len bytes already
 * buffered, and in_len grows by len. in_ofs is deliberately left alone:
 * read_1g copies out of the buffer starting at in_ofs and advances in_ofs
 * itself, so moving it here as well would make that copy skip the data that
 * was just read and advance the offset twice. Appending at in_len rather
 * than at in_ofs also avoids overwriting buffered data when in_ofs is behind
 * in_len.
 *
 * No bounds checking is done here; the caller must have verified that the
 * buffer can hold the extra bytes. Reaching EOF before len bytes have
 * arrived is reported through failure(). */
static void read_fdin(struct rzip_control *control, i64 len)
{
	int tmpchar;
	i64 i;

	for (i = 0; i < len; i++) {
		tmpchar = getchar();
		if (unlikely(tmpchar == EOF))
			failure("Reached end of file on STDIN prematurely on read_fdin\n");
		control->tmp_inbuf[control->in_len + i] = (char)tmpchar;
	}
	control->in_len += len;
}
/* Move the input read position to absolute offset pos.
 *
 * Without the temporary input buffer this is a plain lseek on fd_in and its
 * result is returned. With the buffer, pos is converted to a buffer-relative
 * offset by subtracting in_relofs and stored in in_ofs; pos is returned if
 * that offset lies within [0, in_len], otherwise an error is printed and -1
 * is returned. Note that in_ofs is stored before it is validated, so it
 * keeps the out-of-range value on failure. */
static i64 seekto_fdin(rzip_control *control, i64 pos)
{
	if (!TMP_INBUF)
		return lseek(control->fd_in, pos, SEEK_SET);

	control->in_ofs = pos - control->in_relofs;

	if (unlikely(control->in_ofs < 0 || control->in_ofs > control->in_len)) {
		print_err("Tried to seek outside of in_ofs range in seekto_fdin\n");
		return -1;
	}

	return pos;
}
/* Ditto for read */ /* Ditto for read */
ssize_t read_1g(int fd, void *buf, i64 len) ssize_t read_1g(rzip_control *control, int fd, void *buf, i64 len)
{ {
uchar *offset_buf = buf; uchar *offset_buf = buf;
ssize_t ret; ssize_t ret;
i64 total; i64 total;
if (TMP_INBUF && fd == control->fd_in) {
/* We're decompressing from STDIN */
if (unlikely(control->in_ofs + len > control->in_maxlen)) {
/* We're unable to fit it all into the temp buffer */
write_fdin(control);
read_tmpinfile(control, control->fd_in);
close_tmpinbuf(control);
goto read_fd;
}
if (control->in_ofs + len > control->in_len)
read_fdin(control, control->in_ofs + len - control->in_len);
memcpy(buf, control->tmp_inbuf + control->in_ofs, len);
control->in_ofs += len;
return len;
}
read_fd:
total = 0; total = 0;
while (len > 0) { while (len > 0) {
ret = MIN(len, one_g); ret = MIN(len, one_g);
@ -732,11 +776,11 @@ static int write_i64(rzip_control *control, int f, i64 v)
return 0; return 0;
} }
static int read_buf(int f, uchar *p, i64 len) static int read_buf(rzip_control *control, int f, uchar *p, i64 len)
{ {
ssize_t ret; ssize_t ret;
ret = read_1g(f, p, (size_t)len); ret = read_1g(control, f, p, (size_t)len);
if (unlikely(ret == -1)) { if (unlikely(ret == -1)) {
print_err("Read of length %lld failed - %s\n", len, strerror(errno)); print_err("Read of length %lld failed - %s\n", len, strerror(errno));
return -1; return -1;
@ -748,21 +792,21 @@ static int read_buf(int f, uchar *p, i64 len)
return 0; return 0;
} }
static int read_u8(int f, uchar *v) static int read_u8(rzip_control *control, int f, uchar *v)
{ {
return read_buf(f, v, 1); return read_buf(control, f, v, 1);
} }
static int read_u32(int f, u32 *v) static int read_u32(rzip_control *control, int f, u32 *v)
{ {
if (unlikely(read_buf(f, (uchar *)v, 4))) if (unlikely(read_buf(control, f, (uchar *)v, 4)))
return -1; return -1;
return 0; return 0;
} }
static int read_i64(int f, i64 *v) static int read_i64(rzip_control *control, int f, i64 *v)
{ {
if (unlikely(read_buf(f, (uchar *)v, 8))) if (unlikely(read_buf(control, f, (uchar *)v, 8)))
return -1; return -1;
return 0; return 0;
} }
@ -978,12 +1022,12 @@ void *open_stream_in(rzip_control *control, int f, int n)
if (control->major_version == 0 && control->minor_version > 5) { if (control->major_version == 0 && control->minor_version > 5) {
/* Read in flag that tells us if there are more chunks after /* Read in flag that tells us if there are more chunks after
* this. Ignored if we know the final file size */ * this. Ignored if we know the final file size */
if (unlikely(read_u8(f, &control->eof))) { if (unlikely(read_u8(control, f, &control->eof))) {
print_err("Failed to read eof flag in open_stream_in\n"); print_err("Failed to read eof flag in open_stream_in\n");
goto failed; goto failed;
} }
/* Read in the expected chunk size */ /* Read in the expected chunk size */
if (unlikely(read_i64(f, &sinfo->size))) { if (unlikely(read_i64(control, f, &sinfo->size))) {
print_err("Failed to read in chunk size in open_stream_in\n"); print_err("Failed to read in chunk size in open_stream_in\n");
goto failed; goto failed;
} }
@ -1001,18 +1045,18 @@ void *open_stream_in(rzip_control *control, int f, int n)
sinfo->s[i].unext_thread = sinfo->s[i].base_thread; sinfo->s[i].unext_thread = sinfo->s[i].base_thread;
again: again:
if (unlikely(read_u8(f, &c))) if (unlikely(read_u8(control, f, &c)))
goto failed; goto failed;
/* Compatibility crap for versions < 0.40 */ /* Compatibility crap for versions < 0.40 */
if (control->major_version == 0 && control->minor_version < 4) { if (control->major_version == 0 && control->minor_version < 4) {
u32 v132, v232, last_head32; u32 v132, v232, last_head32;
if (unlikely(read_u32(f, &v132))) if (unlikely(read_u32(control, f, &v132)))
goto failed; goto failed;
if (unlikely(read_u32(f, &v232))) if (unlikely(read_u32(control, f, &v232)))
goto failed; goto failed;
if ((read_u32(f, &last_head32))) if ((read_u32(control, f, &last_head32)))
goto failed; goto failed;
v1 = v132; v1 = v132;
@ -1020,11 +1064,11 @@ again:
sinfo->s[i].last_head = last_head32; sinfo->s[i].last_head = last_head32;
header_length = 13; header_length = 13;
} else { } else {
if (unlikely(read_i64(f, &v1))) if (unlikely(read_i64(control, f, &v1)))
goto failed; goto failed;
if (unlikely(read_i64(f, &v2))) if (unlikely(read_i64(control, f, &v2)))
goto failed; goto failed;
if (unlikely(read_i64(f, &sinfo->s[i].last_head))) if (unlikely(read_i64(control, f, &sinfo->s[i].last_head)))
goto failed; goto failed;
header_length = 25; header_length = 25;
} }
@ -1304,29 +1348,29 @@ fill_another:
if (unlikely(read_seekto(control, sinfo, s->last_head))) if (unlikely(read_seekto(control, sinfo, s->last_head)))
return -1; return -1;
if (unlikely(read_u8(sinfo->fd, &c_type))) if (unlikely(read_u8(control, sinfo->fd, &c_type)))
return -1; return -1;
/* Compatibility crap for versions < 0.4 */ /* Compatibility crap for versions < 0.4 */
if (control->major_version == 0 && control->minor_version < 4) { if (control->major_version == 0 && control->minor_version < 4) {
u32 c_len32, u_len32, last_head32; u32 c_len32, u_len32, last_head32;
if (unlikely(read_u32(sinfo->fd, &c_len32))) if (unlikely(read_u32(control, sinfo->fd, &c_len32)))
return -1; return -1;
if (unlikely(read_u32(sinfo->fd, &u_len32))) if (unlikely(read_u32(control, sinfo->fd, &u_len32)))
return -1; return -1;
if (unlikely(read_u32(sinfo->fd, &last_head32))) if (unlikely(read_u32(control, sinfo->fd, &last_head32)))
return -1; return -1;
c_len = c_len32; c_len = c_len32;
u_len = u_len32; u_len = u_len32;
last_head = last_head32; last_head = last_head32;
header_length = 13; header_length = 13;
} else { } else {
if (unlikely(read_i64(sinfo->fd, &c_len))) if (unlikely(read_i64(control, sinfo->fd, &c_len)))
return -1; return -1;
if (unlikely(read_i64(sinfo->fd, &u_len))) if (unlikely(read_i64(control, sinfo->fd, &u_len)))
return -1; return -1;
if (unlikely(read_i64(sinfo->fd, &last_head))) if (unlikely(read_i64(control, sinfo->fd, &last_head)))
return -1; return -1;
header_length = 25; header_length = 25;
} }
@ -1340,7 +1384,7 @@ fill_another:
fatal("Unable to malloc buffer of size %lld in fill_buffer\n", u_len); fatal("Unable to malloc buffer of size %lld in fill_buffer\n", u_len);
sinfo->ram_alloced += u_len; sinfo->ram_alloced += u_len;
if (unlikely(read_buf(sinfo->fd, s_buf, c_len))) if (unlikely(read_buf(control, sinfo->fd, s_buf, c_len)))
return -1; return -1;
sinfo->total_read += c_len; sinfo->total_read += c_len;

View file

@ -27,7 +27,7 @@ void create_pthread(pthread_t *thread, pthread_attr_t *attr,
void * (*start_routine)(void *), void *arg); void * (*start_routine)(void *), void *arg);
void join_pthread(pthread_t th, void **thread_return); void join_pthread(pthread_t th, void **thread_return);
ssize_t write_1g(rzip_control *control, void *buf, i64 len); ssize_t write_1g(rzip_control *control, void *buf, i64 len);
ssize_t read_1g(int fd, void *buf, i64 len); ssize_t read_1g(rzip_control *control, int fd, void *buf, i64 len);
void prepare_streamout_threads(rzip_control *control); void prepare_streamout_threads(rzip_control *control);
void close_streamout_threads(rzip_control *control); void close_streamout_threads(rzip_control *control);
void *open_stream_out(rzip_control *control, int f, unsigned int n, i64 chunk_limit, char cbytes); void *open_stream_out(rzip_control *control, int f, unsigned int n, i64 chunk_limit, char cbytes);