Single thread uncompress working, no sparse support.

author Richard W.M. Jones <rjones@redhat.com>

Mon, 21 Oct 2013 12:59:16 +0000 (13:59 +0100)

committer Richard W.M. Jones <rjones@redhat.com>

Mon, 21 Oct 2013 12:59:16 +0000 (13:59 +0100)
author Richard W.M. Jones <rjones@redhat.com>
Mon, 21 Oct 2013 12:59:16 +0000 (13:59 +0100)
committer Richard W.M. Jones <rjones@redhat.com>
Mon, 21 Oct 2013 12:59:16 +0000 (13:59 +0100)
diff --git a/configure.ac b/configure.ac

index 7bdce4d..c34e1a1 100644 (file)
--- a/configure.ac
+++ b/configure.ac
@@ -16,6 +16,9 @@ test "x$U" != "x" && AC_MSG_ERROR([Compiler not ANSI compliant])
  
  AM_PROG_CC_C_O
  
+dnl Check support for 64 bit file offsets.
+AC_SYS_LARGEFILE
+
  PKG_CHECK_MODULES([LIBLZMA], [liblzma])
  
  AC_CONFIG_HEADERS([config.h])
diff --git a/pxzcat.c b/pxzcat.c

index 0ac0eb9..befc2c0 100644 (file)
--- a/pxzcat.c
+++ b/pxzcat.c
@@ -50,7 +50,7 @@
  #define DEBUG 1
  
  #if DEBUG
-#define debug(fs,...) fprintf (stderr, "pxzcat: debug: " fs, ## __VA_ARGS__)
+#define debug(fs,...) fprintf (stderr, "pxzcat: debug: " fs "\n", ## __VA_ARGS__)
  #else
  #define debug(fs,...) /* nothing */
  #endif
@@ -64,7 +64,7 @@ static void usage (int exitcode);
  static void xzfile_uncompress (const char *filename, const char *outputfile);
  static int check_header_magic (int fd);
  static lzma_index *parse_indexes (const char *filename, int fd);
-static void iter_indexes (lzma_index *idx);
+static void iter_blocks (lzma_index *idx, const char *filename, int fd, const char *outputfile, int ofd);
  
  static struct option long_options[] = {
    { "output",   required_argument,  0, 'o' },
@@ -124,7 +124,7 @@ usage (int exitcode)
  static void
  xzfile_uncompress (const char *filename, const char *outputfile)
  {
-  int fd;
+  int fd, ofd;
    uint64_t size;
    lzma_index *idx;
  
@@ -140,8 +140,18 @@ xzfile_uncompress (const char *filename, const char *outputfile)
    /* Read and parse the indexes. */
    idx = parse_indexes (filename, fd);
  
-  /* Iterate over indexes and uncompress. */
-  iter_indexes (idx);
+  /* Get the file uncompressed size, create the output file. */
+  size = lzma_index_uncompressed_size (idx);
+  debug ("uncompressed size = %" PRIu64 " bytes", size);
+
+  ofd = open (outputfile, O_WRONLY|O_CREAT|O_TRUNC|O_NOCTTY, 0644);
+  if (ofd == -1)
+    error (EXIT_FAILURE, errno, "open: %s", outputfile);
+  if (ftruncate (ofd, size) == -1)
+    error (EXIT_FAILURE, errno, "ftruncate: %s", outputfile);
+
+  /* Iterate over blocks and uncompress. */
+  iter_blocks (idx, filename, fd, outputfile, ofd);
  
    close (fd);
  }
@@ -315,166 +325,115 @@ parse_indexes (const char *filename, int fd)
    return combined_index;
  }
  
-/* Iterate over the indexes and uncompress.
- */
+/* Iterate over the blocks and uncompress. */
  static void
-iter_indexes (lzma_index *idx)
-{
-  lzma_index_iter iter;
-
-  lzma_index_iter_init (&iter, idx);
-  while (!lzma_index_iter_next (&iter, LZMA_INDEX_ITER_NONEMPTY_BLOCK)) {
-    abort ();
-
-
-
-
-  }
-}
-
-#if 0
-char *
-xzfile_read_block (xzfile *xz, uint64_t offset,
-                   uint64_t *start_rtn, uint64_t *size_rtn)
+iter_blocks (lzma_index *idx,
+             const char *filename, int fd, const char *outputfile, int ofd)
  {
    lzma_index_iter iter;
    uint8_t header[LZMA_BLOCK_HEADER_SIZE_MAX];
+  ssize_t n;
    lzma_block block;
    lzma_filter filters[LZMA_FILTERS_MAX + 1];
    lzma_ret r;
    lzma_stream strm = LZMA_STREAM_INIT;
-  char *data;
-  ssize_t n;
+  char outbuf[BUFSIZ];
    size_t i;
  
-  /* Locate the block containing the uncompressed offset. */
-  lzma_index_iter_init (&iter, xz->idx);
-  if (lzma_index_iter_locate (&iter, offset)) {
-    nbdkit_error ("cannot find offset %" PRIu64 " in the xz file", offset);
-    return NULL;
-  }
-
-  *start_rtn = iter.block.uncompressed_file_offset;
-  *size_rtn = iter.block.uncompressed_size;
-
-  nbdkit_debug ("seek: block number %d at file offset %" PRIu64,
-                (int) iter.block.number_in_file,
-                (uint64_t) iter.block.compressed_file_offset);
-
-  if (lseek (xz->fd, iter.block.compressed_file_offset, SEEK_SET) == -1) {
-    nbdkit_error ("lseek: %m");
-    return NULL;
-  }
-
-  /* Read the block header.  Start by reading a single byte which
-   * tell us how big the block header is.
-   */
-  n = read (xz->fd, header, 1);
-  if (n == 0) {
-    nbdkit_error ("read: unexpected end of file reading block header byte");
-    return NULL;
-  }
-  if (n == -1) {
-    nbdkit_error ("read: %m");
-    return NULL;
-  }
-
-  if (header[0] == '\0') {
-    nbdkit_error ("read: unexpected invalid block in file, header[0] = 0");
-    return NULL;
-  }
-
-  block.version = 0;
-  block.check = iter.stream.flags->check;
-  block.filters = filters;
-  block.header_size = lzma_block_header_size_decode (header[0]);
+  lzma_index_iter_init (&iter, idx);
+  while (!lzma_index_iter_next (&iter, LZMA_INDEX_ITER_NONEMPTY_BLOCK)) {
+    /* Seek to the start of the block in the input file. */
+    if (lseek (fd, iter.block.compressed_file_offset, SEEK_SET) == -1)
+      error (EXIT_FAILURE, errno, "lseek");
  
-  /* Now read and decode the block header. */
-  n = read (xz->fd, &header[1], block.header_size-1);
-  if (n >= 0 && n != block.header_size-1) {
-    nbdkit_error ("read: unexpected end of file reading block header");
-    return NULL;
-  }
-  if (n == -1) {
-    nbdkit_error ("read: %m");
-    return NULL;
-  }
+    /* Read the block header.  Start by reading a single byte which
+     * tell us how big the block header is.
+     */
+    n = read (fd, header, 1);
+    if (n == 0)
+      error (EXIT_FAILURE, 0,
+             "%s: read: unexpected end of file reading block header byte",
+             filename);
+    if (n == -1)
+      error (EXIT_FAILURE, errno, "%s: read", filename);
+
+    if (header[0] == '\0')
+      error (EXIT_FAILURE, errno,
+             "%s: read: unexpected invalid block in file, header[0] = 0",
+             filename);
+
+    block.version = 0;
+    block.check = iter.stream.flags->check;
+    block.filters = filters;
+    block.header_size = lzma_block_header_size_decode (header[0]);
+
+    /* Now read and decode the block header. */
+    n = read (fd, &header[1], block.header_size-1);
+    if (n >= 0 && n != block.header_size-1)
+      error (EXIT_FAILURE, 0,
+             "%s: read: unexpected end of file reading block header",
+             filename);
+    if (n == -1)
+      error (EXIT_FAILURE, errno, "%s: read", filename);
  
-  r = lzma_block_header_decode (&block, NULL, header);
-  if (r != LZMA_OK) {
-    nbdkit_error ("invalid block header (error %d)", r);
-    return NULL;
-  }
+    r = lzma_block_header_decode (&block, NULL, header);
+    if (r != LZMA_OK)
+      error (EXIT_FAILURE, errno, "%s: invalid block header (error %d)",
+             filename, r);
  
-  /* What this actually does is it checks that the block header
-   * matches the index.
-   */
-  r = lzma_block_compressed_size (&block, iter.block.unpadded_size);
-  if (r != LZMA_OK) {
-    nbdkit_error ("cannot calculate compressed size (error %d)", r);
-    goto err1;
-  }
+    /* What this actually does is it checks that the block header
+     * matches the index.
+     */
+    r = lzma_block_compressed_size (&block, iter.block.unpadded_size);
+    if (r != LZMA_OK)
+      error (EXIT_FAILURE, errno,
+             "%s: cannot calculate compressed size (error %d)", filename, r);
  
-  /* Read the block data. */
-  r = lzma_block_decoder (&strm, &block);
-  if (r != LZMA_OK) {
-    nbdkit_error ("invalid block (error %d)", r);
-    goto err1;
-  }
+    /* Read the block data and uncompress it. */
+    r = lzma_block_decoder (&strm, &block);
+    if (r != LZMA_OK)
+      error (EXIT_FAILURE, 0, "%s: invalid block (error %d)", filename, r);
  
-  data = malloc (*size_rtn);
-  if (data == NULL) {
-    nbdkit_error ("malloc (%zu bytes): %m\n"
-                  "NOTE: If this error occurs, you need to recompress your xz files with a smaller block size.  Use: 'xz --block-size=16777216 ...'.",
-                  *size_rtn);
-    goto err1;
-  }
+    strm.next_in = NULL;
+    strm.avail_in = 0;
+    strm.next_out = outbuf;
+    strm.avail_out = sizeof outbuf;
  
-  strm.next_in = NULL;
-  strm.avail_in = 0;
-  strm.next_out = (uint8_t *) data;
-  strm.avail_out = block.uncompressed_size;
+    for (;;) {
+      uint8_t buf[BUFSIZ];
+      lzma_action action = LZMA_RUN;
+
+      if (strm.avail_in == 0) {
+        strm.next_in = buf;
+        n = read (fd, buf, sizeof buf);
+        if (n == -1)
+          error (EXIT_FAILURE, errno, "%s: read", filename);
+        strm.avail_in = n;
+        if (n == 0)
+          action = LZMA_FINISH;
+      }
  
-  do {
-    uint8_t buf[BUFSIZ];
-    lzma_action action = LZMA_RUN;
+      r = lzma_code (&strm, action);
  
-    if (strm.avail_in == 0) {
-      strm.next_in = buf;
-      n = read (xz->fd, buf, sizeof buf);
-      if (n == -1) {
-        nbdkit_error ("read: %m");
-        goto err2;
+      if (strm.avail_out == 0 || r == LZMA_STREAM_END) {
+        size_t wsz = sizeof outbuf - strm.avail_out;
+        if (write (ofd, outbuf, wsz) != wsz)
+          /* XXX Handle short writes. */
+          error (EXIT_FAILURE, errno, "%s: write", filename);
+        strm.next_out = outbuf;
+        strm.avail_out = sizeof outbuf;
        }
-      strm.avail_in = n;
-      if (n == 0)
-        action = LZMA_FINISH;
+
+      if (r == LZMA_STREAM_END)
+        break;
+      if (r != LZMA_OK)
+        error (EXIT_FAILURE, 0,
+               "%s: could not parse block data (error %d)", filename, r);
      }
  
-    strm.avail_in = n;
-    strm.next_in = buf;
-    r = lzma_code (&strm, action);
-  } while (r == LZMA_OK);
+    lzma_end (&strm);
  
-  if (r != LZMA_OK && r != LZMA_STREAM_END) {
-    nbdkit_error ("could not parse block data (error %d)", r);
-    goto err2;
+    for (i = 0; filters[i].id != LZMA_VLI_UNKNOWN; ++i)
+      free (filters[i].options);
    }
-
-  lzma_end (&strm);
-
-  for (i = 0; filters[i].id != LZMA_VLI_UNKNOWN; ++i)
-    free (filters[i].options);
-
-  return data;
-
- err2:
-  free (data);
-  lzma_end (&strm);
- err1:
-  for (i = 0; filters[i].id != LZMA_VLI_UNKNOWN; ++i)
-    free (filters[i].options);
-
-  return NULL;
  }
-#endif
author	Richard W.M. Jones <rjones@redhat.com>
	Mon, 21 Oct 2013 12:59:16 +0000 (13:59 +0100)
committer	Richard W.M. Jones <rjones@redhat.com>
	Mon, 21 Oct 2013 12:59:16 +0000 (13:59 +0100)
configure.ac		patch \| blob \| history
pxzcat.c		patch \| blob \| history