Home | History | Annotate | Line # | Download | only in vndcompress
vndcompress.c revision 1.15
      1  1.14  riastrad /*	$NetBSD: vndcompress.c,v 1.15 2014/01/22 06:14:46 riastradh Exp $	*/
      2   1.1   hubertf 
      3   1.8  riastrad /*-
      4   1.8  riastrad  * Copyright (c) 2013 The NetBSD Foundation, Inc.
      5   1.1   hubertf  * All rights reserved.
      6   1.1   hubertf  *
      7   1.8  riastrad  * This code is derived from software contributed to The NetBSD Foundation
      8   1.8  riastrad  * by Taylor R. Campbell.
      9   1.8  riastrad  *
     10   1.1   hubertf  * Redistribution and use in source and binary forms, with or without
     11   1.1   hubertf  * modification, are permitted provided that the following conditions
     12   1.1   hubertf  * are met:
     13   1.1   hubertf  * 1. Redistributions of source code must retain the above copyright
     14   1.1   hubertf  *    notice, this list of conditions and the following disclaimer.
     15   1.1   hubertf  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1   hubertf  *    notice, this list of conditions and the following disclaimer in the
     17   1.1   hubertf  *    documentation and/or other materials provided with the distribution.
     18   1.1   hubertf  *
     19   1.8  riastrad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.8  riastrad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.1   hubertf  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.1   hubertf  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.1   hubertf  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.1   hubertf  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.1   hubertf  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.1   hubertf  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.1   hubertf  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.1   hubertf  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.1   hubertf  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1   hubertf  */
     31   1.8  riastrad 
     32   1.8  riastrad #include <sys/cdefs.h>
     33  1.14  riastrad __RCSID("$NetBSD: vndcompress.c,v 1.15 2014/01/22 06:14:46 riastradh Exp $");
     34   1.8  riastrad 
     35   1.8  riastrad #include <sys/endian.h>
     36   1.8  riastrad 
     37   1.8  riastrad #include <assert.h>
     38   1.1   hubertf #include <err.h>
     39   1.8  riastrad #include <errno.h>
     40   1.1   hubertf #include <fcntl.h>
     41   1.5     lukem #include <inttypes.h>
     42   1.8  riastrad #include <limits.h>
     43   1.8  riastrad #include <signal.h>
     44   1.8  riastrad #include <stdbool.h>
     45   1.8  riastrad #include <stdint.h>
     46   1.1   hubertf #include <stdio.h>
     47   1.1   hubertf #include <stdlib.h>
     48   1.1   hubertf #include <string.h>
     49   1.1   hubertf #include <unistd.h>
     50   1.1   hubertf #include <zlib.h>
     51   1.1   hubertf 
     52   1.8  riastrad #include "common.h"
     53  1.15  riastrad #include "offtab.h"
     54  1.14  riastrad #include "utils.h"
     55   1.8  riastrad 
     56   1.8  riastrad /*
     57   1.8  riastrad  * XXX Switch to control bug-for-bug byte-for-byte compatibility with
     58   1.8  riastrad  * NetBSD's vndcompress.
     59   1.8  riastrad  */
     60   1.8  riastrad #define	VNDCOMPRESS_COMPAT	0
     61   1.8  riastrad 
                        /*
                         * The offset table is expected to start immediately after the
                         * cloop2 header: the header's size must equal the table's offset.
                         */
     62   1.8  riastrad __CTASSERT(sizeof(struct cloop2_header) == CLOOP2_OFFSET_TABLE_OFFSET);
     63   1.8  riastrad 
     64   1.8  riastrad struct compress_state {
                        	/*
                        	 * State of one compression run.  A single global instance is
                        	 * used so that the signal handlers can read it.
                        	 */
     65   1.8  riastrad 	uint64_t	size;		/* uncompressed size */
     66   1.8  riastrad 	uint64_t	offset;		/* output byte offset */
     67   1.8  riastrad 	uint32_t	blocksize;	/* bytes per block */
     68   1.8  riastrad 	uint32_t	blkno;		/* input block number */
     69   1.8  riastrad 	uint32_t	n_full_blocks;	/* floor(size/blocksize) */
     70   1.8  riastrad 	uint32_t	n_blocks;	/* ceiling(size/blocksize) */
     71   1.8  riastrad 	uint32_t	n_offsets;	/* n_blocks + 1 */
     72   1.8  riastrad 	uint32_t	end_block;	/* last block to transfer; 0 = no limit */
     73   1.8  riastrad 	uint32_t	checkpoint_blocks;	/* blocks before checkpoint */
     74   1.8  riastrad 	int		image_fd;	/* input image, opened read-only */
     75   1.8  riastrad 	int		cloop2_fd;	/* output cloop2 file */
     76  1.15  riastrad 	struct offtab	offtab;		/* table of block end offsets */
     77   1.8  riastrad 	uint32_t	n_checkpointed_blocks;	/* reported as checkpointed */
     78   1.8  riastrad 	volatile sig_atomic_t
     79   1.8  riastrad 			initialized;	/* everything above initialized?  */
     80   1.8  riastrad };
     81   1.8  riastrad 
     82   1.8  riastrad /* Global compression state, read by the info and checkpoint signal handlers.  */
     83   1.8  riastrad static struct compress_state	global_state;
     84   1.8  riastrad 
     85   1.8  riastrad struct sigdesc {
     86   1.8  riastrad 	int sd_signo;		/* signal number */
     87   1.8  riastrad 	const char *sd_name;	/* name used in the sigaction error message */
     88   1.8  riastrad };
     89   1.1   hubertf 
                        /* Signals that are routed to info_signal_handler.  */
     90   1.8  riastrad static const struct sigdesc info_signals[] = {
     91   1.8  riastrad 	{ SIGINFO, "SIGINFO" },
     92   1.8  riastrad 	{ SIGUSR1, "SIGUSR1" },
     93   1.1   hubertf };
     94   1.1   hubertf 
                        /* Signals that are routed to checkpoint_signal_handler.  */
     95   1.8  riastrad static const struct sigdesc checkpoint_signals[] = {
     96   1.8  riastrad 	{ SIGUSR2, "SIGUSR2" },
     97   1.8  riastrad };
     98   1.8  riastrad 
     99   1.8  riastrad static void	init_signals(void);
    100   1.8  riastrad static void	init_signal_handler(int, const struct sigdesc *, size_t,
    101   1.8  riastrad 		    void (*)(int));
    102   1.8  riastrad static void	info_signal_handler(int);
    103   1.8  riastrad static void	checkpoint_signal_handler(int);
    104   1.8  riastrad static void	block_signals(sigset_t *);
    105   1.8  riastrad static void	restore_sigmask(const sigset_t *);
    106   1.8  riastrad static void	compress_progress(struct compress_state *);
    107   1.8  riastrad static void	compress_init(int, char **, const struct options *,
    108   1.8  riastrad 		    struct compress_state *);
    109   1.8  riastrad static bool	compress_restart(struct compress_state *);
    110   1.8  riastrad static uint32_t	compress_block(int, int, uint32_t, uint32_t, uint32_t, void *,
    111   1.8  riastrad 		    void *);
    112   1.8  riastrad static void	compress_maybe_checkpoint(struct compress_state *);
    113   1.8  riastrad static void	compress_checkpoint(struct compress_state *);
    114   1.8  riastrad static void	compress_exit(struct compress_state *);
    115   1.8  riastrad 
    116   1.1   hubertf /*
    117   1.8  riastrad  * Compression entry point.
                         *
                         * Sets up the global state from argc/argv and the parsed options O
                         * (see compress_init), then hands the image to compress_block() one
                         * block at a time, recording where each block ends in the offset
                         * table.  When the whole image has been processed the output is
                         * padded to a multiple of DEV_BSIZE.  A final checkpoint is taken
                         * in every case, including an early stop at S->end_block.
                         *
                         * Returns 0.  Failures are reported through err(3)/errx(3), not
                         * through the return value.
    118   1.1   hubertf  */
    119   1.8  riastrad int
    120   1.8  riastrad vndcompress(int argc, char **argv, const struct options *O)
    121   1.8  riastrad {
    122   1.8  riastrad 	struct compress_state *const S = &global_state;
    123   1.8  riastrad 
    124   1.8  riastrad 	/* Paranoia.  The other fields either have no sentinel or use zero.  */
    125   1.8  riastrad 	S->image_fd = -1;
    126   1.8  riastrad 	S->cloop2_fd = -1;
    127   1.8  riastrad 
    128   1.8  riastrad 	/* Set up signal handlers so we can handle SIGINFO ASAP.  */
    129   1.8  riastrad 	init_signals();
    130   1.8  riastrad 
    131   1.8  riastrad 	/*
    132   1.8  riastrad 	 * Parse the arguments to initialize our state.
    133   1.8  riastrad 	 */
    134   1.8  riastrad 	compress_init(argc, argv, O, S);
    135   1.8  riastrad 	assert(MIN_BLOCKSIZE <= S->blocksize);
    136   1.8  riastrad 	assert(S->blocksize <= MAX_BLOCKSIZE);
    137   1.8  riastrad 
    138   1.8  riastrad 	/*
    139   1.8  riastrad 	 * Allocate compression buffers.
    140   1.8  riastrad 	 *
    141   1.8  riastrad 	 * Compression may actually expand.  From an overabundance of
    142   1.8  riastrad 	 * caution, assume it can expand by at most double.
    143   1.8  riastrad 	 *
    144   1.8  riastrad 	 * XXX Check and consider tightening this assumption.
    145   1.8  riastrad 	 */
    146   1.8  riastrad 	__CTASSERT(MAX_BLOCKSIZE <= SIZE_MAX);
    147   1.8  riastrad 	void *const uncompbuf = malloc(S->blocksize);
    148   1.8  riastrad 	if (uncompbuf == NULL)
    149   1.8  riastrad 		err(1, "malloc uncompressed buffer");
    150   1.8  riastrad 
    151   1.8  riastrad 	/* XXX compression ratio bound */
    152   1.8  riastrad 	__CTASSERT(MAX_BLOCKSIZE <= (SIZE_MAX / 2));
    153   1.8  riastrad 	void *const compbuf = malloc(2 * (size_t)S->blocksize);
    154   1.8  riastrad 	if (compbuf == NULL)
    155   1.8  riastrad 		err(1, "malloc compressed buffer");
    156   1.8  riastrad 
    157   1.8  riastrad 	/*
    158   1.8  riastrad 	 * Compress the blocks.  S->blkno specifies the input block
    159   1.8  riastrad 	 * we're about to transfer.  S->offset is the current output
    160   1.8  riastrad 	 * offset.
    161   1.8  riastrad 	 */
    162   1.8  riastrad 	while (S->blkno < S->n_blocks) {
    163   1.8  riastrad 		/* Report any progress.  */
    164   1.8  riastrad 		compress_progress(S);
    165   1.8  riastrad 
    166   1.8  riastrad 		/* Stop if we've done the requested partial transfer.  */
                        		/*
                        		 * An end_block of zero means no limit.  Jumping to `out'
                        		 * skips the final padding but still takes the last
                        		 * checkpoint.
                        		 */
    167   1.8  riastrad 		if ((0 < S->end_block) && (S->end_block <= S->blkno))
    168   1.8  riastrad 			goto out;
    169   1.8  riastrad 
    170   1.8  riastrad 		/* Checkpoint if appropriate.  */
    171   1.8  riastrad 		compress_maybe_checkpoint(S);
    172  1.15  riastrad 		offtab_prepare_put(&S->offtab, (S->blkno + 1));
    173   1.8  riastrad 
    174   1.8  riastrad 		/* Choose read size: partial if last block, full if not.  */
                        		/*
                        		 * Inside this loop blkno == n_full_blocks can only hold
                        		 * when the image ends in a partial block, so the
                        		 * remainder below is nonzero (asserted right after).
                        		 */
    175   1.8  riastrad 		const uint32_t readsize = (S->blkno == S->n_full_blocks?
    176   1.8  riastrad 		    (S->size % S->blocksize) : S->blocksize);
    177   1.8  riastrad 		assert(readsize > 0);
    178   1.8  riastrad 		assert(readsize <= S->blocksize);
    179   1.8  riastrad 
    180   1.8  riastrad 		/* Fail noisily if we might be about to overflow.  */
    181   1.8  riastrad 		/* XXX compression ratio bound */
    182   1.8  riastrad 		__CTASSERT(MAX_BLOCKSIZE <= (UINTMAX_MAX / 2));
    183   1.8  riastrad 		assert(S->offset <= MIN(UINT64_MAX, OFF_MAX));
    184   1.8  riastrad 		if ((2 * (uintmax_t)readsize) >
    185   1.8  riastrad 		    (MIN(UINT64_MAX, OFF_MAX) - S->offset))
    186   1.8  riastrad 			errx(1, "blkno %"PRIu32" may overflow: %ju + 2*%ju",
    187   1.8  riastrad 			    S->blkno, (uintmax_t)S->offset,
    188   1.8  riastrad 			    (uintmax_t)readsize);
    189   1.8  riastrad 
    190   1.8  riastrad 		/* Process the block.  */
    191   1.8  riastrad 		const uint32_t complen =
    192   1.8  riastrad 		    compress_block(S->image_fd, S->cloop2_fd, S->blkno,
    193   1.8  riastrad 			S->blocksize, readsize, uncompbuf, compbuf);
    194   1.8  riastrad 
    195   1.8  riastrad 		/*
    196   1.8  riastrad 		 * Signal-atomically update the state to reflect
    197   1.8  riastrad 		 * (a) what block number we are now at,
    198   1.8  riastrad 		 * (b) how far we are now in the output file, and
    199   1.8  riastrad 		 * (c) where the last block ended.
    200   1.8  riastrad 		 */
    201   1.8  riastrad 		assert(S->blkno <= (UINT32_MAX - 1));
    202   1.8  riastrad 		assert(complen <= (MIN(UINT64_MAX, OFF_MAX) - S->offset));
    203   1.8  riastrad 		assert((S->blkno + 1) < S->n_offsets);
    204   1.8  riastrad 	    {
    205   1.8  riastrad 		sigset_t old_sigmask;
    206   1.8  riastrad 		block_signals(&old_sigmask);
    207   1.8  riastrad 		S->blkno += 1;					/* (a) */
    208   1.8  riastrad 		S->offset += complen;				/* (b) */
    209  1.15  riastrad 		offtab_put(&S->offtab, S->blkno, S->offset);	/* (c) */
    210   1.8  riastrad 		restore_sigmask(&old_sigmask);
    211   1.8  riastrad 	    }
    212   1.8  riastrad 	}
    213   1.8  riastrad 
    214   1.8  riastrad 	/* Make sure we're all done. */
    215   1.8  riastrad 	assert(S->blkno == S->n_blocks);
    216   1.8  riastrad 	assert((S->blkno + 1) == S->n_offsets);
    217   1.8  riastrad 
    218   1.8  riastrad 	/* Pad to the disk block size.  */
    219   1.8  riastrad 	const uint32_t n_extra = (S->offset % DEV_BSIZE);
    220   1.8  riastrad 	if (n_extra != 0) {
    221   1.8  riastrad 		const uint32_t n_padding = (DEV_BSIZE - n_extra);
    222   1.8  riastrad 		/* Reuse compbuf -- guaranteed to be large enough.  */
                        		/*
                        		 * n_padding is smaller than DEV_BSIZE, while compbuf holds
                        		 * 2 * blocksize bytes and compress_init only accepts block
                        		 * sizes that are multiples of DEV_BSIZE.
                        		 */
    223   1.8  riastrad 		(void)memset(compbuf, 0, n_padding);
    224   1.8  riastrad 		const ssize_t n_written = write(S->cloop2_fd, compbuf,
    225   1.8  riastrad 		    n_padding);
    226   1.8  riastrad 		if (n_written == -1)
    227   1.8  riastrad 			err(1, "write final padding failed");
    228   1.8  riastrad 		assert(n_written >= 0);
    229   1.8  riastrad 		if ((size_t)n_written != n_padding)
    230   1.8  riastrad 			errx(1, "partial write of final padding bytes"
    231  1.13  riastrad 			    ": %zu != %"PRIu32,
    232  1.13  riastrad 			    (size_t)n_written, n_padding);
    233   1.8  riastrad 
    234   1.8  riastrad 		/* Account for the extra bytes in the output file.  */
    235   1.8  riastrad 		assert(n_padding <= (MIN(UINT64_MAX, OFF_MAX) - S->offset));
    236   1.8  riastrad 	    {
    237   1.8  riastrad 		sigset_t old_sigmask;
    238   1.8  riastrad 		block_signals(&old_sigmask);
    239   1.8  riastrad 		S->offset += n_padding;
    240   1.8  riastrad 		restore_sigmask(&old_sigmask);
    241   1.8  riastrad 	    }
    242   1.8  riastrad 	}
    243   1.8  riastrad 
    244   1.8  riastrad out:
    245  1.15  riastrad 	/* One last checkpoint to commit the offset table.  */
    246   1.8  riastrad 	assert(S->offset <= OFF_MAX);
    247   1.8  riastrad 	assert((off_t)S->offset == lseek(S->cloop2_fd, 0, SEEK_CUR));
    248   1.8  riastrad 	compress_checkpoint(S);
    249   1.8  riastrad 
    250   1.8  riastrad 	/*
    251   1.8  riastrad 	 * Free the compression buffers and finalize the compression.
    252   1.8  riastrad 	 */
    253   1.8  riastrad 	free(compbuf);
    254   1.8  riastrad 	free(uncompbuf);
    255   1.8  riastrad 	compress_exit(S);
    256   1.1   hubertf 
    257   1.8  riastrad 	return 0;
    258   1.8  riastrad }
    259   1.1   hubertf 
    260   1.1   hubertf /*
    261   1.8  riastrad  * Signal cruft.
    262   1.1   hubertf  */
    263   1.8  riastrad 
    264   1.8  riastrad static void
    265   1.8  riastrad init_signals(void)
    266   1.8  riastrad {
    267   1.8  riastrad 
    268   1.8  riastrad 	init_signal_handler(SA_RESTART, info_signals,
    269   1.8  riastrad 	    __arraycount(info_signals), &info_signal_handler);
    270   1.8  riastrad 	init_signal_handler(SA_RESTART, checkpoint_signals,
    271   1.8  riastrad 	    __arraycount(checkpoint_signals), &checkpoint_signal_handler);
    272   1.8  riastrad }
    273   1.8  riastrad 
    274   1.8  riastrad static void
    275   1.8  riastrad init_signal_handler(int flags, const struct sigdesc *signals, size_t n,
    276   1.8  riastrad     void (*handler)(int))
    277   1.1   hubertf {
    278   1.8  riastrad 	static const struct sigaction zero_sa;
    279   1.8  riastrad 	struct sigaction sa = zero_sa;
    280   1.8  riastrad 	size_t i;
    281   1.8  riastrad 
    282   1.8  riastrad 	(void)sigemptyset(&sa.sa_mask);
    283   1.8  riastrad 	for (i = 0; i < n; i++)
    284   1.8  riastrad 		(void)sigaddset(&sa.sa_mask, signals[i].sd_signo);
    285   1.8  riastrad 	sa.sa_flags = flags;
    286   1.8  riastrad 	sa.sa_handler = handler;
    287   1.8  riastrad 	for (i = 0; i < n; i++)
    288   1.8  riastrad 		if (sigaction(signals[i].sd_signo, &sa, NULL) == -1)
    289   1.8  riastrad 			err(1, "sigaction(%s)", signals[i].sd_name);
    290   1.8  riastrad }
    291   1.8  riastrad 
    292   1.8  riastrad static void
    293   1.8  riastrad info_signal_handler(int signo __unused)
    294   1.8  riastrad {
    295   1.8  riastrad 	/* Save errno.  */
    296   1.8  riastrad 	const int error = errno;
    297   1.8  riastrad 	struct compress_state *const S = &global_state;
    298   1.8  riastrad 	char buf[128];
    299   1.8  riastrad 
    300   1.8  riastrad 	/* Bail if the state is not yet initialized.  */
    301   1.8  riastrad 	if (!S->initialized) {
    302   1.8  riastrad 		warnx_ss("initializing");
    303   1.8  riastrad 		goto out;
    304   1.8  riastrad 	}
    305   1.8  riastrad 
    306   1.8  riastrad 	/* Carefully calculate our I/O position.  */
    307   1.8  riastrad 	assert(S->blocksize > 0);
    308   1.8  riastrad 	__CTASSERT(MAX_N_BLOCKS <= (UINT64_MAX / MAX_BLOCKSIZE));
    309   1.8  riastrad 	const uint64_t nread = ((uint64_t)S->blkno * (uint64_t)S->blocksize);
    310   1.8  riastrad 
    311   1.8  riastrad 	assert(S->n_blocks > 0);
    312   1.8  riastrad 	__CTASSERT(MAX_N_BLOCKS <= ((UINT64_MAX / sizeof(uint64_t)) -
    313   1.8  riastrad 		CLOOP2_OFFSET_TABLE_OFFSET));
    314   1.8  riastrad 	const uint64_t nwritten = (S->offset <= (CLOOP2_OFFSET_TABLE_OFFSET +
    315   1.8  riastrad 		(S->n_blocks * sizeof(uint64_t)))?
    316   1.8  riastrad 	    0 : S->offset);
    317   1.8  riastrad 
    318   1.8  riastrad 	/* snprintf_ss can't do floating-point, so do fixed-point instead.  */
    319   1.8  riastrad 	const uint64_t ratio_percent =
    320   1.8  riastrad 	    (nread > 0?
    321   1.8  riastrad 		((nwritten >= (UINT64_MAX / 100)) ?
    322   1.8  riastrad 		    ((nwritten / nread) * 100) : ((nwritten * 100) / nread))
    323   1.8  riastrad 		: 0);
    324   1.8  riastrad 
    325   1.8  riastrad 	/* Format the status.  */
    326   1.8  riastrad 	assert(S->n_checkpointed_blocks <= (UINT64_MAX / S->blocksize));
    327   1.8  riastrad 	const int n = snprintf_ss(buf, sizeof(buf),
    328   1.8  riastrad 	    "vndcompress: read %"PRIu64" bytes, wrote %"PRIu64" bytes, "
    329   1.8  riastrad 	    "compression ratio %"PRIu64"%% (checkpointed %"PRIu64" bytes)\n",
    330   1.8  riastrad 	    nread, nwritten, ratio_percent,
    331   1.8  riastrad 	    ((uint64_t)S->n_checkpointed_blocks * (uint64_t)S->blocksize));
    332   1.8  riastrad 	if (n < 0) {
    333   1.8  riastrad 		const char msg[] = "vndcompress: can't format info\n";
    334   1.8  riastrad 		(void)write(STDERR_FILENO, msg, __arraycount(msg));
    335   1.1   hubertf 	} else {
    336   1.8  riastrad 		__CTASSERT(INT_MAX <= SIZE_MAX);
    337   1.8  riastrad 		(void)write(STDERR_FILENO, buf, (size_t)n);
    338   1.8  riastrad 	}
    339   1.8  riastrad 
    340   1.8  riastrad out:
    341   1.8  riastrad 	/* Restore errno.  */
    342   1.8  riastrad 	errno = error;
    343   1.8  riastrad }
    344   1.8  riastrad 
    345   1.8  riastrad static void
    346   1.8  riastrad checkpoint_signal_handler(int signo __unused)
    347   1.8  riastrad {
    348   1.8  riastrad 	/* Save errno.  */
    349   1.8  riastrad 	const int error = errno;
    350   1.8  riastrad 	struct compress_state *const S = &global_state;
    351   1.8  riastrad 
    352   1.8  riastrad 	/* Bail if the state is not yet initialized.  */
    353   1.8  riastrad 	if (!S->initialized) {
    354   1.8  riastrad 		warnx_ss("nothing to checkpoint yet");
    355   1.8  riastrad 		goto out;
    356   1.1   hubertf 	}
    357   1.8  riastrad 
    358   1.8  riastrad 	assert(S->image_fd >= 0);
    359   1.8  riastrad 	assert(S->cloop2_fd >= 0);
    360   1.8  riastrad 
    361   1.8  riastrad 	/* Take a checkpoint.  */
    362   1.8  riastrad 	assert(S->blocksize > 0);
    363   1.8  riastrad 	assert(S->blkno <= (UINT64_MAX / S->blocksize));
    364   1.8  riastrad 	warnx_ss("checkpointing %"PRIu64" bytes",
    365   1.8  riastrad 	    ((uint64_t)S->blkno * (uint64_t)S->blocksize));
    366   1.8  riastrad 	compress_checkpoint(S);
    367   1.8  riastrad 
    368   1.8  riastrad out:
    369   1.8  riastrad 	/* Restore errno.  */
    370   1.8  riastrad 	errno = error;
    371   1.8  riastrad }
    372   1.8  riastrad 
    373   1.8  riastrad static void
    374   1.8  riastrad block_signals(sigset_t *old_sigmask)
    375   1.8  riastrad {
    376   1.8  riastrad 	sigset_t block;
    377   1.8  riastrad 
    378   1.8  riastrad 	(void)sigfillset(&block);
    379   1.8  riastrad 	(void)sigprocmask(SIG_BLOCK, &block, old_sigmask);
    380   1.8  riastrad }
    381   1.8  riastrad 
    382   1.8  riastrad static void
    383   1.8  riastrad restore_sigmask(const sigset_t *sigmask)
    384   1.8  riastrad {
    385   1.8  riastrad 
    386   1.8  riastrad 	(void)sigprocmask(SIG_SETMASK, sigmask, NULL);
    387   1.8  riastrad }
    388   1.8  riastrad 
    389   1.8  riastrad /*
    390   1.8  riastrad  * Report progress.
    391   1.8  riastrad  *
                         * Called once per block at the top of the main loop in
                         * vndcompress().  Currently a placeholder that does nothing.
                         *
    392   1.8  riastrad  * XXX Should do a progress bar here.
    393   1.8  riastrad  */
    394   1.8  riastrad static void
    395   1.8  riastrad compress_progress(struct compress_state *S __unused)
    396   1.8  riastrad {
    397   1.1   hubertf }
    398   1.1   hubertf 
    399   1.1   hubertf /*
    400   1.8  riastrad  * Parse arguments, open the files, and initialize the state.
    401   1.1   hubertf  */
    402   1.7     joerg static void
    403   1.8  riastrad compress_init(int argc, char **argv, const struct options *O,
    404   1.8  riastrad     struct compress_state *S)
    405   1.8  riastrad {
    406   1.8  riastrad 
    407   1.8  riastrad 	if (!((argc == 2) || (argc == 3)))
    408   1.8  riastrad 		usage();
    409   1.8  riastrad 
    410   1.8  riastrad 	const char *const image_pathname = argv[0];
    411   1.8  riastrad 	const char *const cloop2_pathname = argv[1];
    412   1.8  riastrad 
    413   1.8  riastrad 	/* Grab the block size either from `-s' or from the last argument.  */
    414   1.8  riastrad 	__CTASSERT(0 < DEV_BSIZE);
    415   1.8  riastrad 	__CTASSERT((MIN_BLOCKSIZE % DEV_BSIZE) == 0);
    416   1.8  riastrad 	__CTASSERT(MIN_BLOCKSIZE <= DEF_BLOCKSIZE);
    417   1.8  riastrad 	__CTASSERT((DEF_BLOCKSIZE % DEV_BSIZE) == 0);
    418   1.8  riastrad 	__CTASSERT(DEF_BLOCKSIZE <= MAX_BLOCKSIZE);
    419   1.8  riastrad 	__CTASSERT((MAX_BLOCKSIZE % DEV_BSIZE) == 0);
    420   1.8  riastrad 	if (ISSET(O->flags, FLAG_s)) {
    421   1.8  riastrad 		if (argc == 3) {
    422   1.8  riastrad 			warnx("use -s or the extra argument, not both");
    423   1.8  riastrad 			usage();
    424   1.8  riastrad 		}
    425   1.8  riastrad 		S->blocksize = O->blocksize;
    426   1.8  riastrad 	} else {
    427   1.8  riastrad 		S->blocksize = (argc == 2? DEF_BLOCKSIZE :
    428   1.8  riastrad 		    strsuftoll("block size", argv[2], MIN_BLOCKSIZE,
    429   1.8  riastrad 			MAX_BLOCKSIZE));
    430   1.8  riastrad 	}
    431   1.8  riastrad 
    432   1.8  riastrad 	/* Sanity-check the blocksize.  (strsuftoll guarantees bounds.)  */
    433   1.8  riastrad 	__CTASSERT(DEV_BSIZE <= UINT32_MAX);
    434   1.8  riastrad 	if ((S->blocksize % DEV_BSIZE) != 0)
    435   1.8  riastrad 		errx(1, "bad blocksize: %"PRIu32
    436   1.8  riastrad 		    " (not a multiple of %"PRIu32")",
    437   1.8  riastrad 		    S->blocksize, (uint32_t)DEV_BSIZE);
    438   1.8  riastrad 	assert(MIN_BLOCKSIZE <= S->blocksize);
    439   1.8  riastrad 	assert((S->blocksize % DEV_BSIZE) == 0);
    440   1.8  riastrad 	assert(S->blocksize <= MAX_BLOCKSIZE);
    441   1.8  riastrad 
    442   1.8  riastrad 	/* Grab the end block number if we have one.  */
    443   1.8  riastrad 	S->end_block = (ISSET(O->flags, FLAG_p)? O->end_block : 0);
    444   1.8  riastrad 
    445   1.8  riastrad 	/* Grab the checkpoint block count, if we have one.  */
    446   1.8  riastrad 	S->checkpoint_blocks =
    447   1.8  riastrad 	    (ISSET(O->flags, FLAG_k)? O->checkpoint_blocks : 0);
    448   1.8  riastrad 
    449   1.8  riastrad 	/* Open the input image file and the output cloop2 file.  */
    450   1.8  riastrad 	S->image_fd = open(image_pathname, O_RDONLY);
    451   1.8  riastrad 	if (S->image_fd == -1)
    452   1.8  riastrad 		err(1, "open(%s)", image_pathname);
    453   1.8  riastrad 
    454   1.8  riastrad 	int oflags;
    455   1.8  riastrad 	if (!ISSET(O->flags, FLAG_r))
    456   1.8  riastrad 		oflags = (O_WRONLY | O_TRUNC | O_CREAT); /* XXX O_EXCL?  */
    457   1.8  riastrad 	else if (!ISSET(O->flags, FLAG_R))
    458   1.8  riastrad 		oflags = (O_RDWR | O_CREAT);
    459   1.8  riastrad 	else
    460   1.8  riastrad 		oflags = O_RDWR;
    461   1.8  riastrad 	S->cloop2_fd = open(cloop2_pathname, oflags, 0777);
    462   1.8  riastrad 	if (S->cloop2_fd == -1)
    463   1.8  riastrad 		err(1, "open(%s)", cloop2_pathname);
    464   1.8  riastrad 
    465   1.8  riastrad 	/* Find the size of the input image.  */
    466   1.8  riastrad 	if (ISSET(O->flags, FLAG_l)) {
    467   1.8  riastrad 		S->size = O->length;
    468   1.8  riastrad 	} else {
    469   1.8  riastrad 		static const struct stat zero_st;
    470   1.8  riastrad 		struct stat st = zero_st;
    471   1.8  riastrad 		if (fstat(S->image_fd, &st) == -1)
    472   1.8  riastrad 			err(1, "stat(%s)", image_pathname);
    473   1.8  riastrad 		if (st.st_size <= 0)
    474   1.8  riastrad 			errx(1, "unknown image size");
    475   1.8  riastrad 		assert(st.st_size >= 0);
    476   1.8  riastrad 		__CTASSERT(OFF_MAX <= UINT64_MAX);
    477   1.8  riastrad 		assert(__type_fit(uint64_t, st.st_size));
    478   1.8  riastrad 		S->size = st.st_size;
    479   1.8  riastrad 	}
    480   1.8  riastrad 	assert(S->size <= OFF_MAX);
    481   1.8  riastrad 
    482   1.8  riastrad 	/* Find number of full blocks and whether there's a partial block.  */
    483   1.8  riastrad 	S->n_full_blocks = (S->size / S->blocksize);
    484   1.8  riastrad 	assert(S->n_full_blocks <=
    485   1.8  riastrad 	    (UINT32_MAX - ((S->size % S->blocksize) > 0)));
    486   1.8  riastrad 	S->n_blocks = (S->n_full_blocks + ((S->size % S->blocksize) > 0));
    487   1.8  riastrad 	assert(S->n_full_blocks <= S->n_blocks);
    488   1.8  riastrad 
    489   1.8  riastrad 	if (S->n_blocks > MAX_N_BLOCKS)
    490   1.8  riastrad 		errx(1, "image too large for block size %"PRIu32": %"PRIu64,
    491   1.8  riastrad 		    S->blocksize, S->size);
    492   1.8  riastrad 	assert(S->n_blocks <= MAX_N_BLOCKS);
    493   1.8  riastrad 
    494  1.15  riastrad 	/* Create an offset table for the blocks; one extra for the end.  */
    495   1.8  riastrad 	__CTASSERT(MAX_N_BLOCKS <= (UINT32_MAX - 1));
    496   1.8  riastrad 	S->n_offsets = (S->n_blocks + 1);
    497   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS == (MAX_N_BLOCKS + 1));
    498   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS <= (SIZE_MAX / sizeof(uint64_t)));
    499  1.15  riastrad 	offtab_init(&S->offtab, S->n_offsets, S->cloop2_fd,
    500  1.15  riastrad 	    CLOOP2_OFFSET_TABLE_OFFSET);
    501   1.8  riastrad 
    502   1.8  riastrad 	/* Attempt to restart a partial transfer if requested.  */
    503   1.8  riastrad 	if (ISSET(O->flags, FLAG_r)) {
    504   1.8  riastrad 		if (compress_restart(S)) {
    505   1.8  riastrad 			/*
    506   1.8  riastrad 			 * Restart succeeded.  Truncate the output
    507   1.8  riastrad 			 * here, in case any garbage got appended.  We
    508   1.8  riastrad 			 * are committed to making progress at this
    509   1.8  riastrad 			 * point.  If the ftruncate fails, we don't
    510   1.8  riastrad 			 * lose anything valuable -- this is the last
    511   1.8  riastrad 			 * point at which we can restart anyway.
    512   1.8  riastrad 			 */
    513   1.8  riastrad 			if (ftruncate(S->cloop2_fd, S->offset) == -1)
    514   1.8  riastrad 				err(1, "ftruncate failed");
    515   1.8  riastrad 
    516   1.8  riastrad 			/* All set!  No more initialization to do.  */
    517   1.8  riastrad 			return;
    518   1.8  riastrad 		} else {
    519   1.8  riastrad 			/* Restart failed.  Barf now if requested.  */
    520   1.8  riastrad 			if (ISSET(O->flags, FLAG_R))
    521   1.8  riastrad 				errx(1, "restart failed, aborting");
    522   1.8  riastrad 
    523   1.8  riastrad 			/* Otherwise, truncate and start at the top.  */
    524   1.8  riastrad 			if (ftruncate(S->cloop2_fd, 0) == -1)
    525   1.8  riastrad 				err(1, "truncate failed");
    526   1.8  riastrad 			if (lseek(S->cloop2_fd, 0, SEEK_SET) == -1)
    527   1.8  riastrad 				err(1, "lseek to cloop2 beginning failed");
    528   1.8  riastrad 			if (lseek(S->image_fd, 0, SEEK_SET) == -1)
    529   1.8  riastrad 				err(1, "lseek to image beginning failed");
    530   1.8  riastrad 		}
    531   1.8  riastrad 	}
    532   1.8  riastrad 
    533   1.8  riastrad 	/* Write a bogus (zero) header for now, until we checkpoint.  */
    534   1.8  riastrad 	static const struct cloop2_header zero_header;
    535   1.8  riastrad 	const ssize_t h_written = write(S->cloop2_fd, &zero_header,
    536   1.8  riastrad 	    sizeof(zero_header));
    537   1.8  riastrad 	if (h_written == -1)
    538   1.8  riastrad 		err(1, "write header");
    539   1.8  riastrad 	assert(h_written >= 0);
    540   1.8  riastrad 	if ((size_t)h_written != sizeof(zero_header))
    541  1.13  riastrad 		errx(1, "partial write of header: %zu != %zu",
    542  1.13  riastrad 		    (size_t)h_written, sizeof(zero_header));
    543   1.8  riastrad 
    544  1.15  riastrad 	/* Reset the offset table to be empty and write it.  */
    545  1.15  riastrad 	offtab_reset_write(&S->offtab);
    546   1.8  riastrad 
    547   1.8  riastrad 	/* Start at the beginning of the image.  */
    548   1.8  riastrad 	S->blkno = 0;
    549   1.8  riastrad 	S->offset = (sizeof(struct cloop2_header) +
    550   1.8  riastrad 	    (S->n_offsets * sizeof(uint64_t)));
    551   1.8  riastrad 	S->n_checkpointed_blocks = 0;
    552   1.8  riastrad 
    553   1.8  riastrad 	/* Good to go and ready for interruption by a signal.  */
    554   1.8  riastrad 	S->initialized = 1;
    555   1.8  riastrad }
    556   1.8  riastrad 
    557   1.8  riastrad /*
    558   1.8  riastrad  * Try to recover state from an existing output file.
    559   1.8  riastrad  *
    560  1.15  riastrad  * On success, fill the offset table with what's in the file, set
    561   1.8  riastrad  * S->blkno and S->offset to reflect our position, and seek to the
    562   1.8  riastrad  * respective positions in the input and output files.
    563   1.8  riastrad  *
    564  1.15  riastrad  * On failure, return false.  May clobber the offset table, S->blkno,
    565   1.8  riastrad  * S->offset, and the file pointers.
    566   1.8  riastrad  */
    567   1.8  riastrad static bool
    568   1.8  riastrad compress_restart(struct compress_state *S)
    569   1.8  riastrad {
    570   1.8  riastrad 
    571   1.8  riastrad 	/* Read in the header.  */
    572   1.8  riastrad 	static const struct cloop2_header zero_header;
    573   1.8  riastrad 	struct cloop2_header header = zero_header;
    574   1.8  riastrad 
    575   1.8  riastrad 	const ssize_t h_read = read_block(S->cloop2_fd, &header,
    576   1.8  riastrad 	    sizeof(header));
    577   1.8  riastrad 	if (h_read == -1) {
    578   1.8  riastrad 		warn("failed to read header");
    579   1.8  riastrad 		return false;
    580   1.8  riastrad 	}
    581   1.8  riastrad 	assert(h_read >= 0);
    582   1.8  riastrad 	if ((size_t)h_read != sizeof(header)) {
    583   1.8  riastrad 		warnx("partial read of header");
    584   1.8  riastrad 		return false;
    585   1.8  riastrad 	}
    586   1.8  riastrad 
    587   1.8  riastrad 	/* Check that the header looks like a header.  */
    588   1.8  riastrad 	__CTASSERT(sizeof(cloop2_magic) <= sizeof(header.cl2h_magic));
    589   1.8  riastrad 	if (memcmp(header.cl2h_magic, cloop2_magic, sizeof(cloop2_magic))
    590   1.8  riastrad 	    != 0) {
    591   1.8  riastrad 		warnx("bad cloop2 shell script magic");
    592   1.8  riastrad 		return false;
    593   1.8  riastrad 	}
    594   1.8  riastrad 
    595   1.8  riastrad 	/* Check the header parameters.  */
    596   1.8  riastrad 	if (be32toh(header.cl2h_blocksize) != S->blocksize) {
    597   1.8  riastrad 		warnx("mismatched block size: %"PRIu32
    598   1.8  riastrad 		    " (expected %"PRIu32")",
    599   1.8  riastrad 		    be32toh(header.cl2h_blocksize), S->blocksize);
    600   1.8  riastrad 		return false;
    601   1.8  riastrad 	}
    602   1.8  riastrad 	if (be32toh(header.cl2h_n_blocks) != S->n_blocks) {
    603   1.8  riastrad 		warnx("mismatched number of blocks: %"PRIu32
    604   1.8  riastrad 		    " (expected %"PRIu32")",
    605   1.8  riastrad 		    be32toh(header.cl2h_n_blocks), S->n_blocks);
    606   1.8  riastrad 		return false;
    607   1.8  riastrad 	}
    608   1.8  riastrad 
    609   1.8  riastrad 	/* Read in the partial offset table.  */
    610  1.15  riastrad 	if (!offtab_reset_read(&S->offtab, &warn, &warnx))
    611   1.8  riastrad 		return false;
    612  1.15  riastrad 	if (!offtab_prepare_get(&S->offtab, 0))
    613   1.8  riastrad 		return false;
    614  1.15  riastrad 	const uint64_t first_offset = offtab_get(&S->offtab, 0);
    615  1.15  riastrad 	if (first_offset != (sizeof(struct cloop2_header) +
    616   1.8  riastrad 		(S->n_offsets * sizeof(uint64_t)))) {
    617   1.8  riastrad 		warnx("first offset is not %"PRIu64": %"PRIu64,
    618   1.8  riastrad 		    ((uint64_t)S->n_offsets * sizeof(uint64_t)),
    619  1.15  riastrad 		    first_offset);
    620   1.8  riastrad 		return false;
    621   1.8  riastrad 	}
    622   1.8  riastrad 
    623   1.8  riastrad 	/* Find where we left off.  */
    624   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS <= UINT32_MAX);
    625   1.8  riastrad 	uint32_t blkno = 0;
    626  1.15  riastrad 	uint64_t last_offset = first_offset;
    627   1.8  riastrad 	for (blkno = 0; blkno < S->n_blocks; blkno++) {
    628  1.15  riastrad 		if (!offtab_prepare_get(&S->offtab, blkno))
    629  1.15  riastrad 			return false;
    630  1.15  riastrad 		const uint64_t offset = offtab_get(&S->offtab, blkno);
    631  1.15  riastrad 		if (offset == ~(uint64_t)0)
    632   1.8  riastrad 			break;
    633  1.15  riastrad 
    634   1.8  riastrad 		if (0 < blkno) {
    635  1.15  riastrad 			const uint64_t start = last_offset;
    636  1.15  riastrad 			const uint64_t end = offset;
    637   1.8  riastrad 			if (end <= start) {
    638   1.8  riastrad 				warnx("bad offset table: 0x%"PRIx64
    639   1.8  riastrad 				    ", 0x%"PRIx64, start, end);
    640   1.8  riastrad 				return false;
    641   1.8  riastrad 			}
    642   1.8  riastrad 			/* XXX compression ratio bound */
    643   1.8  riastrad 			__CTASSERT(MAX_BLOCKSIZE <= (SIZE_MAX / 2));
    644   1.8  riastrad 			if ((2 * (size_t)S->blocksize) <= (end - start)) {
    645   1.8  riastrad 				warnx("block %"PRIu32" too large:"
    646   1.8  riastrad 				    " %"PRIu64" bytes",
    647   1.8  riastrad 				    blkno, (end - start));
    648   1.8  riastrad 				return false;
    649   1.8  riastrad 			}
    650   1.8  riastrad 		}
    651  1.15  riastrad 
    652  1.15  riastrad 		last_offset = offset;
    653   1.8  riastrad 	}
    654   1.8  riastrad 
    655   1.8  riastrad 	if (blkno == 0) {
    656   1.8  riastrad 		warnx("no blocks were written; nothing to restart");
    657   1.8  riastrad 		return false;
    658   1.8  riastrad 	}
    659   1.8  riastrad 
    660   1.8  riastrad 	/* Make sure the rest of the offset table is all ones.  */
    661   1.8  riastrad 	if (blkno < S->n_blocks) {
    662   1.8  riastrad 		uint32_t nblkno;
    663   1.8  riastrad 
    664   1.8  riastrad 		for (nblkno = blkno; nblkno < S->n_blocks; nblkno++) {
    665  1.15  riastrad 			if (!offtab_prepare_get(&S->offtab, nblkno))
    666  1.15  riastrad 				return false;
    667  1.15  riastrad 			const uint64_t offset = offtab_get(&S->offtab, nblkno);
    668  1.15  riastrad 			if (offset != ~(uint64_t)0) {
    669   1.8  riastrad 				warnx("bad partial offset table entry"
    670   1.8  riastrad 				    " at %"PRIu32": %"PRIu64,
    671  1.15  riastrad 				    nblkno, offset);
    672   1.8  riastrad 				return false;
    673   1.8  riastrad 			}
    674   1.8  riastrad 		}
    675   1.1   hubertf 	}
    676   1.8  riastrad 
    677   1.1   hubertf 	/*
    678   1.8  riastrad 	 * XXX Consider decompressing some number of blocks to make
    679   1.8  riastrad 	 * sure they match.
    680   1.1   hubertf 	 */
    681   1.8  riastrad 
    682   1.8  riastrad 	/* Back up by one.  */
    683   1.8  riastrad 	assert(1 <= blkno);
    684   1.8  riastrad 	blkno -= 1;
    685   1.8  riastrad 
    686   1.8  riastrad 	/* Seek to the input position.  */
    687   1.8  riastrad 	assert(S->size <= OFF_MAX);
    688   1.8  riastrad 	assert(blkno <= (S->size / S->blocksize));
    689   1.8  riastrad 	const off_t restart_position = ((off_t)blkno * (off_t)S->blocksize);
    690   1.8  riastrad 	assert(0 <= restart_position);
    691   1.8  riastrad 	assert(restart_position <= (off_t)S->size);
    692   1.8  riastrad 	if (lseek(S->image_fd, restart_position, SEEK_SET) == -1) {
    693   1.8  riastrad 		if (errno != ESPIPE) {
    694   1.8  riastrad 			warn("lseek input image failed");
    695   1.8  riastrad 			return false;
    696   1.8  riastrad 		}
    697   1.8  riastrad 
    698   1.8  riastrad 		/* Try read instead of lseek for a pipe/socket/fifo.  */
    699   1.8  riastrad 		void *const buffer = malloc(0x10000);
    700   1.8  riastrad 		if (buffer == NULL)
    701   1.8  riastrad 			err(1, "malloc temporary buffer");
    702   1.8  riastrad 		off_t left = restart_position;
    703   1.8  riastrad 		while (left > 0) {
    704   1.8  riastrad 			const size_t size = MIN(0x10000, left);
    705   1.8  riastrad 			const ssize_t n_read = read_block(S->image_fd, buffer,
    706   1.8  riastrad 			    size);
    707   1.8  riastrad 			if (n_read == -1) {
    708   1.8  riastrad 				free(buffer);
    709   1.8  riastrad 				warn("read of input image failed");
    710   1.8  riastrad 				return false;
    711   1.8  riastrad 			}
    712   1.8  riastrad 			assert(n_read >= 0);
    713   1.8  riastrad 			if ((size_t)n_read != size) {
    714   1.8  riastrad 				free(buffer);
    715   1.8  riastrad 				warnx("partial read of input image");
    716   1.8  riastrad 				return false;
    717   1.1   hubertf 			}
    718   1.8  riastrad 			assert((off_t)size <= left);
    719   1.8  riastrad 			left -= size;
    720   1.1   hubertf 		}
    721   1.8  riastrad 		free(buffer);
    722   1.8  riastrad 	}
    723   1.8  riastrad 
    724   1.8  riastrad 	/* Seek to the output position.  */
    725  1.15  riastrad 	assert(last_offset <= OFF_MAX);
    726  1.15  riastrad 	if (lseek(S->cloop2_fd, last_offset, SEEK_SET) == -1) {
    727  1.15  riastrad 		warn("lseek output cloop2 to %"PRIx64" failed", last_offset);
    728   1.8  riastrad 		return false;
    729   1.1   hubertf 	}
    730   1.8  riastrad 
    731  1.15  riastrad 	/* Switch from reading to writing the offset table.  */
    732  1.15  riastrad 	offtab_transmogrify_read_to_write(&S->offtab);
    733  1.15  riastrad 
    734   1.8  riastrad 	/* Start where we left off.  */
    735   1.8  riastrad 	S->blkno = blkno;
    736  1.15  riastrad 	S->offset = last_offset;
    737   1.8  riastrad 	S->n_checkpointed_blocks = blkno;
    738   1.8  riastrad 
    739   1.8  riastrad 	/* Good to go and ready for interruption by a signal.  */
    740   1.8  riastrad 	S->initialized = 1;
    741   1.8  riastrad 
    742   1.8  riastrad 	/* Success!  */
    743   1.8  riastrad 	return true;
    744   1.8  riastrad }
    745   1.8  riastrad 
    746   1.8  riastrad /*
    747   1.8  riastrad  * Read a single block, compress it, and write the compressed block.
    748   1.8  riastrad  * Return the size of the compressed block.
    749   1.8  riastrad  */
    750   1.8  riastrad static uint32_t
    751   1.8  riastrad compress_block(int in_fd, int out_fd, uint32_t blkno, uint32_t blocksize,
    752   1.8  riastrad     uint32_t readsize, void *uncompbuf, void *compbuf)
    753   1.8  riastrad {
    754   1.8  riastrad 
    755   1.8  riastrad 	assert(readsize <= blocksize);
    756   1.8  riastrad 	assert(blocksize <= MAX_BLOCKSIZE);
    757   1.8  riastrad 
    758   1.8  riastrad 	/* Read the uncompressed block.  */
    759   1.8  riastrad 	const ssize_t n_read = read_block(in_fd, uncompbuf, readsize);
    760   1.8  riastrad 	if (n_read == -1)
    761   1.8  riastrad 		err(1, "read block %"PRIu32, blkno);
    762   1.8  riastrad 	assert(n_read >= 0);
    763  1.13  riastrad 	if ((size_t)n_read != readsize)
    764  1.13  riastrad 		errx(1, "partial read of block %"PRIu32": %zu != %"PRIu32,
    765  1.13  riastrad 		    blkno, (size_t)n_read, readsize);
    766   1.8  riastrad 
    767   1.8  riastrad 	/* Compress the block.  */
    768   1.8  riastrad 	/* XXX compression ratio bound */
    769   1.8  riastrad 	__CTASSERT(MAX_BLOCKSIZE <= (ULONG_MAX / 2));
    770   1.8  riastrad 	const unsigned long uncomplen =
    771   1.8  riastrad 	    (VNDCOMPRESS_COMPAT? blocksize : readsize); /* XXX */
    772   1.8  riastrad 	unsigned long complen = (uncomplen * 2);
    773   1.8  riastrad 	const int zerror = compress2(compbuf, &complen, uncompbuf, uncomplen,
    774   1.8  riastrad 	    Z_BEST_COMPRESSION);
    775   1.8  riastrad 	if (zerror != Z_OK)
    776   1.8  riastrad 		errx(1, "compressed failed at block %"PRIu32" (%d): %s", blkno,
    777   1.8  riastrad 		    zerror, zError(zerror));
    778   1.8  riastrad 	assert(complen <= (uncomplen * 2));
    779   1.8  riastrad 
    780   1.8  riastrad 	/* Write the compressed block.  */
    781   1.8  riastrad 	const ssize_t n_written = write(out_fd, compbuf, complen);
    782   1.8  riastrad 	if (n_written == -1)
    783   1.8  riastrad 		err(1, "write block %"PRIu32, blkno);
    784   1.8  riastrad 	assert(n_written >= 0);
    785  1.13  riastrad 	if ((size_t)n_written != complen)
    786  1.13  riastrad 		errx(1, "partial write of block %"PRIu32": %zu != %lu",
    787  1.13  riastrad 		    blkno, (size_t)n_written, complen);
    788   1.8  riastrad 
    789  1.13  riastrad 	return (size_t)n_written;
    790   1.1   hubertf }
    791   1.1   hubertf 
    792   1.1   hubertf /*
    793   1.8  riastrad  * Checkpoint if appropriate.
    794   1.1   hubertf  */
    795   1.8  riastrad static void
    796   1.8  riastrad compress_maybe_checkpoint(struct compress_state *S)
    797   1.1   hubertf {
    798   1.1   hubertf 
    799   1.8  riastrad 	if ((0 < S->checkpoint_blocks) && (0 < S->blkno) &&
    800   1.8  riastrad 	    ((S->blkno % S->checkpoint_blocks) == 0)) {
    801   1.8  riastrad 		assert(S->offset <= OFF_MAX);
    802   1.8  riastrad 		assert((off_t)S->offset == lseek(S->cloop2_fd, 0, SEEK_CUR));
    803   1.8  riastrad 		compress_checkpoint(S);
    804   1.1   hubertf 	}
    805   1.1   hubertf }
    806   1.1   hubertf 
    807   1.1   hubertf /*
    808   1.8  riastrad  * Write the prefix of the offset table that we have filled so far.
    809   1.8  riastrad  *
    810   1.8  riastrad  * We fsync the data blocks we have written, and then write the offset
    811   1.8  riastrad  * table, and then fsync the offset table and file metadata.  This
    812   1.8  riastrad  * should help to avoid offset tables that point at garbage data.
    813   1.8  riastrad  *
    814   1.8  riastrad  * This may be called from a signal handler, so it must not use stdio,
    815   1.8  riastrad  * malloc, &c. -- it may only (a) handle signal-safe state in S, and
    816   1.8  riastrad  * (b) do file descriptor I/O / fsync.
    817   1.8  riastrad  *
    818   1.8  riastrad  * XXX This requires further thought and heavy testing to be sure.
    819   1.8  riastrad  *
    820   1.8  riastrad  * XXX Should have an option to suppress fsync.
    821   1.8  riastrad  *
    822   1.8  riastrad  * XXX Should have an option to fail on fsync failures.
    823   1.8  riastrad  *
    824   1.8  riastrad  * XXX Would be nice if we could just do a barrier rather than an
    825   1.8  riastrad  * fsync.
    826   1.8  riastrad  *
    827   1.8  riastrad  * XXX How might we automatically test the fsyncs?
    828   1.1   hubertf  */
    829   1.7     joerg static void
    830   1.8  riastrad compress_checkpoint(struct compress_state *S)
    831   1.1   hubertf {
    832   1.8  riastrad 
    833   1.8  riastrad 	assert(S->blkno < S->n_offsets);
    834   1.8  riastrad 	const uint32_t n_offsets = (S->blkno + 1);
    835   1.8  riastrad 	assert(n_offsets <= S->n_offsets);
    836   1.8  riastrad 
    837   1.8  riastrad 	assert(S->offset <= OFF_MAX);
    838   1.8  riastrad 	assert((off_t)S->offset <= lseek(S->cloop2_fd, 0, SEEK_CUR));
    839   1.8  riastrad 
    840   1.8  riastrad 	/* Make sure the data hits the disk before we say it's ready.  */
    841   1.8  riastrad 	if (fsync_range(S->cloop2_fd, (FFILESYNC | FDISKSYNC), 0, S->offset)
    842   1.8  riastrad 	    == -1)
    843   1.8  riastrad 		warn_ss("fsync of output failed");
    844   1.8  riastrad 
    845   1.8  riastrad 	/* Say the data blocks are ready.  */
    846  1.15  riastrad 	offtab_checkpoint(&S->offtab, n_offsets,
    847  1.15  riastrad 	    (S->n_checkpointed_blocks == 0? OFFTAB_CHECKPOINT_SYNC : 0));
    848   1.8  riastrad 
    849   1.1   hubertf 	/*
    850   1.8  riastrad 	 * If this is the first checkpoint, initialize the header.
    851   1.8  riastrad 	 * Signal handler can race with main code here, but it is
    852   1.8  riastrad 	 * harmless -- just an extra fsync and write of the header,
    853   1.8  riastrad 	 * which are both idempotent.
    854  1.15  riastrad 	 *
    855  1.15  riastrad 	 * Once we have synchronously checkpointed the offset table,
    856  1.15  riastrad 	 * subsequent writes will preserve a valid state.
    857   1.1   hubertf 	 */
    858   1.8  riastrad 	if (S->n_checkpointed_blocks == 0) {
    859   1.8  riastrad 		static const struct cloop2_header zero_header;
    860   1.8  riastrad 		struct cloop2_header header = zero_header;
    861   1.8  riastrad 
    862   1.8  riastrad 		/* Format the header.  */
    863   1.8  riastrad 		__CTASSERT(sizeof(cloop2_magic) <= sizeof(header.cl2h_magic));
    864   1.8  riastrad 		(void)memcpy(header.cl2h_magic, cloop2_magic,
    865   1.8  riastrad 		    sizeof(cloop2_magic));
    866   1.8  riastrad 		header.cl2h_blocksize = htobe32(S->blocksize);
    867   1.8  riastrad 		header.cl2h_n_blocks = htobe32(S->n_blocks);
    868   1.8  riastrad 
    869   1.8  riastrad 		/* Write the header.  */
    870   1.8  riastrad 		const ssize_t h_written = pwrite(S->cloop2_fd, &header,
    871   1.8  riastrad 		    sizeof(header), 0);
    872   1.8  riastrad 		if (h_written == -1)
    873   1.8  riastrad 			err_ss(1, "write header");
    874   1.8  riastrad 		assert(h_written >= 0);
    875   1.8  riastrad 		if ((size_t)h_written != sizeof(header))
    876  1.13  riastrad 			errx_ss(1, "partial write of header: %zu != %zu",
    877  1.13  riastrad 			    (size_t)h_written, sizeof(header));
    878   1.8  riastrad 	}
    879   1.8  riastrad 
    880   1.8  riastrad 	/* Record how many blocks we've checkpointed.  */
    881   1.8  riastrad     {
    882   1.8  riastrad 	sigset_t old_sigmask;
    883   1.8  riastrad 	block_signals(&old_sigmask);
    884   1.8  riastrad 	S->n_checkpointed_blocks = S->blkno;
    885   1.8  riastrad 	restore_sigmask(&old_sigmask);
    886   1.8  riastrad     }
    887   1.8  riastrad }
    888   1.8  riastrad 
    889   1.8  riastrad /*
    890   1.8  riastrad  * Release everything we allocated in compress_init.
    891   1.8  riastrad  */
    892   1.8  riastrad static void
    893   1.8  riastrad compress_exit(struct compress_state *S)
    894   1.8  riastrad {
    895   1.8  riastrad 
    896  1.15  riastrad 	/* Done with the offset table.  Destroy it.  */
    897  1.15  riastrad 	offtab_destroy(&S->offtab);
    898   1.8  riastrad 
    899   1.8  riastrad 	/* Done with the files.  Close them.  */
    900   1.8  riastrad 	if (close(S->cloop2_fd) == -1)
    901   1.8  riastrad 		warn("close(cloop2 fd)");
    902   1.8  riastrad 	if (close(S->image_fd) == -1)
    903   1.8  riastrad 		warn("close(image fd)");
    904   1.1   hubertf }
    905