Home | History | Annotate | Line # | Download | only in vndcompress
vndcompress.c revision 1.14
      1  1.14  riastrad /*	$NetBSD: vndcompress.c,v 1.14 2014/01/22 06:14:20 riastradh Exp $	*/
      2   1.1   hubertf 
      3   1.8  riastrad /*-
      4   1.8  riastrad  * Copyright (c) 2013 The NetBSD Foundation, Inc.
      5   1.1   hubertf  * All rights reserved.
      6   1.1   hubertf  *
      7   1.8  riastrad  * This code is derived from software contributed to The NetBSD Foundation
      8   1.8  riastrad  * by Taylor R. Campbell.
      9   1.8  riastrad  *
     10   1.1   hubertf  * Redistribution and use in source and binary forms, with or without
     11   1.1   hubertf  * modification, are permitted provided that the following conditions
     12   1.1   hubertf  * are met:
     13   1.1   hubertf  * 1. Redistributions of source code must retain the above copyright
     14   1.1   hubertf  *    notice, this list of conditions and the following disclaimer.
     15   1.1   hubertf  * 2. Redistributions in binary form must reproduce the above copyright
     16   1.1   hubertf  *    notice, this list of conditions and the following disclaimer in the
     17   1.1   hubertf  *    documentation and/or other materials provided with the distribution.
     18   1.1   hubertf  *
     19   1.8  riastrad  * THIS SOFTWARE IS PROVIDED BY THE NETBSD FOUNDATION, INC. AND CONTRIBUTORS
     20   1.8  riastrad  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED
     21   1.1   hubertf  * TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     22   1.1   hubertf  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR CONTRIBUTORS
     23   1.1   hubertf  * BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
     24   1.1   hubertf  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
     25   1.1   hubertf  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
     26   1.1   hubertf  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
     27   1.1   hubertf  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
     28   1.1   hubertf  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
     29   1.1   hubertf  * POSSIBILITY OF SUCH DAMAGE.
     30   1.1   hubertf  */
     31   1.8  riastrad 
     32   1.8  riastrad #include <sys/cdefs.h>
     33  1.14  riastrad __RCSID("$NetBSD: vndcompress.c,v 1.14 2014/01/22 06:14:20 riastradh Exp $");
     34   1.8  riastrad 
     35   1.8  riastrad #include <sys/endian.h>
     36   1.8  riastrad 
     37   1.8  riastrad #include <assert.h>
     38   1.1   hubertf #include <err.h>
     39   1.8  riastrad #include <errno.h>
     40   1.1   hubertf #include <fcntl.h>
     41   1.5     lukem #include <inttypes.h>
     42   1.8  riastrad #include <limits.h>
     43   1.8  riastrad #include <signal.h>
     44   1.8  riastrad #include <stdbool.h>
     45   1.8  riastrad #include <stdint.h>
     46   1.1   hubertf #include <stdio.h>
     47   1.1   hubertf #include <stdlib.h>
     48   1.1   hubertf #include <string.h>
     49   1.1   hubertf #include <unistd.h>
     50   1.1   hubertf #include <zlib.h>
     51   1.1   hubertf 
     52   1.8  riastrad #include "common.h"
     53  1.14  riastrad #include "utils.h"
     54   1.8  riastrad 
     55   1.8  riastrad /*
     56   1.8  riastrad  * XXX Switch to control bug-for-bug byte-for-byte compatibility with
     57   1.8  riastrad  * NetBSD's vndcompress.
     58   1.8  riastrad  */
     59   1.8  riastrad #define	VNDCOMPRESS_COMPAT	0
     60   1.8  riastrad 
     61   1.8  riastrad __CTASSERT(sizeof(struct cloop2_header) == CLOOP2_OFFSET_TABLE_OFFSET);
     62   1.8  riastrad 
/*
 * Everything the compressor needs to know about the transfer in
 * progress.  The signal handlers read this through global_state, so
 * `initialized' tells them whether the other fields are usable yet.
 */
struct compress_state {
	/* Size of the uncompressed input, in bytes.  */
	uint64_t	size;
	/* Current byte offset in the output file.  */
	uint64_t	offset;
	/* Bytes per block.  */
	uint32_t	blocksize;
	/* Number of the input block about to be transferred.  */
	uint32_t	blkno;
	/* floor(size/blocksize) */
	uint32_t	n_full_blocks;
	/* ceiling(size/blocksize) */
	uint32_t	n_blocks;
	/* n_blocks + 1 */
	uint32_t	n_offsets;
	/* Last block to transfer; zero means no partial-transfer limit.  */
	uint32_t	end_block;
	/* Number of blocks before a checkpoint.  */
	uint32_t	checkpoint_blocks;
	/* Descriptor of the input image.  */
	int		image_fd;
	/* Descriptor of the output cloop2 file.  */
	int		cloop2_fd;
	/* n_offsets entries, kept in big-endian byte order.  */
	uint64_t	*offset_table;
	/* Number of blocks covered by the latest checkpoint.  */
	uint32_t	n_checkpointed_blocks;
	/* Nonzero once everything above has been initialized.  */
	volatile sig_atomic_t
			initialized;
};

/* The one compression state, global so the signal handlers can find it.  */
static struct compress_state	global_state;
     83   1.8  riastrad 
     84   1.8  riastrad struct sigdesc {
     85   1.8  riastrad 	int sd_signo;
     86   1.8  riastrad 	const char *sd_name;
     87   1.8  riastrad };
     88   1.1   hubertf 
     89   1.8  riastrad static const struct sigdesc info_signals[] = {
     90   1.8  riastrad 	{ SIGINFO, "SIGINFO" },
     91   1.8  riastrad 	{ SIGUSR1, "SIGUSR1" },
     92   1.1   hubertf };
     93   1.1   hubertf 
     94   1.8  riastrad static const struct sigdesc checkpoint_signals[] = {
     95   1.8  riastrad 	{ SIGUSR2, "SIGUSR2" },
     96   1.8  riastrad };
     97   1.8  riastrad 
     98   1.8  riastrad static void	init_signals(void);
     99   1.8  riastrad static void	init_signal_handler(int, const struct sigdesc *, size_t,
    100   1.8  riastrad 		    void (*)(int));
    101   1.8  riastrad static void	info_signal_handler(int);
    102   1.8  riastrad static void	checkpoint_signal_handler(int);
    103   1.8  riastrad static void	block_signals(sigset_t *);
    104   1.8  riastrad static void	restore_sigmask(const sigset_t *);
    105   1.8  riastrad static void	compress_progress(struct compress_state *);
    106   1.8  riastrad static void	compress_init(int, char **, const struct options *,
    107   1.8  riastrad 		    struct compress_state *);
    108   1.8  riastrad static bool	compress_restart(struct compress_state *);
    109   1.8  riastrad static uint32_t	compress_block(int, int, uint32_t, uint32_t, uint32_t, void *,
    110   1.8  riastrad 		    void *);
    111   1.8  riastrad static void	compress_maybe_checkpoint(struct compress_state *);
    112   1.8  riastrad static void	compress_checkpoint(struct compress_state *);
    113   1.8  riastrad static void	compress_exit(struct compress_state *);
    114   1.8  riastrad 
    115   1.1   hubertf /*
    116   1.8  riastrad  * Compression entry point.
    117   1.1   hubertf  */
    118   1.8  riastrad int
    119   1.8  riastrad vndcompress(int argc, char **argv, const struct options *O)
    120   1.8  riastrad {
    121   1.8  riastrad 	struct compress_state *const S = &global_state;
    122   1.8  riastrad 
    123   1.8  riastrad 	/* Paranoia.  The other fields either have no sentinel or use zero.  */
    124   1.8  riastrad 	S->image_fd = -1;
    125   1.8  riastrad 	S->cloop2_fd = -1;
    126   1.8  riastrad 
    127   1.8  riastrad 	/* Set up signal handlers so we can handle SIGINFO ASAP.  */
    128   1.8  riastrad 	init_signals();
    129   1.8  riastrad 
    130   1.8  riastrad 	/*
    131   1.8  riastrad 	 * Parse the arguments to initialize our state.
    132   1.8  riastrad 	 */
    133   1.8  riastrad 	compress_init(argc, argv, O, S);
    134   1.8  riastrad 	assert(MIN_BLOCKSIZE <= S->blocksize);
    135   1.8  riastrad 	assert(S->blocksize <= MAX_BLOCKSIZE);
    136   1.8  riastrad 	assert(S->offset_table != NULL);
    137   1.8  riastrad 	assert(S->n_offsets > 0);
    138   1.8  riastrad 	assert(S->offset_table[0] == htobe64(sizeof(struct cloop2_header) +
    139   1.8  riastrad 		(S->n_offsets * sizeof(uint64_t))));
    140   1.8  riastrad 
    141   1.8  riastrad 	/*
    142   1.8  riastrad 	 * Allocate compression buffers.
    143   1.8  riastrad 	 *
    144   1.8  riastrad 	 * Compression may actually expand.  From an overabundance of
    145   1.8  riastrad 	 * caution, assume it can expand by at most double.
    146   1.8  riastrad 	 *
    147   1.8  riastrad 	 * XXX Check and consider tightening this assumption.
    148   1.8  riastrad 	 */
    149   1.8  riastrad 	__CTASSERT(MAX_BLOCKSIZE <= SIZE_MAX);
    150   1.8  riastrad 	void *const uncompbuf = malloc(S->blocksize);
    151   1.8  riastrad 	if (uncompbuf == NULL)
    152   1.8  riastrad 		err(1, "malloc uncompressed buffer");
    153   1.8  riastrad 
    154   1.8  riastrad 	/* XXX compression ratio bound */
    155   1.8  riastrad 	__CTASSERT(MAX_BLOCKSIZE <= (SIZE_MAX / 2));
    156   1.8  riastrad 	void *const compbuf = malloc(2 * (size_t)S->blocksize);
    157   1.8  riastrad 	if (compbuf == NULL)
    158   1.8  riastrad 		err(1, "malloc compressed buffer");
    159   1.8  riastrad 
    160   1.8  riastrad 	/*
    161   1.8  riastrad 	 * Compress the blocks.  S->blkno specifies the input block
    162   1.8  riastrad 	 * we're about to transfer.  S->offset is the current output
    163   1.8  riastrad 	 * offset.
    164   1.8  riastrad 	 */
    165   1.8  riastrad 	while (S->blkno < S->n_blocks) {
    166   1.8  riastrad 		/* Report any progress.  */
    167   1.8  riastrad 		compress_progress(S);
    168   1.8  riastrad 
    169   1.8  riastrad 		/* Stop if we've done the requested partial transfer.  */
    170   1.8  riastrad 		if ((0 < S->end_block) && (S->end_block <= S->blkno))
    171   1.8  riastrad 			goto out;
    172   1.8  riastrad 
    173   1.8  riastrad 		/* Checkpoint if appropriate.  */
    174   1.8  riastrad 		compress_maybe_checkpoint(S);
    175   1.8  riastrad 
    176   1.8  riastrad 		/* Choose read size: partial if last block, full if not.  */
    177   1.8  riastrad 		const uint32_t readsize = (S->blkno == S->n_full_blocks?
    178   1.8  riastrad 		    (S->size % S->blocksize) : S->blocksize);
    179   1.8  riastrad 		assert(readsize > 0);
    180   1.8  riastrad 		assert(readsize <= S->blocksize);
    181   1.8  riastrad 
    182   1.8  riastrad 		/* Fail noisily if we might be about to overflow.  */
    183   1.8  riastrad 		/* XXX compression ratio bound */
    184   1.8  riastrad 		__CTASSERT(MAX_BLOCKSIZE <= (UINTMAX_MAX / 2));
    185   1.8  riastrad 		assert(S->offset <= MIN(UINT64_MAX, OFF_MAX));
    186   1.8  riastrad 		if ((2 * (uintmax_t)readsize) >
    187   1.8  riastrad 		    (MIN(UINT64_MAX, OFF_MAX) - S->offset))
    188   1.8  riastrad 			errx(1, "blkno %"PRIu32" may overflow: %ju + 2*%ju",
    189   1.8  riastrad 			    S->blkno, (uintmax_t)S->offset,
    190   1.8  riastrad 			    (uintmax_t)readsize);
    191   1.8  riastrad 
    192   1.8  riastrad 		/* Process the block.  */
    193   1.8  riastrad 		const uint32_t complen =
    194   1.8  riastrad 		    compress_block(S->image_fd, S->cloop2_fd, S->blkno,
    195   1.8  riastrad 			S->blocksize, readsize, uncompbuf, compbuf);
    196   1.8  riastrad 
    197   1.8  riastrad 		/*
    198   1.8  riastrad 		 * Signal-atomically update the state to reflect
    199   1.8  riastrad 		 * (a) what block number we are now at,
    200   1.8  riastrad 		 * (b) how far we are now in the output file, and
    201   1.8  riastrad 		 * (c) where the last block ended.
    202   1.8  riastrad 		 */
    203   1.8  riastrad 		assert(S->blkno <= (UINT32_MAX - 1));
    204   1.8  riastrad 		assert(complen <= (MIN(UINT64_MAX, OFF_MAX) - S->offset));
    205   1.8  riastrad 		assert((S->blkno + 1) < S->n_offsets);
    206   1.8  riastrad 	    {
    207   1.8  riastrad 		sigset_t old_sigmask;
    208   1.8  riastrad 		block_signals(&old_sigmask);
    209   1.8  riastrad 		S->blkno += 1;					/* (a) */
    210   1.8  riastrad 		S->offset += complen;				/* (b) */
    211   1.8  riastrad 		S->offset_table[S->blkno] = htobe64(S->offset);	/* (c) */
    212   1.8  riastrad 		restore_sigmask(&old_sigmask);
    213   1.8  riastrad 	    }
    214   1.8  riastrad 	}
    215   1.8  riastrad 
    216   1.8  riastrad 	/* Make sure we're all done. */
    217   1.8  riastrad 	assert(S->blkno == S->n_blocks);
    218   1.8  riastrad 	assert((S->blkno + 1) == S->n_offsets);
    219   1.8  riastrad 
    220   1.8  riastrad 	/* Pad to the disk block size.  */
    221   1.8  riastrad 	const uint32_t n_extra = (S->offset % DEV_BSIZE);
    222   1.8  riastrad 	if (n_extra != 0) {
    223   1.8  riastrad 		const uint32_t n_padding = (DEV_BSIZE - n_extra);
    224   1.8  riastrad 		/* Reuse compbuf -- guaranteed to be large enough.  */
    225   1.8  riastrad 		(void)memset(compbuf, 0, n_padding);
    226   1.8  riastrad 		const ssize_t n_written = write(S->cloop2_fd, compbuf,
    227   1.8  riastrad 		    n_padding);
    228   1.8  riastrad 		if (n_written == -1)
    229   1.8  riastrad 			err(1, "write final padding failed");
    230   1.8  riastrad 		assert(n_written >= 0);
    231   1.8  riastrad 		if ((size_t)n_written != n_padding)
    232   1.8  riastrad 			errx(1, "partial write of final padding bytes"
    233  1.13  riastrad 			    ": %zu != %"PRIu32,
    234  1.13  riastrad 			    (size_t)n_written, n_padding);
    235   1.8  riastrad 
    236   1.8  riastrad 		/* Account for the extra bytes in the output file.  */
    237   1.8  riastrad 		assert(n_padding <= (MIN(UINT64_MAX, OFF_MAX) - S->offset));
    238   1.8  riastrad 	    {
    239   1.8  riastrad 		sigset_t old_sigmask;
    240   1.8  riastrad 		block_signals(&old_sigmask);
    241   1.8  riastrad 		S->offset += n_padding;
    242   1.8  riastrad 		restore_sigmask(&old_sigmask);
    243   1.8  riastrad 	    }
    244   1.8  riastrad 	}
    245   1.8  riastrad 
    246   1.8  riastrad out:
    247   1.8  riastrad 	/* Commit the offset table.  */
    248   1.8  riastrad 	assert(S->offset <= OFF_MAX);
    249   1.8  riastrad 	assert((off_t)S->offset == lseek(S->cloop2_fd, 0, SEEK_CUR));
    250   1.8  riastrad 	compress_checkpoint(S);
    251   1.8  riastrad 
    252   1.8  riastrad 	/*
    253   1.8  riastrad 	 * Free the compression buffers and finalize the compression.
    254   1.8  riastrad 	 */
    255   1.8  riastrad 	free(compbuf);
    256   1.8  riastrad 	free(uncompbuf);
    257   1.8  riastrad 	compress_exit(S);
    258   1.1   hubertf 
    259   1.8  riastrad 	return 0;
    260   1.8  riastrad }
    261   1.1   hubertf 
    262   1.1   hubertf /*
    263   1.8  riastrad  * Signal cruft.
    264   1.1   hubertf  */
    265   1.8  riastrad 
    266   1.8  riastrad static void
    267   1.8  riastrad init_signals(void)
    268   1.8  riastrad {
    269   1.8  riastrad 
    270   1.8  riastrad 	init_signal_handler(SA_RESTART, info_signals,
    271   1.8  riastrad 	    __arraycount(info_signals), &info_signal_handler);
    272   1.8  riastrad 	init_signal_handler(SA_RESTART, checkpoint_signals,
    273   1.8  riastrad 	    __arraycount(checkpoint_signals), &checkpoint_signal_handler);
    274   1.8  riastrad }
    275   1.8  riastrad 
    276   1.8  riastrad static void
    277   1.8  riastrad init_signal_handler(int flags, const struct sigdesc *signals, size_t n,
    278   1.8  riastrad     void (*handler)(int))
    279   1.1   hubertf {
    280   1.8  riastrad 	static const struct sigaction zero_sa;
    281   1.8  riastrad 	struct sigaction sa = zero_sa;
    282   1.8  riastrad 	size_t i;
    283   1.8  riastrad 
    284   1.8  riastrad 	(void)sigemptyset(&sa.sa_mask);
    285   1.8  riastrad 	for (i = 0; i < n; i++)
    286   1.8  riastrad 		(void)sigaddset(&sa.sa_mask, signals[i].sd_signo);
    287   1.8  riastrad 	sa.sa_flags = flags;
    288   1.8  riastrad 	sa.sa_handler = handler;
    289   1.8  riastrad 	for (i = 0; i < n; i++)
    290   1.8  riastrad 		if (sigaction(signals[i].sd_signo, &sa, NULL) == -1)
    291   1.8  riastrad 			err(1, "sigaction(%s)", signals[i].sd_name);
    292   1.8  riastrad }
    293   1.8  riastrad 
    294   1.8  riastrad static void
    295   1.8  riastrad info_signal_handler(int signo __unused)
    296   1.8  riastrad {
    297   1.8  riastrad 	/* Save errno.  */
    298   1.8  riastrad 	const int error = errno;
    299   1.8  riastrad 	struct compress_state *const S = &global_state;
    300   1.8  riastrad 	char buf[128];
    301   1.8  riastrad 
    302   1.8  riastrad 	/* Bail if the state is not yet initialized.  */
    303   1.8  riastrad 	if (!S->initialized) {
    304   1.8  riastrad 		warnx_ss("initializing");
    305   1.8  riastrad 		goto out;
    306   1.8  riastrad 	}
    307   1.8  riastrad 
    308   1.8  riastrad 	/* Carefully calculate our I/O position.  */
    309   1.8  riastrad 	assert(S->blocksize > 0);
    310   1.8  riastrad 	__CTASSERT(MAX_N_BLOCKS <= (UINT64_MAX / MAX_BLOCKSIZE));
    311   1.8  riastrad 	const uint64_t nread = ((uint64_t)S->blkno * (uint64_t)S->blocksize);
    312   1.8  riastrad 
    313   1.8  riastrad 	assert(S->n_blocks > 0);
    314   1.8  riastrad 	__CTASSERT(MAX_N_BLOCKS <= ((UINT64_MAX / sizeof(uint64_t)) -
    315   1.8  riastrad 		CLOOP2_OFFSET_TABLE_OFFSET));
    316   1.8  riastrad 	const uint64_t nwritten = (S->offset <= (CLOOP2_OFFSET_TABLE_OFFSET +
    317   1.8  riastrad 		(S->n_blocks * sizeof(uint64_t)))?
    318   1.8  riastrad 	    0 : S->offset);
    319   1.8  riastrad 
    320   1.8  riastrad 	/* snprintf_ss can't do floating-point, so do fixed-point instead.  */
    321   1.8  riastrad 	const uint64_t ratio_percent =
    322   1.8  riastrad 	    (nread > 0?
    323   1.8  riastrad 		((nwritten >= (UINT64_MAX / 100)) ?
    324   1.8  riastrad 		    ((nwritten / nread) * 100) : ((nwritten * 100) / nread))
    325   1.8  riastrad 		: 0);
    326   1.8  riastrad 
    327   1.8  riastrad 	/* Format the status.  */
    328   1.8  riastrad 	assert(S->n_checkpointed_blocks <= (UINT64_MAX / S->blocksize));
    329   1.8  riastrad 	const int n = snprintf_ss(buf, sizeof(buf),
    330   1.8  riastrad 	    "vndcompress: read %"PRIu64" bytes, wrote %"PRIu64" bytes, "
    331   1.8  riastrad 	    "compression ratio %"PRIu64"%% (checkpointed %"PRIu64" bytes)\n",
    332   1.8  riastrad 	    nread, nwritten, ratio_percent,
    333   1.8  riastrad 	    ((uint64_t)S->n_checkpointed_blocks * (uint64_t)S->blocksize));
    334   1.8  riastrad 	if (n < 0) {
    335   1.8  riastrad 		const char msg[] = "vndcompress: can't format info\n";
    336   1.8  riastrad 		(void)write(STDERR_FILENO, msg, __arraycount(msg));
    337   1.1   hubertf 	} else {
    338   1.8  riastrad 		__CTASSERT(INT_MAX <= SIZE_MAX);
    339   1.8  riastrad 		(void)write(STDERR_FILENO, buf, (size_t)n);
    340   1.8  riastrad 	}
    341   1.8  riastrad 
    342   1.8  riastrad out:
    343   1.8  riastrad 	/* Restore errno.  */
    344   1.8  riastrad 	errno = error;
    345   1.8  riastrad }
    346   1.8  riastrad 
    347   1.8  riastrad static void
    348   1.8  riastrad checkpoint_signal_handler(int signo __unused)
    349   1.8  riastrad {
    350   1.8  riastrad 	/* Save errno.  */
    351   1.8  riastrad 	const int error = errno;
    352   1.8  riastrad 	struct compress_state *const S = &global_state;
    353   1.8  riastrad 
    354   1.8  riastrad 	/* Bail if the state is not yet initialized.  */
    355   1.8  riastrad 	if (!S->initialized) {
    356   1.8  riastrad 		warnx_ss("nothing to checkpoint yet");
    357   1.8  riastrad 		goto out;
    358   1.1   hubertf 	}
    359   1.8  riastrad 
    360   1.8  riastrad 	assert(S->image_fd >= 0);
    361   1.8  riastrad 	assert(S->cloop2_fd >= 0);
    362   1.8  riastrad 
    363   1.8  riastrad 	/* Take a checkpoint.  */
    364   1.8  riastrad 	assert(S->blocksize > 0);
    365   1.8  riastrad 	assert(S->blkno <= (UINT64_MAX / S->blocksize));
    366   1.8  riastrad 	warnx_ss("checkpointing %"PRIu64" bytes",
    367   1.8  riastrad 	    ((uint64_t)S->blkno * (uint64_t)S->blocksize));
    368   1.8  riastrad 	compress_checkpoint(S);
    369   1.8  riastrad 
    370   1.8  riastrad out:
    371   1.8  riastrad 	/* Restore errno.  */
    372   1.8  riastrad 	errno = error;
    373   1.8  riastrad }
    374   1.8  riastrad 
/*
 * Block every signal, storing the previous signal mask in
 * *old_sigmask so that restore_sigmask() can reinstate it.
 */
static void
block_signals(sigset_t *old_sigmask)
{
	sigset_t all_signals;

	(void)sigfillset(&all_signals);
	(void)sigprocmask(SIG_BLOCK, &all_signals, old_sigmask);
}
    383   1.8  riastrad 
/*
 * Replace the current signal mask with *sigmask, normally the mask
 * that block_signals() saved.
 */
static void
restore_sigmask(const sigset_t *sigmask)
{
	const int how = SIG_SETMASK;

	(void)sigprocmask(how, sigmask, NULL);
}
    390   1.8  riastrad 
    391   1.8  riastrad /*
    392   1.8  riastrad  * Report progress.
    393   1.8  riastrad  *
    394   1.8  riastrad  * XXX Should do a progress bar here.
    395   1.8  riastrad  */
    396   1.8  riastrad static void
    397   1.8  riastrad compress_progress(struct compress_state *S __unused)
    398   1.8  riastrad {
    399   1.1   hubertf }
    400   1.1   hubertf 
    401   1.1   hubertf /*
    402   1.8  riastrad  * Parse arguments, open the files, and initialize the state.
    403   1.1   hubertf  */
    404   1.7     joerg static void
    405   1.8  riastrad compress_init(int argc, char **argv, const struct options *O,
    406   1.8  riastrad     struct compress_state *S)
    407   1.8  riastrad {
    408   1.8  riastrad 	uint32_t i;
    409   1.8  riastrad 
    410   1.8  riastrad 	if (!((argc == 2) || (argc == 3)))
    411   1.8  riastrad 		usage();
    412   1.8  riastrad 
    413   1.8  riastrad 	const char *const image_pathname = argv[0];
    414   1.8  riastrad 	const char *const cloop2_pathname = argv[1];
    415   1.8  riastrad 
    416   1.8  riastrad 	/* Grab the block size either from `-s' or from the last argument.  */
    417   1.8  riastrad 	__CTASSERT(0 < DEV_BSIZE);
    418   1.8  riastrad 	__CTASSERT((MIN_BLOCKSIZE % DEV_BSIZE) == 0);
    419   1.8  riastrad 	__CTASSERT(MIN_BLOCKSIZE <= DEF_BLOCKSIZE);
    420   1.8  riastrad 	__CTASSERT((DEF_BLOCKSIZE % DEV_BSIZE) == 0);
    421   1.8  riastrad 	__CTASSERT(DEF_BLOCKSIZE <= MAX_BLOCKSIZE);
    422   1.8  riastrad 	__CTASSERT((MAX_BLOCKSIZE % DEV_BSIZE) == 0);
    423   1.8  riastrad 	if (ISSET(O->flags, FLAG_s)) {
    424   1.8  riastrad 		if (argc == 3) {
    425   1.8  riastrad 			warnx("use -s or the extra argument, not both");
    426   1.8  riastrad 			usage();
    427   1.8  riastrad 		}
    428   1.8  riastrad 		S->blocksize = O->blocksize;
    429   1.8  riastrad 	} else {
    430   1.8  riastrad 		S->blocksize = (argc == 2? DEF_BLOCKSIZE :
    431   1.8  riastrad 		    strsuftoll("block size", argv[2], MIN_BLOCKSIZE,
    432   1.8  riastrad 			MAX_BLOCKSIZE));
    433   1.8  riastrad 	}
    434   1.8  riastrad 
    435   1.8  riastrad 	/* Sanity-check the blocksize.  (strsuftoll guarantees bounds.)  */
    436   1.8  riastrad 	__CTASSERT(DEV_BSIZE <= UINT32_MAX);
    437   1.8  riastrad 	if ((S->blocksize % DEV_BSIZE) != 0)
    438   1.8  riastrad 		errx(1, "bad blocksize: %"PRIu32
    439   1.8  riastrad 		    " (not a multiple of %"PRIu32")",
    440   1.8  riastrad 		    S->blocksize, (uint32_t)DEV_BSIZE);
    441   1.8  riastrad 	assert(MIN_BLOCKSIZE <= S->blocksize);
    442   1.8  riastrad 	assert((S->blocksize % DEV_BSIZE) == 0);
    443   1.8  riastrad 	assert(S->blocksize <= MAX_BLOCKSIZE);
    444   1.8  riastrad 
    445   1.8  riastrad 	/* Grab the end block number if we have one.  */
    446   1.8  riastrad 	S->end_block = (ISSET(O->flags, FLAG_p)? O->end_block : 0);
    447   1.8  riastrad 
    448   1.8  riastrad 	/* Grab the checkpoint block count, if we have one.  */
    449   1.8  riastrad 	S->checkpoint_blocks =
    450   1.8  riastrad 	    (ISSET(O->flags, FLAG_k)? O->checkpoint_blocks : 0);
    451   1.8  riastrad 
    452   1.8  riastrad 	/* Open the input image file and the output cloop2 file.  */
    453   1.8  riastrad 	S->image_fd = open(image_pathname, O_RDONLY);
    454   1.8  riastrad 	if (S->image_fd == -1)
    455   1.8  riastrad 		err(1, "open(%s)", image_pathname);
    456   1.8  riastrad 
    457   1.8  riastrad 	int oflags;
    458   1.8  riastrad 	if (!ISSET(O->flags, FLAG_r))
    459   1.8  riastrad 		oflags = (O_WRONLY | O_TRUNC | O_CREAT); /* XXX O_EXCL?  */
    460   1.8  riastrad 	else if (!ISSET(O->flags, FLAG_R))
    461   1.8  riastrad 		oflags = (O_RDWR | O_CREAT);
    462   1.8  riastrad 	else
    463   1.8  riastrad 		oflags = O_RDWR;
    464   1.8  riastrad 	S->cloop2_fd = open(cloop2_pathname, oflags, 0777);
    465   1.8  riastrad 	if (S->cloop2_fd == -1)
    466   1.8  riastrad 		err(1, "open(%s)", cloop2_pathname);
    467   1.8  riastrad 
    468   1.8  riastrad 	/* Find the size of the input image.  */
    469   1.8  riastrad 	if (ISSET(O->flags, FLAG_l)) {
    470   1.8  riastrad 		S->size = O->length;
    471   1.8  riastrad 	} else {
    472   1.8  riastrad 		static const struct stat zero_st;
    473   1.8  riastrad 		struct stat st = zero_st;
    474   1.8  riastrad 		if (fstat(S->image_fd, &st) == -1)
    475   1.8  riastrad 			err(1, "stat(%s)", image_pathname);
    476   1.8  riastrad 		if (st.st_size <= 0)
    477   1.8  riastrad 			errx(1, "unknown image size");
    478   1.8  riastrad 		assert(st.st_size >= 0);
    479   1.8  riastrad 		__CTASSERT(OFF_MAX <= UINT64_MAX);
    480   1.8  riastrad 		assert(__type_fit(uint64_t, st.st_size));
    481   1.8  riastrad 		S->size = st.st_size;
    482   1.8  riastrad 	}
    483   1.8  riastrad 	assert(S->size <= OFF_MAX);
    484   1.8  riastrad 
    485   1.8  riastrad 	/* Find number of full blocks and whether there's a partial block.  */
    486   1.8  riastrad 	S->n_full_blocks = (S->size / S->blocksize);
    487   1.8  riastrad 	assert(S->n_full_blocks <=
    488   1.8  riastrad 	    (UINT32_MAX - ((S->size % S->blocksize) > 0)));
    489   1.8  riastrad 	S->n_blocks = (S->n_full_blocks + ((S->size % S->blocksize) > 0));
    490   1.8  riastrad 	assert(S->n_full_blocks <= S->n_blocks);
    491   1.8  riastrad 
    492   1.8  riastrad 	if (S->n_blocks > MAX_N_BLOCKS)
    493   1.8  riastrad 		errx(1, "image too large for block size %"PRIu32": %"PRIu64,
    494   1.8  riastrad 		    S->blocksize, S->size);
    495   1.8  riastrad 	assert(S->n_blocks <= MAX_N_BLOCKS);
    496   1.8  riastrad 
    497   1.8  riastrad 	/* Allocate an offset table for the blocks; one extra for the end.  */
    498   1.8  riastrad 	__CTASSERT(MAX_N_BLOCKS <= (UINT32_MAX - 1));
    499   1.8  riastrad 	S->n_offsets = (S->n_blocks + 1);
    500   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS == (MAX_N_BLOCKS + 1));
    501   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS <= (SIZE_MAX / sizeof(uint64_t)));
    502   1.8  riastrad 	S->offset_table = malloc(S->n_offsets * sizeof(uint64_t));
    503   1.8  riastrad 	if (S->offset_table == NULL)
    504   1.8  riastrad 		err(1, "malloc offset table");
    505   1.8  riastrad 
    506   1.8  riastrad 	/* Attempt to restart a partial transfer if requested.  */
    507   1.8  riastrad 	if (ISSET(O->flags, FLAG_r)) {
    508   1.8  riastrad 		if (compress_restart(S)) {
    509   1.8  riastrad 			/*
    510   1.8  riastrad 			 * Restart succeeded.  Truncate the output
    511   1.8  riastrad 			 * here, in case any garbage got appended.  We
    512   1.8  riastrad 			 * are committed to making progress at this
    513   1.8  riastrad 			 * point.  If the ftruncate fails, we don't
    514   1.8  riastrad 			 * lose anything valuable -- this is the last
    515   1.8  riastrad 			 * point at which we can restart anyway.
    516   1.8  riastrad 			 */
    517   1.8  riastrad 			if (ftruncate(S->cloop2_fd, S->offset) == -1)
    518   1.8  riastrad 				err(1, "ftruncate failed");
    519   1.8  riastrad 
    520   1.8  riastrad 			/* All set!  No more initialization to do.  */
    521   1.8  riastrad 			return;
    522   1.8  riastrad 		} else {
    523   1.8  riastrad 			/* Restart failed.  Barf now if requested.  */
    524   1.8  riastrad 			if (ISSET(O->flags, FLAG_R))
    525   1.8  riastrad 				errx(1, "restart failed, aborting");
    526   1.8  riastrad 
    527   1.8  riastrad 			/* Otherwise, truncate and start at the top.  */
    528   1.8  riastrad 			if (ftruncate(S->cloop2_fd, 0) == -1)
    529   1.8  riastrad 				err(1, "truncate failed");
    530   1.8  riastrad 			if (lseek(S->cloop2_fd, 0, SEEK_SET) == -1)
    531   1.8  riastrad 				err(1, "lseek to cloop2 beginning failed");
    532   1.8  riastrad 			if (lseek(S->image_fd, 0, SEEK_SET) == -1)
    533   1.8  riastrad 				err(1, "lseek to image beginning failed");
    534   1.8  riastrad 		}
    535   1.8  riastrad 	}
    536   1.8  riastrad 
    537   1.1   hubertf 	/*
    538   1.8  riastrad 	 * Initialize the offset table to all ones (except for the
    539   1.8  riastrad 	 * fixed first offset) so that we can easily detect where we
    540   1.8  riastrad 	 * were interrupted if we want to restart.
    541   1.1   hubertf 	 */
    542   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS <= UINT32_MAX);
    543   1.8  riastrad 	assert(S->n_offsets > 0);
    544   1.8  riastrad 	S->offset_table[0] = htobe64(sizeof(struct cloop2_header) +
    545   1.8  riastrad 	    (S->n_offsets * sizeof(uint64_t)));
    546   1.8  riastrad 	for (i = 1; i < S->n_offsets; i++)
    547   1.8  riastrad 		S->offset_table[i] = ~(uint64_t)0;
    548   1.8  riastrad 
    549   1.8  riastrad 	/* Write a bogus (zero) header for now, until we checkpoint.  */
    550   1.8  riastrad 	static const struct cloop2_header zero_header;
    551   1.8  riastrad 	const ssize_t h_written = write(S->cloop2_fd, &zero_header,
    552   1.8  riastrad 	    sizeof(zero_header));
    553   1.8  riastrad 	if (h_written == -1)
    554   1.8  riastrad 		err(1, "write header");
    555   1.8  riastrad 	assert(h_written >= 0);
    556   1.8  riastrad 	if ((size_t)h_written != sizeof(zero_header))
    557  1.13  riastrad 		errx(1, "partial write of header: %zu != %zu",
    558  1.13  riastrad 		    (size_t)h_written, sizeof(zero_header));
    559   1.8  riastrad 
    560   1.8  riastrad 	/* Write the initial (empty) offset table.  */
    561   1.8  riastrad 	const ssize_t ot_written = write(S->cloop2_fd, S->offset_table,
    562   1.8  riastrad 	    (S->n_offsets * sizeof(uint64_t)));
    563   1.8  riastrad 	if (ot_written == -1)
    564   1.8  riastrad 		err(1, "write initial offset table");
    565   1.8  riastrad 	assert(ot_written >= 0);
    566   1.8  riastrad 	if ((size_t)ot_written != (S->n_offsets * sizeof(uint64_t)))
    567  1.13  riastrad 		errx(1, "partial write of initial offset bytes: %zu <= %zu",
    568  1.13  riastrad 		    (size_t)ot_written,
    569  1.13  riastrad 		    (size_t)(S->n_offsets * sizeof(uint64_t)));
    570   1.8  riastrad 
    571   1.8  riastrad 	/* Start at the beginning of the image.  */
    572   1.8  riastrad 	S->blkno = 0;
    573   1.8  riastrad 	S->offset = (sizeof(struct cloop2_header) +
    574   1.8  riastrad 	    (S->n_offsets * sizeof(uint64_t)));
    575   1.8  riastrad 	S->n_checkpointed_blocks = 0;
    576   1.8  riastrad 
    577   1.8  riastrad 	/* Good to go and ready for interruption by a signal.  */
    578   1.8  riastrad 	S->initialized = 1;
    579   1.8  riastrad }
    580   1.8  riastrad 
    581   1.8  riastrad /*
    582   1.8  riastrad  * Try to recover state from an existing output file.
    583   1.8  riastrad  *
    584   1.8  riastrad  * On success, fill S->offset_table with what's in the file, set
    585   1.8  riastrad  * S->blkno and S->offset to reflect our position, and seek to the
    586   1.8  riastrad  * respective positions in the input and output files.
    587   1.8  riastrad  *
    588   1.8  riastrad  * On failure, return false.  May clobber S->offset_table, S->blkno,
    589   1.8  riastrad  * S->offset, and the file pointers.
    590   1.8  riastrad  */
    591   1.8  riastrad static bool
    592   1.8  riastrad compress_restart(struct compress_state *S)
    593   1.8  riastrad {
    594   1.8  riastrad 
    595   1.8  riastrad 	/* Read in the header.  */
    596   1.8  riastrad 	static const struct cloop2_header zero_header;
    597   1.8  riastrad 	struct cloop2_header header = zero_header;
    598   1.8  riastrad 
    599   1.8  riastrad 	const ssize_t h_read = read_block(S->cloop2_fd, &header,
    600   1.8  riastrad 	    sizeof(header));
    601   1.8  riastrad 	if (h_read == -1) {
    602   1.8  riastrad 		warn("failed to read header");
    603   1.8  riastrad 		return false;
    604   1.8  riastrad 	}
    605   1.8  riastrad 	assert(h_read >= 0);
    606   1.8  riastrad 	if ((size_t)h_read != sizeof(header)) {
    607   1.8  riastrad 		warnx("partial read of header");
    608   1.8  riastrad 		return false;
    609   1.8  riastrad 	}
    610   1.8  riastrad 
    611   1.8  riastrad 	/* Check that the header looks like a header.  */
    612   1.8  riastrad 	__CTASSERT(sizeof(cloop2_magic) <= sizeof(header.cl2h_magic));
    613   1.8  riastrad 	if (memcmp(header.cl2h_magic, cloop2_magic, sizeof(cloop2_magic))
    614   1.8  riastrad 	    != 0) {
    615   1.8  riastrad 		warnx("bad cloop2 shell script magic");
    616   1.8  riastrad 		return false;
    617   1.8  riastrad 	}
    618   1.8  riastrad 
    619   1.8  riastrad 	/* Check the header parameters.  */
    620   1.8  riastrad 	if (be32toh(header.cl2h_blocksize) != S->blocksize) {
    621   1.8  riastrad 		warnx("mismatched block size: %"PRIu32
    622   1.8  riastrad 		    " (expected %"PRIu32")",
    623   1.8  riastrad 		    be32toh(header.cl2h_blocksize), S->blocksize);
    624   1.8  riastrad 		return false;
    625   1.8  riastrad 	}
    626   1.8  riastrad 	if (be32toh(header.cl2h_n_blocks) != S->n_blocks) {
    627   1.8  riastrad 		warnx("mismatched number of blocks: %"PRIu32
    628   1.8  riastrad 		    " (expected %"PRIu32")",
    629   1.8  riastrad 		    be32toh(header.cl2h_n_blocks), S->n_blocks);
    630   1.8  riastrad 		return false;
    631   1.8  riastrad 	}
    632   1.8  riastrad 
    633   1.8  riastrad 	/* Read in the partial offset table.  */
    634   1.8  riastrad 	const ssize_t ot_read = read_block(S->cloop2_fd, S->offset_table,
    635   1.8  riastrad 	    (S->n_offsets * sizeof(uint64_t)));
    636   1.8  riastrad 	if (ot_read == -1) {
    637   1.8  riastrad 		warn("failed to read offset table");
    638   1.8  riastrad 		return false;
    639   1.8  riastrad 	}
    640   1.8  riastrad 	assert(ot_read >= 0);
    641   1.8  riastrad 	if ((size_t)ot_read != (S->n_offsets * sizeof(uint64_t))) {
    642   1.8  riastrad 		warnx("partial read of offset table");
    643   1.8  riastrad 		return false;
    644   1.8  riastrad 	}
    645   1.8  riastrad 
    646   1.8  riastrad 	if (be64toh(S->offset_table[0]) != (sizeof(struct cloop2_header) +
    647   1.8  riastrad 		(S->n_offsets * sizeof(uint64_t)))) {
    648   1.8  riastrad 		warnx("first offset is not %"PRIu64": %"PRIu64,
    649   1.8  riastrad 		    ((uint64_t)S->n_offsets * sizeof(uint64_t)),
    650   1.8  riastrad 		    be64toh(S->offset_table[0]));
    651   1.8  riastrad 		return false;
    652   1.8  riastrad 	}
    653   1.8  riastrad 
    654   1.8  riastrad 	/* Find where we left off.  */
    655   1.8  riastrad 	__CTASSERT(MAX_N_OFFSETS <= UINT32_MAX);
    656   1.8  riastrad 	uint32_t blkno = 0;
    657   1.8  riastrad 	for (blkno = 0; blkno < S->n_blocks; blkno++) {
    658   1.8  riastrad 		if (S->offset_table[blkno] == ~(uint64_t)0)
    659   1.8  riastrad 			break;
    660   1.8  riastrad 		if (0 < blkno) {
    661   1.8  riastrad 			const uint64_t start =
    662   1.8  riastrad 			    be64toh(S->offset_table[blkno - 1]);
    663   1.8  riastrad 			const uint64_t end = be64toh(S->offset_table[blkno]);
    664   1.8  riastrad 			if (end <= start) {
    665   1.8  riastrad 				warnx("bad offset table: 0x%"PRIx64
    666   1.8  riastrad 				    ", 0x%"PRIx64, start, end);
    667   1.8  riastrad 				return false;
    668   1.8  riastrad 			}
    669   1.8  riastrad 			/* XXX compression ratio bound */
    670   1.8  riastrad 			__CTASSERT(MAX_BLOCKSIZE <= (SIZE_MAX / 2));
    671   1.8  riastrad 			if ((2 * (size_t)S->blocksize) <= (end - start)) {
    672   1.8  riastrad 				warnx("block %"PRIu32" too large:"
    673   1.8  riastrad 				    " %"PRIu64" bytes",
    674   1.8  riastrad 				    blkno, (end - start));
    675   1.8  riastrad 				return false;
    676   1.8  riastrad 			}
    677   1.8  riastrad 		}
    678   1.8  riastrad 	}
    679   1.8  riastrad 
    680   1.8  riastrad 	if (blkno == 0) {
    681   1.8  riastrad 		warnx("no blocks were written; nothing to restart");
    682   1.8  riastrad 		return false;
    683   1.8  riastrad 	}
    684   1.8  riastrad 
    685   1.8  riastrad 	/* Make sure the rest of the offset table is all ones.  */
    686   1.8  riastrad 	if (blkno < S->n_blocks) {
    687   1.8  riastrad 		uint32_t nblkno;
    688   1.8  riastrad 
    689   1.8  riastrad 		for (nblkno = blkno; nblkno < S->n_blocks; nblkno++) {
    690   1.8  riastrad 			if (S->offset_table[nblkno] != ~(uint64_t)0) {
    691   1.8  riastrad 				warnx("bad partial offset table entry"
    692   1.8  riastrad 				    " at %"PRIu32": %"PRIu64,
    693   1.8  riastrad 				    nblkno,
    694   1.8  riastrad 				    be64toh(S->offset_table[nblkno]));
    695   1.8  riastrad 				return false;
    696   1.8  riastrad 			}
    697   1.8  riastrad 		}
    698   1.1   hubertf 	}
    699   1.8  riastrad 
    700   1.1   hubertf 	/*
    701   1.8  riastrad 	 * XXX Consider decompressing some number of blocks to make
    702   1.8  riastrad 	 * sure they match.
    703   1.1   hubertf 	 */
    704   1.8  riastrad 
    705   1.8  riastrad 	/* Back up by one.  */
    706   1.8  riastrad 	assert(1 <= blkno);
    707   1.8  riastrad 	blkno -= 1;
    708   1.8  riastrad 
    709   1.8  riastrad 	/* Seek to the input position.  */
    710   1.8  riastrad 	assert(S->size <= OFF_MAX);
    711   1.8  riastrad 	assert(blkno <= (S->size / S->blocksize));
    712   1.8  riastrad 	const off_t restart_position = ((off_t)blkno * (off_t)S->blocksize);
    713   1.8  riastrad 	assert(0 <= restart_position);
    714   1.8  riastrad 	assert(restart_position <= (off_t)S->size);
    715   1.8  riastrad 	if (lseek(S->image_fd, restart_position, SEEK_SET) == -1) {
    716   1.8  riastrad 		if (errno != ESPIPE) {
    717   1.8  riastrad 			warn("lseek input image failed");
    718   1.8  riastrad 			return false;
    719   1.8  riastrad 		}
    720   1.8  riastrad 
    721   1.8  riastrad 		/* Try read instead of lseek for a pipe/socket/fifo.  */
    722   1.8  riastrad 		void *const buffer = malloc(0x10000);
    723   1.8  riastrad 		if (buffer == NULL)
    724   1.8  riastrad 			err(1, "malloc temporary buffer");
    725   1.8  riastrad 		off_t left = restart_position;
    726   1.8  riastrad 		while (left > 0) {
    727   1.8  riastrad 			const size_t size = MIN(0x10000, left);
    728   1.8  riastrad 			const ssize_t n_read = read_block(S->image_fd, buffer,
    729   1.8  riastrad 			    size);
    730   1.8  riastrad 			if (n_read == -1) {
    731   1.8  riastrad 				free(buffer);
    732   1.8  riastrad 				warn("read of input image failed");
    733   1.8  riastrad 				return false;
    734   1.8  riastrad 			}
    735   1.8  riastrad 			assert(n_read >= 0);
    736   1.8  riastrad 			if ((size_t)n_read != size) {
    737   1.8  riastrad 				free(buffer);
    738   1.8  riastrad 				warnx("partial read of input image");
    739   1.8  riastrad 				return false;
    740   1.1   hubertf 			}
    741   1.8  riastrad 			assert((off_t)size <= left);
    742   1.8  riastrad 			left -= size;
    743   1.1   hubertf 		}
    744   1.8  riastrad 		free(buffer);
    745   1.8  riastrad 	}
    746   1.8  riastrad 
    747   1.8  riastrad 	/* Seek to the output position.  */
    748   1.8  riastrad 	const uint64_t offset = be64toh(S->offset_table[blkno]);
    749   1.8  riastrad 	assert(offset <= OFF_MAX);
    750   1.8  riastrad 	if (lseek(S->cloop2_fd, offset, SEEK_SET) == -1) {
    751   1.8  riastrad 		warn("lseek output cloop2 to %"PRIx64" failed",
    752   1.8  riastrad 		    S->offset);
    753   1.8  riastrad 		return false;
    754   1.1   hubertf 	}
    755   1.8  riastrad 
    756   1.8  riastrad 	/* Start where we left off.  */
    757   1.8  riastrad 	S->blkno = blkno;
    758   1.8  riastrad 	S->offset = offset;
    759   1.8  riastrad 	S->n_checkpointed_blocks = blkno;
    760   1.8  riastrad 
    761   1.8  riastrad 	/* Good to go and ready for interruption by a signal.  */
    762   1.8  riastrad 	S->initialized = 1;
    763   1.8  riastrad 
    764   1.8  riastrad 	/* Success!  */
    765   1.8  riastrad 	return true;
    766   1.8  riastrad }
    767   1.8  riastrad 
    768   1.8  riastrad /*
    769   1.8  riastrad  * Read a single block, compress it, and write the compressed block.
    770   1.8  riastrad  * Return the size of the compressed block.
    771   1.8  riastrad  */
    772   1.8  riastrad static uint32_t
    773   1.8  riastrad compress_block(int in_fd, int out_fd, uint32_t blkno, uint32_t blocksize,
    774   1.8  riastrad     uint32_t readsize, void *uncompbuf, void *compbuf)
    775   1.8  riastrad {
    776   1.8  riastrad 
    777   1.8  riastrad 	assert(readsize <= blocksize);
    778   1.8  riastrad 	assert(blocksize <= MAX_BLOCKSIZE);
    779   1.8  riastrad 
    780   1.8  riastrad 	/* Read the uncompressed block.  */
    781   1.8  riastrad 	const ssize_t n_read = read_block(in_fd, uncompbuf, readsize);
    782   1.8  riastrad 	if (n_read == -1)
    783   1.8  riastrad 		err(1, "read block %"PRIu32, blkno);
    784   1.8  riastrad 	assert(n_read >= 0);
    785  1.13  riastrad 	if ((size_t)n_read != readsize)
    786  1.13  riastrad 		errx(1, "partial read of block %"PRIu32": %zu != %"PRIu32,
    787  1.13  riastrad 		    blkno, (size_t)n_read, readsize);
    788   1.8  riastrad 
    789   1.8  riastrad 	/* Compress the block.  */
    790   1.8  riastrad 	/* XXX compression ratio bound */
    791   1.8  riastrad 	__CTASSERT(MAX_BLOCKSIZE <= (ULONG_MAX / 2));
    792   1.8  riastrad 	const unsigned long uncomplen =
    793   1.8  riastrad 	    (VNDCOMPRESS_COMPAT? blocksize : readsize); /* XXX */
    794   1.8  riastrad 	unsigned long complen = (uncomplen * 2);
    795   1.8  riastrad 	const int zerror = compress2(compbuf, &complen, uncompbuf, uncomplen,
    796   1.8  riastrad 	    Z_BEST_COMPRESSION);
    797   1.8  riastrad 	if (zerror != Z_OK)
    798   1.8  riastrad 		errx(1, "compressed failed at block %"PRIu32" (%d): %s", blkno,
    799   1.8  riastrad 		    zerror, zError(zerror));
    800   1.8  riastrad 	assert(complen <= (uncomplen * 2));
    801   1.8  riastrad 
    802   1.8  riastrad 	/* Write the compressed block.  */
    803   1.8  riastrad 	const ssize_t n_written = write(out_fd, compbuf, complen);
    804   1.8  riastrad 	if (n_written == -1)
    805   1.8  riastrad 		err(1, "write block %"PRIu32, blkno);
    806   1.8  riastrad 	assert(n_written >= 0);
    807  1.13  riastrad 	if ((size_t)n_written != complen)
    808  1.13  riastrad 		errx(1, "partial write of block %"PRIu32": %zu != %lu",
    809  1.13  riastrad 		    blkno, (size_t)n_written, complen);
    810   1.8  riastrad 
    811  1.13  riastrad 	return (size_t)n_written;
    812   1.1   hubertf }
    813   1.1   hubertf 
    814   1.1   hubertf /*
    815   1.8  riastrad  * Checkpoint if appropriate.
    816   1.1   hubertf  */
    817   1.8  riastrad static void
    818   1.8  riastrad compress_maybe_checkpoint(struct compress_state *S)
    819   1.1   hubertf {
    820   1.1   hubertf 
    821   1.8  riastrad 	if ((0 < S->checkpoint_blocks) && (0 < S->blkno) &&
    822   1.8  riastrad 	    ((S->blkno % S->checkpoint_blocks) == 0)) {
    823   1.8  riastrad 		assert(S->offset <= OFF_MAX);
    824   1.8  riastrad 		assert((off_t)S->offset == lseek(S->cloop2_fd, 0, SEEK_CUR));
    825   1.8  riastrad 		compress_checkpoint(S);
    826   1.1   hubertf 	}
    827   1.1   hubertf }
    828   1.1   hubertf 
    829   1.1   hubertf /*
    830   1.8  riastrad  * Write the prefix of the offset table that we have filled so far.
    831   1.8  riastrad  *
    832   1.8  riastrad  * We fsync the data blocks we have written, and then write the offset
    833   1.8  riastrad  * table, and then fsync the offset table and file metadata.  This
    834   1.8  riastrad  * should help to avoid offset tables that point at garbage data.
    835   1.8  riastrad  *
    836   1.8  riastrad  * This may be called from a signal handler, so it must not use stdio,
    837   1.8  riastrad  * malloc, &c. -- it may only (a) handle signal-safe state in S, and
    838   1.8  riastrad  * (b) do file descriptor I/O / fsync.
    839   1.8  riastrad  *
    840   1.8  riastrad  * XXX This requires further thought and heavy testing to be sure.
    841   1.8  riastrad  *
    842   1.8  riastrad  * XXX Should have an option to suppress fsync.
    843   1.8  riastrad  *
    844   1.8  riastrad  * XXX Should have an option to fail on fsync failures.
    845   1.8  riastrad  *
    846   1.8  riastrad  * XXX Would be nice if we could just do a barrier rather than an
    847   1.8  riastrad  * fsync.
    848   1.8  riastrad  *
    849   1.8  riastrad  * XXX How might we automatically test the fsyncs?
    850   1.1   hubertf  */
    851   1.7     joerg static void
    852   1.8  riastrad compress_checkpoint(struct compress_state *S)
    853   1.1   hubertf {
    854   1.8  riastrad 
    855   1.8  riastrad 	assert(S->blkno < S->n_offsets);
    856   1.8  riastrad 	const uint32_t n_offsets = (S->blkno + 1);
    857   1.8  riastrad 	assert(n_offsets <= S->n_offsets);
    858   1.8  riastrad 
    859   1.8  riastrad 	assert(S->offset <= OFF_MAX);
    860   1.8  riastrad 	assert((off_t)S->offset <= lseek(S->cloop2_fd, 0, SEEK_CUR));
    861   1.8  riastrad 
    862   1.8  riastrad 	/* Make sure the data hits the disk before we say it's ready.  */
    863   1.8  riastrad 	if (fsync_range(S->cloop2_fd, (FFILESYNC | FDISKSYNC), 0, S->offset)
    864   1.8  riastrad 	    == -1)
    865   1.8  riastrad 		warn_ss("fsync of output failed");
    866   1.8  riastrad 
    867   1.8  riastrad 	/* Say the data blocks are ready.  */
    868   1.8  riastrad 	const ssize_t n_written = pwrite(S->cloop2_fd, S->offset_table,
    869   1.8  riastrad 	    (n_offsets * sizeof(uint64_t)), CLOOP2_OFFSET_TABLE_OFFSET);
    870   1.8  riastrad 	if (n_written == -1)
    871   1.8  riastrad 		err_ss(1, "write partial offset table");
    872   1.8  riastrad 	assert(n_written >= 0);
    873   1.8  riastrad 	if ((size_t)n_written != (n_offsets * sizeof(uint64_t)))
    874  1.13  riastrad 		errx_ss(1, "partial write of partial offset table: %zu != %zu",
    875  1.13  riastrad 		    (size_t)n_written,
    876  1.13  riastrad 		    (size_t)(n_offsets * sizeof(uint64_t)));
    877   1.8  riastrad 
    878   1.1   hubertf 	/*
    879   1.8  riastrad 	 * If this is the first checkpoint, initialize the header.
    880   1.8  riastrad 	 * Signal handler can race with main code here, but it is
    881   1.8  riastrad 	 * harmless -- just an extra fsync and write of the header,
    882   1.8  riastrad 	 * which are both idempotent.
    883   1.1   hubertf 	 */
    884   1.8  riastrad 	if (S->n_checkpointed_blocks == 0) {
    885   1.8  riastrad 		static const struct cloop2_header zero_header;
    886   1.8  riastrad 		struct cloop2_header header = zero_header;
    887   1.8  riastrad 
    888   1.8  riastrad 		/* Force the offset table to disk before we set the header.  */
    889   1.8  riastrad 		if (fsync_range(S->cloop2_fd, (FFILESYNC | FDISKSYNC),
    890   1.8  riastrad 			0,
    891   1.8  riastrad 			(CLOOP2_OFFSET_TABLE_OFFSET
    892   1.8  riastrad 			    + (n_offsets * (sizeof(uint64_t)))))
    893   1.8  riastrad 		    == -1)
    894   1.8  riastrad 			warn_ss("fsync of offset table failed");
    895   1.8  riastrad 
    896   1.8  riastrad 		/* Subsequent writes will preserve a valid state.  */
    897   1.8  riastrad 
    898   1.8  riastrad 		/* Format the header.  */
    899   1.8  riastrad 		__CTASSERT(sizeof(cloop2_magic) <= sizeof(header.cl2h_magic));
    900   1.8  riastrad 		(void)memcpy(header.cl2h_magic, cloop2_magic,
    901   1.8  riastrad 		    sizeof(cloop2_magic));
    902   1.8  riastrad 		header.cl2h_blocksize = htobe32(S->blocksize);
    903   1.8  riastrad 		header.cl2h_n_blocks = htobe32(S->n_blocks);
    904   1.8  riastrad 
    905   1.8  riastrad 		/* Write the header.  */
    906   1.8  riastrad 		const ssize_t h_written = pwrite(S->cloop2_fd, &header,
    907   1.8  riastrad 		    sizeof(header), 0);
    908   1.8  riastrad 		if (h_written == -1)
    909   1.8  riastrad 			err_ss(1, "write header");
    910   1.8  riastrad 		assert(h_written >= 0);
    911   1.8  riastrad 		if ((size_t)h_written != sizeof(header))
    912  1.13  riastrad 			errx_ss(1, "partial write of header: %zu != %zu",
    913  1.13  riastrad 			    (size_t)h_written, sizeof(header));
    914   1.8  riastrad 	}
    915   1.8  riastrad 
    916   1.8  riastrad 	/* Record how many blocks we've checkpointed.  */
    917   1.8  riastrad     {
    918   1.8  riastrad 	sigset_t old_sigmask;
    919   1.8  riastrad 	block_signals(&old_sigmask);
    920   1.8  riastrad 	S->n_checkpointed_blocks = S->blkno;
    921   1.8  riastrad 	restore_sigmask(&old_sigmask);
    922   1.8  riastrad     }
    923   1.8  riastrad }
    924   1.8  riastrad 
    925   1.8  riastrad /*
    926   1.8  riastrad  * Release everything we allocated in compress_init.
    927   1.8  riastrad  */
    928   1.8  riastrad static void
    929   1.8  riastrad compress_exit(struct compress_state *S)
    930   1.8  riastrad {
    931   1.8  riastrad 
    932   1.8  riastrad 	/* Done with the offset table.  Free it.  */
    933   1.8  riastrad 	free(S->offset_table);
    934   1.8  riastrad 
    935   1.8  riastrad 	/* Done with the files.  Close them.  */
    936   1.8  riastrad 	if (close(S->cloop2_fd) == -1)
    937   1.8  riastrad 		warn("close(cloop2 fd)");
    938   1.8  riastrad 	if (close(S->image_fd) == -1)
    939   1.8  riastrad 		warn("close(image fd)");
    940   1.1   hubertf }
    941