You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
1105 lines
29 KiB
1105 lines
29 KiB
/*
|
|
* undo_io.c --- This is the undo io manager that copies the old data that
|
|
* copies the old data being overwritten into a tdb database
|
|
*
|
|
* Copyright IBM Corporation, 2007
|
|
* Author Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com>
|
|
*
|
|
* %Begin-Header%
|
|
* This file may be redistributed under the terms of the GNU Library
|
|
* General Public License, version 2.
|
|
* %End-Header%
|
|
*/
|
|
|
|
#ifndef _LARGEFILE_SOURCE
|
|
#define _LARGEFILE_SOURCE
|
|
#endif
|
|
#ifndef _LARGEFILE64_SOURCE
|
|
#define _LARGEFILE64_SOURCE
|
|
#endif
|
|
|
|
#include "config.h"
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#if HAVE_UNISTD_H
|
|
#include <unistd.h>
|
|
#endif
|
|
#if HAVE_ERRNO_H
|
|
#include <errno.h>
|
|
#endif
|
|
#include <fcntl.h>
|
|
#include <time.h>
|
|
#ifdef __linux__
|
|
#include <sys/utsname.h>
|
|
#endif
|
|
#if HAVE_SYS_STAT_H
|
|
#include <sys/stat.h>
|
|
#endif
|
|
#if HAVE_SYS_TYPES_H
|
|
#include <sys/types.h>
|
|
#endif
|
|
#if HAVE_SYS_RESOURCE_H
|
|
#include <sys/resource.h>
|
|
#endif
|
|
#include <limits.h>
|
|
|
|
#include "ext2_fs.h"
|
|
#include "ext2fs.h"
|
|
#include "ext2fsP.h"
|
|
|
|
#ifdef __GNUC__
|
|
#define ATTR(x) __attribute__(x)
|
|
#else
|
|
#define ATTR(x)
|
|
#endif
|
|
|
|
#undef DEBUG
|
|
|
|
#ifdef DEBUG
|
|
# define dbg_printf(f, a...) do {printf(f, ## a); fflush(stdout); } while (0)
|
|
#else
|
|
# define dbg_printf(f, a...)
|
|
#endif
|
|
|
|
/*
|
|
* For checking structure magic numbers...
|
|
*/
|
|
|
|
#define EXT2_CHECK_MAGIC(struct, code) \
|
|
if ((struct)->magic != (code)) return (code)
|
|
/*
|
|
* Undo file format: The file is cut up into undo_header.block_size blocks.
|
|
* The first block contains the header.
|
|
* The second block contains the superblock.
|
|
* There is then a repeating series of blocks as follows:
|
|
* A key block, which contains undo_keys to map the following data blocks.
|
|
* Data blocks
|
|
* (Note that there are pointers to the first key block and the sb, so this
|
|
* order isn't strictly necessary.)
|
|
*/
|
|
#define E2UNDO_MAGIC "E2UNDO02"
|
|
#define KEYBLOCK_MAGIC 0xCADECADE
|
|
|
|
#define E2UNDO_STATE_FINISHED 0x1 /* undo file is complete */
|
|
|
|
#define E2UNDO_MIN_BLOCK_SIZE 1024 /* undo blocks are no less than 1KB */
|
|
#define E2UNDO_MAX_BLOCK_SIZE 1048576 /* undo blocks are no more than 1MB */
|
|
|
|
struct undo_header {
|
|
char magic[8]; /* "E2UNDO02" */
|
|
__le64 num_keys; /* how many keys? */
|
|
__le64 super_offset; /* where in the file is the superblock copy? */
|
|
__le64 key_offset; /* where do the key/data block chunks start? */
|
|
__le32 block_size; /* block size of the undo file */
|
|
__le32 fs_block_size; /* block size of the target device */
|
|
__le32 sb_crc; /* crc32c of the superblock */
|
|
__le32 state; /* e2undo state flags */
|
|
__le32 f_compat; /* compatible features */
|
|
__le32 f_incompat; /* incompatible features (none so far) */
|
|
__le32 f_rocompat; /* ro compatible features (none so far) */
|
|
__le32 pad32; /* padding for fs_offset */
|
|
__le64 fs_offset; /* filesystem offset */
|
|
__u8 padding[436]; /* padding */
|
|
__le32 header_crc; /* crc32c of this header (but not this field) */
|
|
};
|
|
|
|
#define E2UNDO_MAX_EXTENT_BLOCKS 512 /* max extent size, in blocks */
|
|
|
|
struct undo_key {
|
|
__le64 fsblk; /* where in the fs does the block go */
|
|
__le32 blk_crc; /* crc32c of the block */
|
|
__le32 size; /* how many bytes in this block? */
|
|
};
|
|
|
|
struct undo_key_block {
|
|
__le32 magic; /* KEYBLOCK_MAGIC number */
|
|
__le32 crc; /* block checksum */
|
|
__le64 reserved; /* zero */
|
|
|
|
#if __STDC_VERSION__ >= 199901L
|
|
struct undo_key keys[]; /* keys, which come immediately after */
|
|
#else
|
|
struct undo_key keys[0]; /* keys, which come immediately after */
|
|
#endif
|
|
};
|
|
|
|
struct undo_private_data {
|
|
int magic;
|
|
|
|
/* the undo file io channel */
|
|
io_channel undo_file;
|
|
blk64_t undo_blk_num; /* next free block */
|
|
blk64_t key_blk_num; /* current key block location */
|
|
blk64_t super_blk_num; /* superblock location */
|
|
blk64_t first_key_blk; /* first key block location */
|
|
struct undo_key_block *keyb;
|
|
size_t num_keys, keys_in_block;
|
|
|
|
/* The backing io channel */
|
|
io_channel real;
|
|
|
|
unsigned long long tdb_data_size;
|
|
int tdb_written;
|
|
|
|
/* to support offset in unix I/O manager */
|
|
ext2_loff_t offset;
|
|
|
|
ext2fs_block_bitmap written_block_map;
|
|
struct struct_ext2_filsys fake_fs;
|
|
char *tdb_file;
|
|
struct undo_header hdr;
|
|
};
|
|
#define KEYS_PER_BLOCK(d) (((d)->tdb_data_size / sizeof(struct undo_key)) - 1)
|
|
|
|
#define E2UNDO_FEATURE_COMPAT_FS_OFFSET 0x1 /* the filesystem offset */
|
|
|
|
static inline void e2undo_set_feature_fs_offset(struct undo_header *header) {
|
|
header->f_compat |= ext2fs_le32_to_cpu(E2UNDO_FEATURE_COMPAT_FS_OFFSET);
|
|
}
|
|
|
|
static inline void e2undo_clear_feature_fs_offset(struct undo_header *header) {
|
|
header->f_compat &= ~ext2fs_le32_to_cpu(E2UNDO_FEATURE_COMPAT_FS_OFFSET);
|
|
}
|
|
|
|
static io_manager undo_io_backing_manager;
|
|
static char *tdb_file;
|
|
static int actual_size;
|
|
|
|
errcode_t set_undo_io_backing_manager(io_manager manager)
|
|
{
|
|
/*
|
|
* We may want to do some validation later
|
|
*/
|
|
undo_io_backing_manager = manager;
|
|
return 0;
|
|
}
|
|
|
|
errcode_t set_undo_io_backup_file(char *file_name)
|
|
{
|
|
tdb_file = strdup(file_name);
|
|
|
|
if (tdb_file == NULL) {
|
|
return EXT2_ET_NO_MEMORY;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static errcode_t write_undo_indexes(struct undo_private_data *data, int flush)
|
|
{
|
|
errcode_t retval;
|
|
struct ext2_super_block super;
|
|
io_channel channel;
|
|
int block_size;
|
|
__u32 sb_crc, hdr_crc;
|
|
|
|
/* Spit out a key block, if there's any data */
|
|
if (data->keys_in_block) {
|
|
data->keyb->magic = ext2fs_cpu_to_le32(KEYBLOCK_MAGIC);
|
|
data->keyb->crc = 0;
|
|
data->keyb->crc = ext2fs_cpu_to_le32(
|
|
ext2fs_crc32c_le(~0,
|
|
(unsigned char *)data->keyb,
|
|
data->tdb_data_size));
|
|
dbg_printf("Writing keyblock to blk %llu\n", data->key_blk_num);
|
|
retval = io_channel_write_blk64(data->undo_file,
|
|
data->key_blk_num,
|
|
1, data->keyb);
|
|
if (retval)
|
|
return retval;
|
|
/* Move on to the next key block if it's full. */
|
|
if (data->keys_in_block == KEYS_PER_BLOCK(data)) {
|
|
memset(data->keyb, 0, data->tdb_data_size);
|
|
data->keys_in_block = 0;
|
|
data->key_blk_num = data->undo_blk_num;
|
|
data->undo_blk_num++;
|
|
}
|
|
}
|
|
|
|
/* Prepare superblock for write */
|
|
channel = data->real;
|
|
block_size = channel->block_size;
|
|
|
|
io_channel_set_blksize(channel, SUPERBLOCK_OFFSET);
|
|
retval = io_channel_read_blk64(channel, 1, -SUPERBLOCK_SIZE, &super);
|
|
if (retval)
|
|
goto err_out;
|
|
sb_crc = ext2fs_crc32c_le(~0, (unsigned char *)&super, SUPERBLOCK_SIZE);
|
|
super.s_magic = ~super.s_magic;
|
|
|
|
/* Write the undo header to disk. */
|
|
memcpy(data->hdr.magic, E2UNDO_MAGIC, sizeof(data->hdr.magic));
|
|
data->hdr.num_keys = ext2fs_cpu_to_le64(data->num_keys);
|
|
data->hdr.super_offset = ext2fs_cpu_to_le64(data->super_blk_num);
|
|
data->hdr.key_offset = ext2fs_cpu_to_le64(data->first_key_blk);
|
|
data->hdr.fs_block_size = ext2fs_cpu_to_le32(block_size);
|
|
data->hdr.sb_crc = ext2fs_cpu_to_le32(sb_crc);
|
|
data->hdr.fs_offset = ext2fs_cpu_to_le64(data->offset);
|
|
if (data->offset)
|
|
e2undo_set_feature_fs_offset(&data->hdr);
|
|
else
|
|
e2undo_clear_feature_fs_offset(&data->hdr);
|
|
hdr_crc = ext2fs_crc32c_le(~0, (unsigned char *)&data->hdr,
|
|
sizeof(data->hdr) -
|
|
sizeof(data->hdr.header_crc));
|
|
data->hdr.header_crc = ext2fs_cpu_to_le32(hdr_crc);
|
|
retval = io_channel_write_blk64(data->undo_file, 0,
|
|
-(int)sizeof(data->hdr),
|
|
&data->hdr);
|
|
if (retval)
|
|
goto err_out;
|
|
|
|
/*
|
|
* Record the entire superblock (in FS byte order) so that we can't
|
|
* apply e2undo files to the wrong FS or out of order.
|
|
*/
|
|
dbg_printf("Writing superblock to block %llu\n", data->super_blk_num);
|
|
retval = io_channel_write_blk64(data->undo_file, data->super_blk_num,
|
|
-SUPERBLOCK_SIZE, &super);
|
|
if (retval)
|
|
goto err_out;
|
|
|
|
if (flush)
|
|
retval = io_channel_flush(data->undo_file);
|
|
err_out:
|
|
io_channel_set_blksize(channel, block_size);
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_setup_tdb(struct undo_private_data *data)
|
|
{
|
|
int i;
|
|
errcode_t retval;
|
|
|
|
if (data->tdb_written == 1)
|
|
return 0;
|
|
|
|
data->tdb_written = 1;
|
|
|
|
/* Make a bitmap to track what we've written */
|
|
memset(&data->fake_fs, 0, sizeof(data->fake_fs));
|
|
data->fake_fs.blocksize = data->tdb_data_size;
|
|
retval = ext2fs_alloc_generic_bmap(&data->fake_fs,
|
|
EXT2_ET_MAGIC_BLOCK_BITMAP64,
|
|
EXT2FS_BMAP64_RBTREE,
|
|
0, ~1ULL, ~1ULL,
|
|
"undo block map", &data->written_block_map);
|
|
if (retval)
|
|
return retval;
|
|
|
|
/* Allocate key block */
|
|
retval = ext2fs_get_mem(data->tdb_data_size, &data->keyb);
|
|
if (retval)
|
|
return retval;
|
|
data->key_blk_num = data->first_key_blk;
|
|
|
|
/* Record block size */
|
|
dbg_printf("Undo block size %llu\n", data->tdb_data_size);
|
|
dbg_printf("Keys per block %llu\n", KEYS_PER_BLOCK(data));
|
|
data->hdr.block_size = ext2fs_cpu_to_le32(data->tdb_data_size);
|
|
io_channel_set_blksize(data->undo_file, data->tdb_data_size);
|
|
|
|
/* Ensure that we have space for header blocks */
|
|
for (i = 0; i <= 2; i++) {
|
|
retval = io_channel_read_blk64(data->undo_file, i, 1,
|
|
data->keyb);
|
|
if (retval)
|
|
memset(data->keyb, 0, data->tdb_data_size);
|
|
retval = io_channel_write_blk64(data->undo_file, i, 1,
|
|
data->keyb);
|
|
if (retval)
|
|
return retval;
|
|
retval = io_channel_flush(data->undo_file);
|
|
if (retval)
|
|
return retval;
|
|
}
|
|
memset(data->keyb, 0, data->tdb_data_size);
|
|
return 0;
|
|
}
|
|
|
|
static errcode_t undo_write_tdb(io_channel channel,
|
|
unsigned long long block, int count)
|
|
|
|
{
|
|
int size, sz;
|
|
unsigned long long block_num, backing_blk_num;
|
|
errcode_t retval = 0;
|
|
ext2_loff_t offset;
|
|
struct undo_private_data *data;
|
|
unsigned char *read_ptr;
|
|
unsigned long long end_block;
|
|
unsigned long long data_size;
|
|
struct undo_key *key;
|
|
__u32 blk_crc;
|
|
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
|
|
if (data->undo_file == NULL) {
|
|
/*
|
|
* Transaction database not initialized
|
|
*/
|
|
return 0;
|
|
}
|
|
|
|
if (count == 1)
|
|
size = channel->block_size;
|
|
else {
|
|
if (count < 0)
|
|
size = -count;
|
|
else
|
|
size = count * channel->block_size;
|
|
}
|
|
|
|
retval = undo_setup_tdb(data);
|
|
if (retval)
|
|
return retval;
|
|
/*
|
|
* Data is stored in tdb database as blocks of tdb_data_size size
|
|
* This helps in efficient lookup further.
|
|
*
|
|
* We divide the disk to blocks of tdb_data_size.
|
|
*/
|
|
offset = (block * channel->block_size) + data->offset ;
|
|
block_num = offset / data->tdb_data_size;
|
|
end_block = (offset + size - 1) / data->tdb_data_size;
|
|
|
|
while (block_num <= end_block) {
|
|
__u32 keysz;
|
|
|
|
/*
|
|
* Check if we have the record already
|
|
*/
|
|
if (ext2fs_test_block_bitmap2(data->written_block_map,
|
|
block_num)) {
|
|
/* Try the next block */
|
|
block_num++;
|
|
continue;
|
|
}
|
|
ext2fs_mark_block_bitmap2(data->written_block_map, block_num);
|
|
|
|
/*
|
|
* Read one block using the backing I/O manager
|
|
* The backing I/O manager block size may be
|
|
* different from the tdb_data_size.
|
|
* Also we need to recalculate the block number with respect
|
|
* to the backing I/O manager.
|
|
*/
|
|
offset = block_num * data->tdb_data_size +
|
|
(data->offset % data->tdb_data_size);
|
|
backing_blk_num = (offset - data->offset) / channel->block_size;
|
|
|
|
retval = ext2fs_get_mem(data->tdb_data_size, &read_ptr);
|
|
if (retval) {
|
|
return retval;
|
|
}
|
|
|
|
memset(read_ptr, 0, data->tdb_data_size);
|
|
actual_size = 0;
|
|
if ((data->tdb_data_size % channel->block_size) == 0)
|
|
sz = data->tdb_data_size / channel->block_size;
|
|
else
|
|
sz = -data->tdb_data_size;
|
|
retval = io_channel_read_blk64(data->real, backing_blk_num,
|
|
sz, read_ptr);
|
|
if (retval) {
|
|
if (retval != EXT2_ET_SHORT_READ) {
|
|
free(read_ptr);
|
|
return retval;
|
|
}
|
|
/*
|
|
* short read so update the record size
|
|
* accordingly
|
|
*/
|
|
data_size = actual_size;
|
|
} else {
|
|
data_size = data->tdb_data_size;
|
|
}
|
|
if (data_size == 0) {
|
|
free(read_ptr);
|
|
block_num++;
|
|
continue;
|
|
}
|
|
dbg_printf("Read %llu bytes from FS block %llu (blk=%llu cnt=%llu)\n",
|
|
data_size, backing_blk_num, block, data->tdb_data_size);
|
|
if ((data_size % data->undo_file->block_size) == 0)
|
|
sz = data_size / data->undo_file->block_size;
|
|
else
|
|
sz = -data_size;;
|
|
/* extend this key? */
|
|
if (data->keys_in_block) {
|
|
key = data->keyb->keys + data->keys_in_block - 1;
|
|
keysz = ext2fs_le32_to_cpu(key->size);
|
|
} else {
|
|
key = NULL;
|
|
keysz = 0;
|
|
}
|
|
if (key != NULL &&
|
|
(ext2fs_le64_to_cpu(key->fsblk) * channel->block_size +
|
|
channel->block_size - 1 +
|
|
keysz) / channel->block_size == backing_blk_num &&
|
|
E2UNDO_MAX_EXTENT_BLOCKS * data->tdb_data_size >
|
|
keysz + data_size) {
|
|
blk_crc = ext2fs_le32_to_cpu(key->blk_crc);
|
|
blk_crc = ext2fs_crc32c_le(blk_crc, read_ptr, data_size);
|
|
key->blk_crc = ext2fs_cpu_to_le32(blk_crc);
|
|
key->size = ext2fs_cpu_to_le32(keysz + data_size);
|
|
} else {
|
|
data->num_keys++;
|
|
key = data->keyb->keys + data->keys_in_block;
|
|
data->keys_in_block++;
|
|
key->fsblk = ext2fs_cpu_to_le64(backing_blk_num);
|
|
blk_crc = ext2fs_crc32c_le(~0, read_ptr, data_size);
|
|
key->blk_crc = ext2fs_cpu_to_le32(blk_crc);
|
|
key->size = ext2fs_cpu_to_le32(data_size);
|
|
}
|
|
dbg_printf("Writing block %llu to offset %llu size %d key %zu\n",
|
|
block_num,
|
|
data->undo_blk_num,
|
|
sz, data->num_keys - 1);
|
|
retval = io_channel_write_blk64(data->undo_file,
|
|
data->undo_blk_num, sz, read_ptr);
|
|
if (retval) {
|
|
free(read_ptr);
|
|
return retval;
|
|
}
|
|
data->undo_blk_num++;
|
|
free(read_ptr);
|
|
|
|
/* Write out the key block */
|
|
retval = write_undo_indexes(data, 0);
|
|
if (retval)
|
|
return retval;
|
|
|
|
/* Next block */
|
|
block_num++;
|
|
}
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_io_read_error(io_channel channel ATTR((unused)),
|
|
unsigned long block ATTR((unused)),
|
|
int count ATTR((unused)),
|
|
void *data ATTR((unused)),
|
|
size_t size ATTR((unused)),
|
|
int actual,
|
|
errcode_t error ATTR((unused)))
|
|
{
|
|
actual_size = actual;
|
|
return error;
|
|
}
|
|
|
|
static void undo_err_handler_init(io_channel channel)
|
|
{
|
|
channel->read_error = undo_io_read_error;
|
|
}
|
|
|
|
static int check_filesystem(struct undo_header *hdr, io_channel undo_file,
|
|
unsigned int blocksize, blk64_t super_block,
|
|
io_channel channel)
|
|
{
|
|
struct ext2_super_block super, *sb;
|
|
char *buf;
|
|
__u32 sb_crc;
|
|
errcode_t retval;
|
|
|
|
io_channel_set_blksize(channel, SUPERBLOCK_OFFSET);
|
|
retval = io_channel_read_blk64(channel, 1, -SUPERBLOCK_SIZE, &super);
|
|
if (retval)
|
|
return retval;
|
|
|
|
/*
|
|
* Compare the FS and the undo file superblock so that we don't
|
|
* append to something that doesn't match this FS.
|
|
*/
|
|
retval = ext2fs_get_mem(blocksize, &buf);
|
|
if (retval)
|
|
return retval;
|
|
retval = io_channel_read_blk64(undo_file, super_block,
|
|
-SUPERBLOCK_SIZE, buf);
|
|
if (retval)
|
|
goto out;
|
|
sb = (struct ext2_super_block *)buf;
|
|
sb->s_magic = ~sb->s_magic;
|
|
if (memcmp(&super, buf, sizeof(super))) {
|
|
retval = -1;
|
|
goto out;
|
|
}
|
|
sb_crc = ext2fs_crc32c_le(~0, (unsigned char *)buf, SUPERBLOCK_SIZE);
|
|
if (ext2fs_le32_to_cpu(hdr->sb_crc) != sb_crc) {
|
|
retval = -1;
|
|
goto out;
|
|
}
|
|
|
|
out:
|
|
ext2fs_free_mem(&buf);
|
|
return retval;
|
|
}
|
|
|
|
/*
|
|
* Try to re-open the undo file, so that we can resume where we left off.
|
|
* That way, the user can pass the same undo file to various programs as
|
|
* part of an FS upgrade instead of having to create multiple files and
|
|
* then apply them in correct order.
|
|
*/
|
|
static errcode_t try_reopen_undo_file(int undo_fd,
|
|
struct undo_private_data *data)
|
|
{
|
|
struct undo_header hdr;
|
|
struct undo_key *dkey;
|
|
ext2fs_struct_stat statbuf;
|
|
unsigned int blocksize, fs_blocksize;
|
|
blk64_t super_block, lblk;
|
|
size_t num_keys, keys_per_block, i;
|
|
__u32 hdr_crc, key_crc;
|
|
errcode_t retval;
|
|
|
|
/* Zero size already? */
|
|
retval = ext2fs_fstat(undo_fd, &statbuf);
|
|
if (retval)
|
|
goto bad_file;
|
|
if (statbuf.st_size == 0)
|
|
goto out;
|
|
|
|
/* check the file header */
|
|
retval = io_channel_read_blk64(data->undo_file, 0, -(int)sizeof(hdr),
|
|
&hdr);
|
|
if (retval)
|
|
goto bad_file;
|
|
|
|
if (memcmp(hdr.magic, E2UNDO_MAGIC,
|
|
sizeof(hdr.magic)))
|
|
goto bad_file;
|
|
hdr_crc = ext2fs_crc32c_le(~0, (unsigned char *)&hdr,
|
|
sizeof(struct undo_header) -
|
|
sizeof(__u32));
|
|
if (ext2fs_le32_to_cpu(hdr.header_crc) != hdr_crc)
|
|
goto bad_file;
|
|
blocksize = ext2fs_le32_to_cpu(hdr.block_size);
|
|
fs_blocksize = ext2fs_le32_to_cpu(hdr.fs_block_size);
|
|
if (blocksize > E2UNDO_MAX_BLOCK_SIZE ||
|
|
blocksize < E2UNDO_MIN_BLOCK_SIZE ||
|
|
!blocksize || !fs_blocksize)
|
|
goto bad_file;
|
|
super_block = ext2fs_le64_to_cpu(hdr.super_offset);
|
|
num_keys = ext2fs_le64_to_cpu(hdr.num_keys);
|
|
io_channel_set_blksize(data->undo_file, blocksize);
|
|
/*
|
|
* Do not compare hdr.f_compat with the available compatible
|
|
* features set, because a "missing" compatible feature should
|
|
* not cause any problems.
|
|
*/
|
|
if (hdr.f_incompat || hdr.f_rocompat)
|
|
goto bad_file;
|
|
|
|
/* Superblock matches this FS? */
|
|
if (check_filesystem(&hdr, data->undo_file, blocksize, super_block,
|
|
data->real) != 0) {
|
|
retval = EXT2_ET_UNDO_FILE_WRONG;
|
|
goto out;
|
|
}
|
|
|
|
/* Try to set ourselves up */
|
|
data->tdb_data_size = blocksize;
|
|
retval = undo_setup_tdb(data);
|
|
if (retval)
|
|
goto bad_file;
|
|
data->num_keys = num_keys;
|
|
data->super_blk_num = super_block;
|
|
data->first_key_blk = ext2fs_le64_to_cpu(hdr.key_offset);
|
|
|
|
/* load the written block map */
|
|
keys_per_block = KEYS_PER_BLOCK(data);
|
|
lblk = data->first_key_blk;
|
|
dbg_printf("nr_keys=%lu, kpb=%zu, blksz=%u\n",
|
|
num_keys, keys_per_block, blocksize);
|
|
for (i = 0; i < num_keys; i += keys_per_block) {
|
|
size_t j, max_j;
|
|
__le32 crc;
|
|
|
|
data->key_blk_num = lblk;
|
|
retval = io_channel_read_blk64(data->undo_file,
|
|
lblk, 1, data->keyb);
|
|
if (retval)
|
|
goto bad_key_replay;
|
|
|
|
/* check keys */
|
|
if (ext2fs_le32_to_cpu(data->keyb->magic) != KEYBLOCK_MAGIC) {
|
|
retval = EXT2_ET_UNDO_FILE_CORRUPT;
|
|
goto bad_key_replay;
|
|
}
|
|
crc = data->keyb->crc;
|
|
data->keyb->crc = 0;
|
|
key_crc = ext2fs_crc32c_le(~0, (unsigned char *)data->keyb,
|
|
blocksize);
|
|
if (ext2fs_le32_to_cpu(crc) != key_crc) {
|
|
retval = EXT2_ET_UNDO_FILE_CORRUPT;
|
|
goto bad_key_replay;
|
|
}
|
|
|
|
/* load keys from key block */
|
|
lblk++;
|
|
max_j = data->num_keys - i;
|
|
if (max_j > keys_per_block)
|
|
max_j = keys_per_block;
|
|
for (j = 0, dkey = data->keyb->keys;
|
|
j < max_j;
|
|
j++, dkey++) {
|
|
blk64_t fsblk = ext2fs_le64_to_cpu(dkey->fsblk);
|
|
blk64_t undo_blk = fsblk * fs_blocksize / blocksize;
|
|
size_t size = ext2fs_le32_to_cpu(dkey->size);
|
|
|
|
ext2fs_mark_block_bitmap_range2(data->written_block_map,
|
|
undo_blk,
|
|
(size + blocksize - 1) / blocksize);
|
|
lblk += (size + blocksize - 1) / blocksize;
|
|
data->undo_blk_num = lblk;
|
|
data->keys_in_block = j + 1;
|
|
}
|
|
}
|
|
dbg_printf("Reopen undo, keyblk=%llu undoblk=%llu nrkeys=%zu kib=%zu\n",
|
|
data->key_blk_num, data->undo_blk_num, data->num_keys,
|
|
data->keys_in_block);
|
|
|
|
data->hdr.state = hdr.state & ~E2UNDO_STATE_FINISHED;
|
|
data->hdr.f_compat = hdr.f_compat;
|
|
data->hdr.f_incompat = hdr.f_incompat;
|
|
data->hdr.f_rocompat = hdr.f_rocompat;
|
|
return retval;
|
|
|
|
bad_key_replay:
|
|
data->key_blk_num = data->undo_blk_num = 0;
|
|
data->keys_in_block = 0;
|
|
ext2fs_free_mem(&data->keyb);
|
|
ext2fs_free_generic_bitmap(data->written_block_map);
|
|
data->tdb_written = 0;
|
|
goto out;
|
|
bad_file:
|
|
retval = EXT2_ET_UNDO_FILE_CORRUPT;
|
|
out:
|
|
return retval;
|
|
}
|
|
|
|
static void undo_atexit(void *p)
|
|
{
|
|
struct undo_private_data *data = p;
|
|
errcode_t err;
|
|
|
|
err = write_undo_indexes(data, 1);
|
|
io_channel_close(data->undo_file);
|
|
|
|
com_err(data->tdb_file, err, "while force-closing undo file");
|
|
}
|
|
|
|
static errcode_t undo_open(const char *name, int flags, io_channel *channel)
|
|
{
|
|
io_channel io = NULL;
|
|
struct undo_private_data *data = NULL;
|
|
int undo_fd = -1;
|
|
errcode_t retval;
|
|
|
|
if (name == 0)
|
|
return EXT2_ET_BAD_DEVICE_NAME;
|
|
retval = ext2fs_get_mem(sizeof(struct struct_io_channel), &io);
|
|
if (retval)
|
|
goto cleanup;
|
|
memset(io, 0, sizeof(struct struct_io_channel));
|
|
io->magic = EXT2_ET_MAGIC_IO_CHANNEL;
|
|
retval = ext2fs_get_mem(sizeof(struct undo_private_data), &data);
|
|
if (retval)
|
|
goto cleanup;
|
|
|
|
io->manager = undo_io_manager;
|
|
retval = ext2fs_get_mem(strlen(name)+1, &io->name);
|
|
if (retval)
|
|
goto cleanup;
|
|
|
|
strcpy(io->name, name);
|
|
io->private_data = data;
|
|
io->block_size = 1024;
|
|
io->read_error = 0;
|
|
io->write_error = 0;
|
|
io->refcount = 1;
|
|
|
|
memset(data, 0, sizeof(struct undo_private_data));
|
|
data->magic = EXT2_ET_MAGIC_UNIX_IO_CHANNEL;
|
|
data->super_blk_num = 1;
|
|
data->first_key_blk = 2;
|
|
data->undo_blk_num = 3;
|
|
|
|
if (undo_io_backing_manager) {
|
|
retval = undo_io_backing_manager->open(name, flags,
|
|
&data->real);
|
|
if (retval)
|
|
goto cleanup;
|
|
|
|
data->tdb_file = strdup(tdb_file);
|
|
if (data->tdb_file == NULL)
|
|
goto cleanup;
|
|
undo_fd = ext2fs_open_file(data->tdb_file, O_RDWR | O_CREAT,
|
|
0600);
|
|
if (undo_fd < 0)
|
|
goto cleanup;
|
|
|
|
retval = undo_io_backing_manager->open(data->tdb_file,
|
|
IO_FLAG_RW,
|
|
&data->undo_file);
|
|
if (retval)
|
|
goto cleanup;
|
|
} else {
|
|
data->real = NULL;
|
|
data->undo_file = NULL;
|
|
}
|
|
|
|
if (data->real)
|
|
io->flags = (io->flags & ~CHANNEL_FLAGS_DISCARD_ZEROES) |
|
|
(data->real->flags & CHANNEL_FLAGS_DISCARD_ZEROES);
|
|
|
|
/*
|
|
* setup err handler for read so that we know
|
|
* when the backing manager fails do short read
|
|
*/
|
|
if (data->real)
|
|
undo_err_handler_init(data->real);
|
|
|
|
if (data->undo_file) {
|
|
retval = try_reopen_undo_file(undo_fd, data);
|
|
if (retval)
|
|
goto cleanup;
|
|
}
|
|
retval = ext2fs_add_exit_fn(undo_atexit, data);
|
|
if (retval)
|
|
goto cleanup;
|
|
|
|
*channel = io;
|
|
if (undo_fd >= 0)
|
|
close(undo_fd);
|
|
return retval;
|
|
|
|
cleanup:
|
|
ext2fs_remove_exit_fn(undo_atexit, data);
|
|
if (undo_fd >= 0)
|
|
close(undo_fd);
|
|
if (data && data->undo_file)
|
|
io_channel_close(data->undo_file);
|
|
if (data && data->tdb_file)
|
|
free(data->tdb_file);
|
|
if (data && data->real)
|
|
io_channel_close(data->real);
|
|
if (data)
|
|
ext2fs_free_mem(&data);
|
|
if (io)
|
|
ext2fs_free_mem(&io);
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_close(io_channel channel)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t err, retval = 0;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (--channel->refcount > 0)
|
|
return 0;
|
|
/* Before closing write the file system identity */
|
|
if (!getenv("UNDO_IO_SIMULATE_UNFINISHED"))
|
|
data->hdr.state = ext2fs_cpu_to_le32(E2UNDO_STATE_FINISHED);
|
|
err = write_undo_indexes(data, 1);
|
|
ext2fs_remove_exit_fn(undo_atexit, data);
|
|
if (data->real)
|
|
retval = io_channel_close(data->real);
|
|
if (data->tdb_file)
|
|
free(data->tdb_file);
|
|
if (data->undo_file)
|
|
io_channel_close(data->undo_file);
|
|
ext2fs_free_mem(&data->keyb);
|
|
if (data->written_block_map)
|
|
ext2fs_free_generic_bitmap(data->written_block_map);
|
|
ext2fs_free_mem(&channel->private_data);
|
|
if (channel->name)
|
|
ext2fs_free_mem(&channel->name);
|
|
ext2fs_free_mem(&channel);
|
|
|
|
if (err)
|
|
return err;
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_set_blksize(io_channel channel, int blksize)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t retval = 0;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (blksize > E2UNDO_MAX_BLOCK_SIZE || blksize < E2UNDO_MIN_BLOCK_SIZE)
|
|
return EXT2_ET_INVALID_ARGUMENT;
|
|
|
|
if (data->real)
|
|
retval = io_channel_set_blksize(data->real, blksize);
|
|
/*
|
|
* Set the block size used for tdb
|
|
*/
|
|
if (!data->tdb_data_size || !data->tdb_written)
|
|
data->tdb_data_size = blksize;
|
|
channel->block_size = blksize;
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_read_blk64(io_channel channel, unsigned long long block,
|
|
int count, void *buf)
|
|
{
|
|
errcode_t retval = 0;
|
|
struct undo_private_data *data;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (data->real)
|
|
retval = io_channel_read_blk64(data->real, block, count, buf);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_read_blk(io_channel channel, unsigned long block,
|
|
int count, void *buf)
|
|
{
|
|
return undo_read_blk64(channel, block, count, buf);
|
|
}
|
|
|
|
static errcode_t undo_write_blk64(io_channel channel, unsigned long long block,
|
|
int count, const void *buf)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t retval = 0;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
/*
|
|
* First write the existing content into database
|
|
*/
|
|
retval = undo_write_tdb(channel, block, count);
|
|
if (retval)
|
|
return retval;
|
|
if (data->real)
|
|
retval = io_channel_write_blk64(data->real, block, count, buf);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_write_blk(io_channel channel, unsigned long block,
|
|
int count, const void *buf)
|
|
{
|
|
return undo_write_blk64(channel, block, count, buf);
|
|
}
|
|
|
|
static errcode_t undo_write_byte(io_channel channel, unsigned long offset,
|
|
int size, const void *buf)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t retval = 0;
|
|
ext2_loff_t location;
|
|
unsigned long blk_num, count;;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
location = offset + data->offset;
|
|
blk_num = location/channel->block_size;
|
|
/*
|
|
* the size specified may spread across multiple blocks
|
|
* also make sure we account for the fact that block start
|
|
* offset for tdb is different from the backing I/O manager
|
|
* due to possible different block size
|
|
*/
|
|
count = (size + (location % channel->block_size) +
|
|
channel->block_size -1)/channel->block_size;
|
|
retval = undo_write_tdb(channel, blk_num, count);
|
|
if (retval)
|
|
return retval;
|
|
if (data->real && data->real->manager->write_byte)
|
|
retval = io_channel_write_byte(data->real, offset, size, buf);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_discard(io_channel channel, unsigned long long block,
|
|
unsigned long long count)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t retval = 0;
|
|
int icount;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (count > INT_MAX)
|
|
return EXT2_ET_UNIMPLEMENTED;
|
|
icount = count;
|
|
|
|
/*
|
|
* First write the existing content into database
|
|
*/
|
|
retval = undo_write_tdb(channel, block, icount);
|
|
if (retval)
|
|
return retval;
|
|
if (data->real)
|
|
retval = io_channel_discard(data->real, block, count);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_zeroout(io_channel channel, unsigned long long block,
|
|
unsigned long long count)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t retval = 0;
|
|
int icount;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (count > INT_MAX)
|
|
return EXT2_ET_UNIMPLEMENTED;
|
|
icount = count;
|
|
|
|
/*
|
|
* First write the existing content into database
|
|
*/
|
|
retval = undo_write_tdb(channel, block, icount);
|
|
if (retval)
|
|
return retval;
|
|
if (data->real)
|
|
retval = io_channel_zeroout(data->real, block, count);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_cache_readahead(io_channel channel,
|
|
unsigned long long block,
|
|
unsigned long long count)
|
|
{
|
|
struct undo_private_data *data;
|
|
errcode_t retval = 0;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (data->real)
|
|
retval = io_channel_cache_readahead(data->real, block, count);
|
|
|
|
return retval;
|
|
}
|
|
|
|
/*
|
|
* Flush data buffers to disk.
|
|
*/
|
|
static errcode_t undo_flush(io_channel channel)
|
|
{
|
|
errcode_t retval = 0;
|
|
struct undo_private_data *data;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (data->real)
|
|
retval = io_channel_flush(data->real);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_set_option(io_channel channel, const char *option,
|
|
const char *arg)
|
|
{
|
|
errcode_t retval = 0;
|
|
struct undo_private_data *data;
|
|
unsigned long tmp;
|
|
char *end;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (!strcmp(option, "tdb_data_size")) {
|
|
if (!arg)
|
|
return EXT2_ET_INVALID_ARGUMENT;
|
|
|
|
tmp = strtoul(arg, &end, 0);
|
|
if (*end)
|
|
return EXT2_ET_INVALID_ARGUMENT;
|
|
if (tmp > E2UNDO_MAX_BLOCK_SIZE || tmp < E2UNDO_MIN_BLOCK_SIZE)
|
|
return EXT2_ET_INVALID_ARGUMENT;
|
|
if (!data->tdb_data_size || !data->tdb_written) {
|
|
data->tdb_written = -1;
|
|
data->tdb_data_size = tmp;
|
|
}
|
|
return 0;
|
|
}
|
|
/*
|
|
* Need to support offset option to work with
|
|
* Unix I/O manager
|
|
*/
|
|
if (data->real && data->real->manager->set_option) {
|
|
retval = data->real->manager->set_option(data->real,
|
|
option, arg);
|
|
}
|
|
if (!retval && !strcmp(option, "offset")) {
|
|
if (!arg)
|
|
return EXT2_ET_INVALID_ARGUMENT;
|
|
|
|
tmp = strtoul(arg, &end, 0);
|
|
if (*end)
|
|
return EXT2_ET_INVALID_ARGUMENT;
|
|
data->offset = tmp;
|
|
}
|
|
return retval;
|
|
}
|
|
|
|
static errcode_t undo_get_stats(io_channel channel, io_stats *stats)
|
|
{
|
|
errcode_t retval = 0;
|
|
struct undo_private_data *data;
|
|
|
|
EXT2_CHECK_MAGIC(channel, EXT2_ET_MAGIC_IO_CHANNEL);
|
|
data = (struct undo_private_data *) channel->private_data;
|
|
EXT2_CHECK_MAGIC(data, EXT2_ET_MAGIC_UNIX_IO_CHANNEL);
|
|
|
|
if (data->real)
|
|
retval = (data->real->manager->get_stats)(data->real, stats);
|
|
|
|
return retval;
|
|
}
|
|
|
|
static struct struct_io_manager struct_undo_manager = {
|
|
.magic = EXT2_ET_MAGIC_IO_MANAGER,
|
|
.name = "Undo I/O Manager",
|
|
.open = undo_open,
|
|
.close = undo_close,
|
|
.set_blksize = undo_set_blksize,
|
|
.read_blk = undo_read_blk,
|
|
.write_blk = undo_write_blk,
|
|
.flush = undo_flush,
|
|
.write_byte = undo_write_byte,
|
|
.set_option = undo_set_option,
|
|
.get_stats = undo_get_stats,
|
|
.read_blk64 = undo_read_blk64,
|
|
.write_blk64 = undo_write_blk64,
|
|
.discard = undo_discard,
|
|
.zeroout = undo_zeroout,
|
|
.cache_readahead = undo_cache_readahead,
|
|
};
|
|
|
|
io_manager undo_io_manager = &struct_undo_manager;
|