/*
 * You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 *
 * 546 lines
 * 14 KiB
 */

// SPDX-License-Identifier: GPL-2.0+
/*
* erofs-utils/lib/compress.c
*
* Copyright (C) 2018-2019 HUAWEI, Inc.
* http://www.huawei.com/
* Created by Miao Xie <miaoxie@huawei.com>
* with heavy changes by Gao Xiang <gaoxiang25@huawei.com>
*/
#ifndef _LARGEFILE64_SOURCE
#define _LARGEFILE64_SOURCE
#endif
#include <string.h>
#include <stdlib.h>
#include <unistd.h>
#include "erofs/print.h"
#include "erofs/io.h"
#include "erofs/cache.h"
#include "erofs/compress.h"
#include "compressor.h"
/* handle of the primary compressor; set up by z_erofs_compress_init() */
static struct erofs_compress compresshandle;
/* level handed to erofs_compress_destsize(); chosen in z_erofs_compress_init() */
static int compressionlevel;
/*
 * map header filled in by z_erofs_compress_init() and copied to the start of
 * inode->compressmeta by z_erofs_convert_to_compacted_format()
 */
static struct z_erofs_map_header mapheader;
/* per-file working state shared by the compression helpers in this file */
struct z_erofs_vle_compress_ctx {
/* write cursor into the index buffer; advanced by one index per entry written */
u8 *metacur;
/* staging buffer for file data: filled at tail by read(), consumed from head */
u8 queue[EROFS_CONFIG_COMPR_MAX_SZ * 2];
/* queue[head, tail) is the data that has not been written out yet */
unsigned int head, tail;
erofs_blk_t blkaddr; /* pointing to the next blkaddr */
/* offset within the current logical block at which the next extent starts */
u16 clusterofs;
};
/*
 * Bytes reserved in front of the legacy indexes: the map header itself
 * plus the legacy header padding.
 */
#define Z_EROFS_LEGACY_MAP_HEADER_SIZE \
(sizeof(struct z_erofs_map_header) + Z_EROFS_VLE_LEGACY_HEADER_PADDING)
/*
 * Number of bytes needed to hold the legacy metadata of a file that is
 * @filesize bytes long: the legacy map header followed by one
 * decompressed index for every block of the file (rounded up).
 */
static unsigned int vle_compressmeta_capacity(erofs_off_t filesize)
{
	unsigned int total = Z_EROFS_LEGACY_MAP_HEADER_SIZE;

	total += BLK_ROUND_UP(filesize) *
		 sizeof(struct z_erofs_vle_decompressed_index);
	return total;
}
static void vle_write_indexes_final(struct z_erofs_vle_compress_ctx *ctx)
{
const unsigned int type = Z_EROFS_VLE_CLUSTER_TYPE_PLAIN;
struct z_erofs_vle_decompressed_index di;
if (!ctx->clusterofs)
return;
di.di_clusterofs = cpu_to_le16(ctx->clusterofs);
di.di_u.blkaddr = 0;
di.di_advise = cpu_to_le16(type << Z_EROFS_VLE_DI_CLUSTER_TYPE_BIT);
memcpy(ctx->metacur, &di, sizeof(di));
ctx->metacur += sizeof(di);
}
static void vle_write_indexes(struct z_erofs_vle_compress_ctx *ctx,
unsigned int count, bool raw)
{
unsigned int clusterofs = ctx->clusterofs;
unsigned int d0 = 0, d1 = (clusterofs + count) / EROFS_BLKSIZ;
struct z_erofs_vle_decompressed_index di;
unsigned int type;
__le16 advise;
di.di_clusterofs = cpu_to_le16(ctx->clusterofs);
/* whether the tail-end (un)compressed block or not */
if (!d1) {
type = raw ? Z_EROFS_VLE_CLUSTER_TYPE_PLAIN :
Z_EROFS_VLE_CLUSTER_TYPE_HEAD;
advise = cpu_to_le16(type << Z_EROFS_VLE_DI_CLUSTER_TYPE_BIT);
di.di_advise = advise;
di.di_u.blkaddr = cpu_to_le32(ctx->blkaddr);
memcpy(ctx->metacur, &di, sizeof(di));
ctx->metacur += sizeof(di);
/* don't add the final index if the tail-end block exists */
ctx->clusterofs = 0;
return;
}
do {
if (d0) {
type = Z_EROFS_VLE_CLUSTER_TYPE_NONHEAD;
di.di_u.delta[0] = cpu_to_le16(d0);
di.di_u.delta[1] = cpu_to_le16(d1);
} else {
type = raw ? Z_EROFS_VLE_CLUSTER_TYPE_PLAIN :
Z_EROFS_VLE_CLUSTER_TYPE_HEAD;
di.di_u.blkaddr = cpu_to_le32(ctx->blkaddr);
}
advise = cpu_to_le16(type << Z_EROFS_VLE_DI_CLUSTER_TYPE_BIT);
di.di_advise = advise;
memcpy(ctx->metacur, &di, sizeof(di));
ctx->metacur += sizeof(di);
count -= EROFS_BLKSIZ - clusterofs;
clusterofs = 0;
++d0;
--d1;
} while (clusterofs + count >= EROFS_BLKSIZ);
ctx->clusterofs = clusterofs + count;
}
/*
 * Store up to one block of queued data uncompressed at ctx->blkaddr.
 *
 * When the lz4_0padding feature is off and enough data precedes
 * ctx->head, the head is moved back by ctx->clusterofs (and *len grown
 * by the same amount) so that the block starts at clusterofs 0.
 * The remainder of the block is zero-filled.  @dst is the scratch
 * buffer of at least EROFS_BLKSIZ bytes that is handed to blk_write().
 *
 * Returns the number of bytes taken from the queue, or the non-zero
 * result of blk_write() on failure.
 */
static int write_uncompressed_block(struct z_erofs_vle_compress_ctx *ctx,
				    unsigned int *len,
				    char *dst)
{
	unsigned int nbytes;
	int err;

	/* reset clusterofs to 0 if permitted */
	if (!erofs_sb_has_lz4_0padding()) {
		if (ctx->head >= ctx->clusterofs) {
			ctx->head -= ctx->clusterofs;
			*len += ctx->clusterofs;
			ctx->clusterofs = 0;
		}
	}

	/* write uncompressed data */
	nbytes = min(EROFS_BLKSIZ, *len);
	memcpy(dst, ctx->queue + ctx->head, nbytes);
	memset(dst + nbytes, 0, EROFS_BLKSIZ - nbytes);

	erofs_dbg("Writing %u uncompressed data to block %u",
		  nbytes, ctx->blkaddr);

	err = blk_write(dst, ctx->blkaddr, 1);
	if (err)
		return err;
	return nbytes;
}
/*
 * Consume queued data (ctx->queue[head, tail)) one output block at a time.
 *
 * Each iteration either compresses a run of input into a single block or,
 * if compression fails or only the final short tail is left, stores one
 * block uncompressed; the matching indexes are then appended through
 * vle_write_indexes().
 *
 * @final: false while more file data may still be appended to the queue
 *         (a remainder of at most one block is then left queued);
 *         true for the last round, where the remainder is written out.
 *
 * Returns 0 on success, or the error returned by blk_write() /
 * write_uncompressed_block().
 */
static int vle_compress_one(struct erofs_inode *inode,
struct z_erofs_vle_compress_ctx *ctx,
bool final)
{
struct erofs_compress *const h = &compresshandle;
unsigned int len = ctx->tail - ctx->head;
unsigned int count;
int ret;
/*
 * Two blocks of scratch space; output is produced in the second half so
 * that the 0padding case below can start the write before dst.
 */
static char dstbuf[EROFS_BLKSIZ * 2];
char *const dst = dstbuf + EROFS_BLKSIZ;
while (len) {
bool raw;
/* at most one block left: only flush it (uncompressed) in the final round */
if (len <= EROFS_BLKSIZ) {
if (final)
goto nocompression;
break;
}
/*
 * count is passed by address; afterwards it is used as the number of
 * input bytes covered by this block (presumably updated by the
 * compressor -- confirm against erofs_compress_destsize()).
 */
count = len;
ret = erofs_compress_destsize(h, compressionlevel,
ctx->queue + ctx->head,
&count, dst, EROFS_BLKSIZ);
if (ret <= 0) {
/* -EAGAIN is not reported; any other failure is logged before falling back */
if (ret != -EAGAIN) {
erofs_err("failed to compress %s: %s",
inode->i_srcpath,
erofs_strerror(ret));
}
nocompression:
/* may rewind ctx->head and grow len, see write_uncompressed_block() */
ret = write_uncompressed_block(ctx, &len, dst);
if (ret < 0)
return ret;
count = ret;
raw = true;
} else {
/* write compressed data */
erofs_dbg("Writing %u compressed data to block %u",
count, ctx->blkaddr);
/*
 * With 0padding the block written starts (EROFS_BLKSIZ - ret) bytes
 * before dst, so the ret compressed bytes end up at the end of the block.
 */
if (erofs_sb_has_lz4_0padding())
ret = blk_write(dst - (EROFS_BLKSIZ - ret),
ctx->blkaddr, 1);
else
ret = blk_write(dst, ctx->blkaddr, 1);
if (ret)
return ret;
raw = false;
}
ctx->head += count;
/* write compression indexes for this blkaddr */
vle_write_indexes(ctx, count, raw);
++ctx->blkaddr;
len -= count;
/*
 * Once head has passed EROFS_CONFIG_COMPR_MAX_SZ, slide the unconsumed
 * data (together with the already-consumed part of head's block) to the
 * front of the queue and stop, so the caller can refill the queue.
 */
if (!final && ctx->head >= EROFS_CONFIG_COMPR_MAX_SZ) {
const unsigned int qh_aligned =
round_down(ctx->head, EROFS_BLKSIZ);
const unsigned int qh_after = ctx->head - qh_aligned;
memmove(ctx->queue, ctx->queue + qh_aligned,
len + qh_after);
ctx->head = qh_after;
ctx->tail = qh_after + len;
break;
}
}
return 0;
}
/* CPU-endian copy of one legacy index, as filled in by parse_legacy_indexes() */
struct z_erofs_compressindex_vec {
union {
/* set for every cluster type other than NONHEAD */
erofs_blk_t blkaddr;
/* set for Z_EROFS_VLE_CLUSTER_TYPE_NONHEAD entries */
u16 delta[2];
} u;
u16 clusterofs;
/* cluster type extracted from the index's advise field */
u8 clustertype;
};
static void *parse_legacy_indexes(struct z_erofs_compressindex_vec *cv,
unsigned int nr, void *metacur)
{
struct z_erofs_vle_decompressed_index *const db = metacur;
unsigned int i;
for (i = 0; i < nr; ++i, ++cv) {
struct z_erofs_vle_decompressed_index *const di = db + i;
const unsigned int advise = le16_to_cpu(di->di_advise);
cv->clustertype = (advise >> Z_EROFS_VLE_DI_CLUSTER_TYPE_BIT) &
((1 << Z_EROFS_VLE_DI_CLUSTER_TYPE_BITS) - 1);
cv->clusterofs = le16_to_cpu(di->di_clusterofs);
if (cv->clustertype == Z_EROFS_VLE_CLUSTER_TYPE_NONHEAD) {
cv->u.delta[0] = le16_to_cpu(di->di_u.delta[0]);
cv->u.delta[1] = le16_to_cpu(di->di_u.delta[1]);
} else {
cv->u.blkaddr = le32_to_cpu(di->di_u.blkaddr);
}
}
return db + nr;
}
/*
 * Encode one pack of compacted indexes at @out.
 *
 * A pack is destsize * vcnt bytes long: vcnt bit-packed entries followed
 * by a 32-bit little-endian block address in the last 4 bytes.  Supported
 * layouts are destsize 4 (2 entries per pack) and destsize 2 with
 * logical_clusterbits 12 (16 entries per pack).
 *
 * @cv:          at least vcnt parsed indexes to encode
 * @blkaddr_ret: in: the block address stored in the pack; out: advanced by
 *               one for every non-NONHEAD entry in the pack
 * @final:       relaxes a debug check for the last pack of a file
 *
 * Returns a pointer just past the pack, or ERR_PTR(-EINVAL) for an
 * unsupported destsize / logical_clusterbits combination.
 */
static void *write_compacted_indexes(u8 *out,
struct z_erofs_compressindex_vec *cv,
erofs_blk_t *blkaddr_ret,
unsigned int destsize,
unsigned int logical_clusterbits,
bool final)
{
unsigned int vcnt, encodebits, pos, i;
erofs_blk_t blkaddr;
if (destsize == 4) {
vcnt = 2;
} else if (destsize == 2 && logical_clusterbits == 12) {
vcnt = 16;
} else {
return ERR_PTR(-EINVAL);
}
/* bits available per entry once the trailing 32-bit blkaddr is set aside */
encodebits = (vcnt * destsize * 8 - 32) / vcnt;
blkaddr = *blkaddr_ret;
pos = 0;
for (i = 0; i < vcnt; ++i) {
unsigned int offset, v;
u8 ch, rem;
if (cv[i].clustertype == Z_EROFS_VLE_CLUSTER_TYPE_NONHEAD) {
/* the last entry of a pack stores delta[1], all others delta[0] */
if (i + 1 == vcnt)
offset = cv[i].u.delta[1];
else
offset = cv[i].u.delta[0];
} else {
offset = cv[i].clusterofs;
/* every non-NONHEAD entry accounts for one more block */
++blkaddr;
/*
 * debug builds only: a mismatching address is tolerated only when it
 * is zero, and (except in the last slot) only in the final pack
 */
if (cv[i].u.blkaddr != blkaddr) {
if (i + 1 != vcnt)
DBG_BUGON(!final);
DBG_BUGON(cv[i].u.blkaddr);
}
}
v = (cv[i].clustertype << logical_clusterbits) | offset;
/*
 * Merge v into the bit stream at bit position pos: keep the low rem bits
 * already stored in the current byte and spill the rest into the next
 * two bytes (those are rewritten by later entries / the blkaddr store).
 */
rem = pos & 7;
ch = out[pos / 8] & ((1 << rem) - 1);
out[pos / 8] = (v << rem) | ch;
out[pos / 8 + 1] = v >> (8 - rem);
out[pos / 8 + 2] = v >> (16 - rem);
pos += encodebits;
}
DBG_BUGON(destsize * vcnt * 8 != pos + 32);
/* the pack records the block address as it was on entry */
*(__le32 *)(out + destsize * vcnt - 4) = cpu_to_le32(*blkaddr_ret);
*blkaddr_ret = blkaddr;
return out + destsize * vcnt;
}
/*
 * Rewrite inode->compressmeta in place from the legacy index layout to
 * the compacted layout, and update inode->extent_isize / inode->datalayout.
 *
 * @blkaddr:             block address recorded in the first pack
 * @legacymetasize:      size in bytes of the legacy metadata (header included)
 * @logical_clusterbits: log2 of the logical cluster size
 *
 * Returns 0 on success, -EINVAL for an invalid cluster/block size
 * combination, or -ENOTSUP when logical_clusterbits is above 14.
 */
int z_erofs_convert_to_compacted_format(struct erofs_inode *inode,
erofs_blk_t blkaddr,
unsigned int legacymetasize,
unsigned int logical_clusterbits)
{
/* position of the first compacted index: aligned inode + xattr size, then the map header */
const unsigned int mpos = Z_EROFS_VLE_EXTENT_ALIGN(inode->inode_isize +
inode->xattr_isize) +
sizeof(struct z_erofs_map_header);
/* number of legacy indexes (the size is divided by 8 bytes per index) */
const unsigned int totalidx = (legacymetasize -
Z_EROFS_LEGACY_MAP_HEADER_SIZE) / 8;
u8 *out, *in;
struct z_erofs_compressindex_vec cv[16];
/* # of 8-byte units so that it can be aligned with 32 bytes */
unsigned int compacted_4b_initial, compacted_4b_end;
unsigned int compacted_2b;
if (logical_clusterbits < LOG_BLOCK_SIZE || LOG_BLOCK_SIZE < 12)
return -EINVAL;
if (logical_clusterbits > 14) /* currently not supported */
return -ENOTSUP;
if (logical_clusterbits == 12) {
/* 4-byte entries needed to bring the index position up to a 32-byte boundary */
compacted_4b_initial = (32 - mpos % 32) / 4;
if (compacted_4b_initial == 32 / 4)
compacted_4b_initial = 0;
if (compacted_4b_initial > totalidx) {
/* too few indexes to reach the boundary: use 4-byte entries only */
compacted_4b_initial = compacted_2b = 0;
compacted_4b_end = totalidx;
} else {
/* as many full 16-entry 2-byte packs as fit, the rest as 4-byte entries */
compacted_2b = rounddown(totalidx -
compacted_4b_initial, 16);
compacted_4b_end = totalidx - compacted_4b_initial -
compacted_2b;
}
} else {
compacted_2b = compacted_4b_initial = 0;
compacted_4b_end = totalidx;
}
/* conversion is done in place: in reads legacy data, out writes behind it */
out = in = inode->compressmeta;
/* write out compacted header */
memcpy(out, &mapheader, sizeof(mapheader));
out += sizeof(mapheader);
in += Z_EROFS_LEGACY_MAP_HEADER_SIZE;
/*
 * NOTE(review): the result of write_compacted_indexes() (which may be an
 * ERR_PTR) is not checked below; with the destsize / logical_clusterbits
 * values used here the error branch does not look reachable -- confirm.
 */
/* generate compacted_4b_initial */
while (compacted_4b_initial) {
in = parse_legacy_indexes(cv, 2, in);
out = write_compacted_indexes(out, cv, &blkaddr,
4, logical_clusterbits, false);
compacted_4b_initial -= 2;
}
DBG_BUGON(compacted_4b_initial);
/* generate compacted_2b */
while (compacted_2b) {
in = parse_legacy_indexes(cv, 16, in);
out = write_compacted_indexes(out, cv, &blkaddr,
2, logical_clusterbits, false);
compacted_2b -= 16;
}
DBG_BUGON(compacted_2b);
/* generate compacted_4b_end */
while (compacted_4b_end > 1) {
in = parse_legacy_indexes(cv, 2, in);
out = write_compacted_indexes(out, cv, &blkaddr,
4, logical_clusterbits, false);
compacted_4b_end -= 2;
}
/* generate final compacted_4b_end if needed */
if (compacted_4b_end) {
/* a single index is left: zero cv so the second slot of the pack is blank */
memset(cv, 0, sizeof(cv));
in = parse_legacy_indexes(cv, 1, in);
out = write_compacted_indexes(out, cv, &blkaddr,
4, logical_clusterbits, true);
}
inode->extent_isize = out - (u8 *)inode->compressmeta;
inode->datalayout = EROFS_INODE_FLAT_COMPRESSION;
return 0;
}
int erofs_write_compressed_file(struct erofs_inode *inode)
{
struct erofs_buffer_head *bh;
struct z_erofs_vle_compress_ctx ctx;
erofs_off_t remaining;
erofs_blk_t blkaddr, compressed_blocks;
unsigned int legacymetasize;
int ret, fd;
u8 *compressmeta = malloc(vle_compressmeta_capacity(inode->i_size));
if (!compressmeta)
return -ENOMEM;
fd = open(inode->i_srcpath, O_RDONLY | O_BINARY);
if (fd < 0) {
ret = -errno;
goto err_free;
}
/* allocate main data buffer */
bh = erofs_balloc(DATA, 0, 0, 0);
if (IS_ERR(bh)) {
ret = PTR_ERR(bh);
goto err_close;
}
memset(compressmeta, 0, Z_EROFS_LEGACY_MAP_HEADER_SIZE);
blkaddr = erofs_mapbh(bh->block, true); /* start_blkaddr */
ctx.blkaddr = blkaddr;
ctx.metacur = compressmeta + Z_EROFS_LEGACY_MAP_HEADER_SIZE;
ctx.head = ctx.tail = 0;
ctx.clusterofs = 0;
remaining = inode->i_size;
while (remaining) {
const u64 readcount = min_t(u64, remaining,
sizeof(ctx.queue) - ctx.tail);
ret = read(fd, ctx.queue + ctx.tail, readcount);
if (ret != readcount) {
ret = -errno;
goto err_bdrop;
}
remaining -= readcount;
ctx.tail += readcount;
/* do one compress round */
ret = vle_compress_one(inode, &ctx, false);
if (ret)
goto err_bdrop;
}
/* do the final round */
ret = vle_compress_one(inode, &ctx, true);
if (ret)
goto err_bdrop;
/* fall back to no compression mode */
compressed_blocks = ctx.blkaddr - blkaddr;
if (compressed_blocks >= BLK_ROUND_UP(inode->i_size)) {
ret = -ENOSPC;
goto err_bdrop;
}
vle_write_indexes_final(&ctx);
close(fd);
ret = erofs_bh_balloon(bh, blknr_to_addr(compressed_blocks));
DBG_BUGON(ret);
erofs_info("compressed %s (%llu bytes) into %u blocks",
inode->i_srcpath, (unsigned long long)inode->i_size,
compressed_blocks);
/*
* TODO: need to move erofs_bdrop to erofs_write_tail_end
* when both mkfs & kernel support compression inline.
*/
erofs_bdrop(bh, false);
inode->compressmeta = compressmeta;
inode->idata_size = 0;
inode->u.i_blocks = compressed_blocks;
legacymetasize = ctx.metacur - compressmeta;
if (cfg.c_legacy_compress) {
inode->extent_isize = legacymetasize;
inode->datalayout = EROFS_INODE_FLAT_COMPRESSION_LEGACY;
} else {
ret = z_erofs_convert_to_compacted_format(inode, blkaddr - 1,
legacymetasize, 12);
DBG_BUGON(ret);
}
return 0;
err_bdrop:
erofs_bdrop(bh, true); /* revoke buffer */
err_close:
close(fd);
err_free:
free(compressmeta);
return ret;
}
/*
 * Map a compressor name to its on-disk algorithm id.
 * "lz4" and "lz4hc" both map to Z_EROFS_COMPRESSION_LZ4; any other name
 * yields -ENOTSUP.
 */
static int erofs_get_compress_algorithm_id(const char *name)
{
	static const char *const lz4_names[] = { "lz4", "lz4hc" };
	unsigned int i;

	for (i = 0; i < sizeof(lz4_names) / sizeof(lz4_names[0]); ++i) {
		if (strcmp(name, lz4_names[i]) == 0)
			return Z_EROFS_COMPRESSION_LZ4;
	}
	return -ENOTSUP;
}
/*
 * Set up the primary compressor named by cfg.c_compr_alg_master, pick the
 * compression level and fill in the file-wide map header.
 *
 * Returns 0 on success (including when no algorithm is configured), or a
 * negative error from erofs_compressor_init() /
 * erofs_get_compress_algorithm_id().
 */
int z_erofs_compress_init(void)
{
	unsigned int primary, secondary;
	int err;

	/* initialize for primary compression algorithm */
	err = erofs_compressor_init(&compresshandle, cfg.c_compr_alg_master);
	if (err)
		return err;

	/*
	 * if primary algorithm is not lz4* (e.g. compression off),
	 * clear LZ4_0PADDING feature for old kernel compatibility.
	 */
	if (!cfg.c_compr_alg_master) {
		erofs_sb_clear_lz4_0padding();
		return 0;
	}
	if (strncmp(cfg.c_compr_alg_master, "lz4", 3))
		erofs_sb_clear_lz4_0padding();

	/* a negative configured level selects the algorithm's default */
	if (cfg.c_compr_level_master < 0)
		compressionlevel = compresshandle.alg->default_level;
	else
		compressionlevel = cfg.c_compr_level_master;

	/* figure out mapheader */
	err = erofs_get_compress_algorithm_id(cfg.c_compr_alg_master);
	if (err < 0)
		return err;

	primary = err;		/* primary algorithm (head 0) */
	secondary = 0;		/* secondary algorithm (head 1) */

	mapheader.h_advise |= Z_EROFS_ADVISE_COMPACTED_2B;
	mapheader.h_algorithmtype = secondary << 4 | primary;
	mapheader.h_clusterbits = LOG_BLOCK_SIZE - 12;
	return 0;
}
/*
 * Tear down the primary compressor; returns whatever
 * erofs_compressor_exit() reports.
 */
int z_erofs_compress_exit(void)
{
	struct erofs_compress *const handle = &compresshandle;

	return erofs_compressor_exit(handle);
}