Skip to content

Commit

Permalink
zio_compress: introduce max size threshold
Browse files Browse the repository at this point in the history
Now default compression is lz4, which can stop
compression process by itself on incompressible data.
If there are additional size checks -
we will only make our compressratio worse.

New usable compression thresholds are:
- less than BPE_PAYLOAD_SIZE (embedded_data feature);
- at least one saved sector.

Old 12.5% threshold is left to minimize affect
on existing user expectations of CPU utilization.

If data wasn't compressed - it will be saved as
ZIO_COMPRESS_OFF, so if we really need to recompress
data without ashift info and check anything -
we can just compress it with zero threshold.
So, we don't need a new feature flag here!

Signed-off-by: George Melikov <[email protected]>
  • Loading branch information
gmelikov committed Apr 4, 2024
1 parent 99741bd commit 7f578c4
Show file tree
Hide file tree
Showing 6 changed files with 52 additions and 26 deletions.
3 changes: 2 additions & 1 deletion include/sys/zio_compress.h
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@
* Copyright (c) 2019, Klara Inc.
* Use is subject to license terms.
* Copyright (c) 2015, 2016 by Delphix. All rights reserved.
* Copyright (c) 2021, 2024 by George Melikov. All rights reserved.
*/

#ifndef _SYS_ZIO_COMPRESS_H
Expand Down Expand Up @@ -184,7 +185,7 @@ extern int lz4_decompress_zfs(void *src, void *dst, size_t s_len, size_t d_len,
* Compress and decompress data if necessary.
*/
extern size_t zio_compress_data(enum zio_compress c, abd_t *src, void **dst,
size_t s_len, uint8_t level);
size_t s_len, size_t d_len, uint8_t level);
extern int zio_decompress_data(enum zio_compress c, abd_t *src, void *dst,
size_t s_len, size_t d_len, uint8_t *level);
extern int zio_decompress_data_buf(enum zio_compress c, void *src, void *dst,
Expand Down
26 changes: 18 additions & 8 deletions man/man7/zfsprops.7
Original file line number Diff line number Diff line change
Expand Up @@ -917,14 +917,24 @@ zeroes (the NUL byte).
When a zero-filled block is detected, it is stored as
a hole and not compressed using the indicated compression algorithm.
.Pp
Any block being compressed must be no larger than 7/8 of its original size
after compression, otherwise the compression will not be considered worthwhile
and the block saved uncompressed.
Note that when the logical block is less than
8 times the disk sector size this effectively reduces the necessary compression
ratio; for example, 8 KiB blocks on disks with 4 KiB disk sectors must compress
to 1/2
or less of their original size.
All blocks are allocated as a whole number of sectors
.Pq chunks of 2^ Ns Sy ashift No bytes , e.g . Sy 512B No or Sy 4KB .
Compression may result in a non-sector-aligned size, which will be rounded up
to a whole number of sectors.
If compression saves less than one whole sector,
the block will be stored uncompressed.
Therefore, blocks whose logical size is a small number of sectors will
experience less compression
(e.g. for
.Sy recordsize Ns = Ns Sy 16K
with
.Sy 4K
sectors, which have 4 sectors per block,
compression needs to save at least 25% to actually save space on disk).
.Pp
There is
.Sy 12.5%
default compression threshold in addition to sector rounding.
.It Xo
.Sy context Ns = Ns Sy none Ns | Ns
.Ar SELinux-User : Ns Ar SELinux-Role : Ns Ar SELinux-Type : Ns Ar Sensitivity-Level
Expand Down
15 changes: 11 additions & 4 deletions module/zfs/arc.c
Original file line number Diff line number Diff line change
Expand Up @@ -29,6 +29,7 @@
* Copyright (c) 2019, Klara Inc.
* Copyright (c) 2019, Allan Jude
* Copyright (c) 2020, The FreeBSD Foundation [1]
* Copyright (c) 2021, 2024 by George Melikov. All rights reserved.
*
* [1] Portions of this software were developed by Allan Jude
* under sponsorship from the FreeBSD Foundation.
Expand Down Expand Up @@ -1786,7 +1787,8 @@ arc_hdr_authenticate(arc_buf_hdr_t *hdr, spa_t *spa, uint64_t dsobj)
!HDR_COMPRESSION_ENABLED(hdr)) {

csize = zio_compress_data(HDR_GET_COMPRESS(hdr),
hdr->b_l1hdr.b_pabd, &tmpbuf, lsize, hdr->b_complevel);
hdr->b_l1hdr.b_pabd, &tmpbuf, lsize, lsize,
hdr->b_complevel);
ASSERT3P(tmpbuf, !=, NULL);
ASSERT3U(csize, <=, psize);
abd = abd_get_from_buf(tmpbuf, lsize);
Expand Down Expand Up @@ -8944,7 +8946,7 @@ l2arc_apply_transforms(spa_t *spa, arc_buf_hdr_t *hdr, uint64_t asize,
cabd = abd_alloc_for_io(bufsize, ismd);
tmp = abd_borrow_buf(cabd, bufsize);

psize = zio_compress_data(compress, to_write, &tmp, size,
psize = zio_compress_data(compress, to_write, &tmp, size, size,
hdr->b_complevel);

if (psize >= asize) {
Expand All @@ -8957,6 +8959,7 @@ l2arc_apply_transforms(spa_t *spa, arc_buf_hdr_t *hdr, uint64_t asize,
abd_zero_off(to_write, psize, asize - psize);
goto encrypt;
}

ASSERT3U(psize, <=, HDR_GET_PSIZE(hdr));
if (psize < asize)
memset((char *)tmp + psize, 0, bufsize - psize);
Expand Down Expand Up @@ -10417,6 +10420,7 @@ l2arc_log_blk_commit(l2arc_dev_t *dev, zio_t *pio, l2arc_write_callback_t *cb)
l2arc_log_blk_phys_t *lb = &dev->l2ad_log_blk;
l2arc_dev_hdr_phys_t *l2dhdr = dev->l2ad_dev_hdr;
uint64_t psize, asize;
size_t d_len;
zio_t *wzio;
l2arc_lb_abd_buf_t *abd_buf;
uint8_t *tmpbuf = NULL;
Expand All @@ -10440,9 +10444,12 @@ l2arc_log_blk_commit(l2arc_dev_t *dev, zio_t *pio, l2arc_write_callback_t *cb)
*/
list_insert_tail(&cb->l2wcb_abd_list, abd_buf);

/* try to compress the buffer */
/* try to compress the buffer, at least one sector to save */
d_len = sizeof (*lb) - (1 << dev->l2ad_vdev->vdev_ashift);
psize = zio_compress_data(ZIO_COMPRESS_LZ4,
abd_buf->abd, (void **) &tmpbuf, sizeof (*lb), 0);
abd_buf->abd, (void **) &tmpbuf, sizeof (*lb),
d_len - d_len % (1 << dev->l2ad_vdev->vdev_ashift),
0);

/* a log block is never entirely zero */
ASSERT(psize != 0);
Expand Down
2 changes: 1 addition & 1 deletion module/zfs/dmu_recv.c
Original file line number Diff line number Diff line change
Expand Up @@ -1409,7 +1409,7 @@ do_corrective_recv(struct receive_writer_arg *rwa, struct drr_write *drrw,
B_FALSE);
void *buf = abd_to_buf(cabd);
uint64_t csize = zio_compress_data(BP_GET_COMPRESS(bp),
abd, &buf, abd_get_size(abd),
abd, &buf, abd_get_size(abd), abd_get_size(abd),
rwa->os->os_complevel);
abd_zero_off(cabd, csize, BP_GET_PSIZE(bp) - csize);
/* Swap in newly compressed data into the abd */
Expand Down
18 changes: 17 additions & 1 deletion module/zfs/zio.c
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,7 @@
* Copyright (c) 2019, Klara Inc.
* Copyright (c) 2019, Allan Jude
* Copyright (c) 2021, Datto, Inc.
* Copyright (c) 2021, 2024 by George Melikov. All rights reserved.
*/

#include <sys/sysmacros.h>
Expand Down Expand Up @@ -1674,6 +1675,20 @@ zio_roundup_alloc_size(spa_t *spa, uint64_t size)
return (spa->spa_min_alloc);
}

static size_t
zio_get_compression_max_size(spa_t *spa, size_t s_len)
{
size_t d_len;

/* minimum 12.5% must be saved (legacy value, may be changed later) */
d_len = s_len - (s_len >> 3);

d_len = d_len - d_len % spa->spa_gcd_alloc;
if (d_len < spa->spa_min_alloc)
return (BPE_PAYLOAD_SIZE);
return (d_len);
}

/*
* ==========================================================================
* Prepare to read and write logical blocks
Expand Down Expand Up @@ -1850,6 +1865,7 @@ zio_write_compress(zio_t *zio)
!(zio->io_flags & ZIO_FLAG_RAW_COMPRESS)) {
void *cbuf = NULL;
psize = zio_compress_data(compress, zio->io_abd, &cbuf, lsize,
zio_get_compression_max_size(spa, lsize),
zp->zp_complevel);
if (psize == 0) {
compress = ZIO_COMPRESS_OFF;
Expand Down Expand Up @@ -1915,7 +1931,7 @@ zio_write_compress(zio_t *zio)
* to a hole.
*/
psize = zio_compress_data(ZIO_COMPRESS_EMPTY,
zio->io_abd, NULL, lsize, zp->zp_complevel);
zio->io_abd, NULL, lsize, lsize, zp->zp_complevel);
if (psize == 0 || psize >= lsize)
compress = ZIO_COMPRESS_OFF;
} else if (zio->io_flags & ZIO_FLAG_RAW_COMPRESS &&
Expand Down
14 changes: 3 additions & 11 deletions module/zfs/zio_compress.c
Original file line number Diff line number Diff line change
Expand Up @@ -22,15 +22,11 @@
/*
* Copyright 2009 Sun Microsystems, Inc. All rights reserved.
* Use is subject to license terms.
*/
/*
* Copyright (c) 2013 by Saso Kiselkov. All rights reserved.
*/

/*
* Copyright (c) 2013, 2018 by Delphix. All rights reserved.
* Copyright (c) 2019, Klara Inc.
* Copyright (c) 2019, Allan Jude
* Copyright (c) 2021, 2024 by George Melikov. All rights reserved.
*/

#include <sys/zfs_context.h>
Expand Down Expand Up @@ -126,9 +122,9 @@ zio_compress_zeroed_cb(void *data, size_t len, void *private)

size_t
zio_compress_data(enum zio_compress c, abd_t *src, void **dst, size_t s_len,
uint8_t level)
size_t d_len, uint8_t level)
{
size_t c_len, d_len;
size_t c_len;
uint8_t complevel;
zio_compress_info_t *ci = &zio_compress_table[c];

Expand All @@ -145,9 +141,6 @@ zio_compress_data(enum zio_compress c, abd_t *src, void **dst, size_t s_len,
if (c == ZIO_COMPRESS_EMPTY)
return (s_len);

/* Compress at least 12.5% */
d_len = s_len - (s_len >> 3);

complevel = ci->ci_level;

if (c == ZIO_COMPRESS_ZSTD) {
Expand All @@ -174,7 +167,6 @@ zio_compress_data(enum zio_compress c, abd_t *src, void **dst, size_t s_len,
if (c_len > d_len)
return (s_len);

ASSERT3U(c_len, <=, d_len);
return (c_len);
}

Expand Down

0 comments on commit 7f578c4

Please sign in to comment.