2018-06-05 19:42:14 -07:00
|
|
|
// SPDX-License-Identifier: GPL-2.0
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Copyright (c) 2000-2005 Silicon Graphics, Inc.
|
|
|
|
* All Rights Reserved.
|
|
|
|
*/
|
|
|
|
#include "xfs.h"
|
|
|
|
#include "xfs_fs.h"
|
|
|
|
#include "xfs_shared.h"
|
|
|
|
#include "xfs_format.h"
|
|
|
|
#include "xfs_log_format.h"
|
|
|
|
#include "xfs_trans_resv.h"
|
|
|
|
#include "xfs_bit.h"
|
|
|
|
#include "xfs_mount.h"
|
|
|
|
#include "xfs_inode.h"
|
|
|
|
#include "xfs_bmap.h"
|
|
|
|
#include "xfs_trans.h"
|
2013-10-29 22:11:58 +11:00
|
|
|
#include "xfs_rtalloc.h"
|
2019-11-02 09:40:53 -07:00
|
|
|
#include "xfs_error.h"
|
2023-10-16 09:21:47 -07:00
|
|
|
#include "xfs_rtbitmap.h"
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Realtime allocator bitmap functions shared with userspace.
|
|
|
|
*/
|
|
|
|
|
2016-02-09 16:41:45 +11:00
|
|
|
/*
|
|
|
|
* Real time buffers need verifiers to avoid runtime warnings during IO.
|
|
|
|
* We don't have anything to verify, however, so these are just dummy
|
|
|
|
* operations.
|
|
|
|
*/
|
|
|
|
static void
|
|
|
|
xfs_rtbuf_verify_read(
|
|
|
|
struct xfs_buf *bp)
|
|
|
|
{
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
static void
|
|
|
|
xfs_rtbuf_verify_write(
|
|
|
|
struct xfs_buf *bp)
|
|
|
|
{
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
const struct xfs_buf_ops xfs_rtbuf_ops = {
|
|
|
|
.name = "rtbuf",
|
|
|
|
.verify_read = xfs_rtbuf_verify_read,
|
|
|
|
.verify_write = xfs_rtbuf_verify_write,
|
|
|
|
};
|
|
|
|
|
2023-10-16 10:13:22 -07:00
|
|
|
/* Release cached rt bitmap and summary buffers. */
|
|
|
|
void
|
|
|
|
xfs_rtbuf_cache_relse(
|
|
|
|
struct xfs_rtalloc_args *args)
|
|
|
|
{
|
|
|
|
if (args->rbmbp) {
|
|
|
|
xfs_trans_brelse(args->tp, args->rbmbp);
|
|
|
|
args->rbmbp = NULL;
|
|
|
|
args->rbmoff = NULLFILEOFF;
|
|
|
|
}
|
|
|
|
if (args->sumbp) {
|
|
|
|
xfs_trans_brelse(args->tp, args->sumbp);
|
|
|
|
args->sumbp = NULL;
|
|
|
|
args->sumoff = NULLFILEOFF;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Get a buffer for the bitmap or summary file block specified.
|
|
|
|
* The buffer is returned read and locked.
|
|
|
|
*/
|
2017-06-16 11:00:07 -07:00
|
|
|
int
|
2013-10-15 09:17:56 +11:00
|
|
|
xfs_rtbuf_get(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_fileoff_t block, /* block number in bitmap or summary */
|
2023-10-18 10:19:41 -07:00
|
|
|
int issum) /* is summary not bitmap */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
2023-10-16 10:13:22 -07:00
|
|
|
struct xfs_buf **cbpp; /* cached block buffer */
|
|
|
|
xfs_fileoff_t *coffp; /* cached block number */
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_buf *bp; /* block buffer, result */
|
|
|
|
struct xfs_inode *ip; /* bitmap or summary inode */
|
|
|
|
struct xfs_bmbt_irec map;
|
2023-10-16 10:13:22 -07:00
|
|
|
enum xfs_blft type;
|
2023-10-16 09:54:19 -07:00
|
|
|
int nmap = 1;
|
|
|
|
int error;
|
2013-10-15 09:17:56 +11:00
|
|
|
|
2023-10-16 10:13:22 -07:00
|
|
|
if (issum) {
|
|
|
|
cbpp = &args->sumbp;
|
|
|
|
coffp = &args->sumoff;
|
|
|
|
ip = mp->m_rsumip;
|
|
|
|
type = XFS_BLFT_RTSUMMARY_BUF;
|
|
|
|
} else {
|
|
|
|
cbpp = &args->rbmbp;
|
|
|
|
coffp = &args->rbmoff;
|
|
|
|
ip = mp->m_rbmip;
|
|
|
|
type = XFS_BLFT_RTBITMAP_BUF;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* If we have a cached buffer, and the block number matches, use that.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
if (*cbpp && *coffp == block)
|
2023-10-16 10:13:22 -07:00
|
|
|
return 0;
|
2023-10-18 10:19:41 -07:00
|
|
|
|
2023-10-16 10:13:22 -07:00
|
|
|
/*
|
|
|
|
* Otherwise we have to have to get the buffer. If there was an old
|
|
|
|
* one, get rid of it first.
|
|
|
|
*/
|
|
|
|
if (*cbpp) {
|
|
|
|
xfs_trans_brelse(args->tp, *cbpp);
|
|
|
|
*cbpp = NULL;
|
|
|
|
}
|
2013-10-15 09:17:56 +11:00
|
|
|
|
2020-05-14 13:59:51 -07:00
|
|
|
error = xfs_bmapi_read(ip, block, 1, &map, &nmap, 0);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
|
2020-06-29 14:47:18 -07:00
|
|
|
if (XFS_IS_CORRUPT(mp, nmap == 0 || !xfs_bmap_is_written_extent(&map)))
|
2018-05-31 09:07:20 -07:00
|
|
|
return -EFSCORRUPTED;
|
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
ASSERT(map.br_startblock != NULLFSBLOCK);
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_trans_read_buf(mp, args->tp, mp->m_ddev_targp,
|
2013-10-15 09:17:56 +11:00
|
|
|
XFS_FSB_TO_DADDR(mp, map.br_startblock),
|
2016-02-09 16:41:45 +11:00
|
|
|
mp->m_bsize, 0, &bp, &xfs_rtbuf_ops);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error)
|
|
|
|
return error;
|
2016-02-09 16:41:31 +11:00
|
|
|
|
2023-10-16 10:13:22 -07:00
|
|
|
xfs_trans_buf_set_type(args->tp, bp, type);
|
2023-10-18 10:19:41 -07:00
|
|
|
*cbpp = bp;
|
2023-10-16 10:13:22 -07:00
|
|
|
*coffp = block;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Searching backward from start to limit, find the first block whose
|
|
|
|
* allocated/free state is different from start's.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
xfs_rtfind_back(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_rtxnum_t start, /* starting rtext to look at */
|
|
|
|
xfs_rtxnum_t limit, /* last rtext to look at */
|
|
|
|
xfs_rtxnum_t *rtx) /* out: start rtext found */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
|
|
|
int bit; /* bit number in the word */
|
|
|
|
xfs_fileoff_t block; /* bitmap block number */
|
|
|
|
int error; /* error value */
|
|
|
|
xfs_rtxnum_t firstbit; /* first useful bit in the word */
|
|
|
|
xfs_rtxnum_t i; /* current bit number rel. to start */
|
|
|
|
xfs_rtxnum_t len; /* length of inspected area */
|
|
|
|
xfs_rtword_t mask; /* mask of relevant bits for value */
|
|
|
|
xfs_rtword_t want; /* mask for "good" values */
|
|
|
|
xfs_rtword_t wdiff; /* difference from wanted value */
|
|
|
|
xfs_rtword_t incore;
|
|
|
|
unsigned int word; /* word number in the buffer */
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute and read in starting bitmap block for starting block.
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
block = xfs_rtx_to_rbmblock(mp, start);
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Get the first word's index & point to it.
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
word = xfs_rtx_to_rbmword(mp, start);
|
2013-10-15 09:17:56 +11:00
|
|
|
bit = (int)(start & (XFS_NBWORD - 1));
|
|
|
|
len = start - limit + 1;
|
|
|
|
/*
|
|
|
|
* Compute match value, based on the bit at start: if 1 (free)
|
|
|
|
* then all-ones, else all-zeroes.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
want = (incore & ((xfs_rtword_t)1 << bit)) ? -1 : 0;
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* If the starting position is not word-aligned, deal with the
|
|
|
|
* partial word.
|
|
|
|
*/
|
|
|
|
if (bit < XFS_NBWORD - 1) {
|
|
|
|
/*
|
|
|
|
* Calculate first (leftmost) bit number to look at,
|
|
|
|
* and mask for all the relevant bits in this word.
|
|
|
|
*/
|
|
|
|
firstbit = XFS_RTMAX((xfs_srtblock_t)(bit - len + 1), 0);
|
|
|
|
mask = (((xfs_rtword_t)1 << (bit - firstbit + 1)) - 1) <<
|
|
|
|
firstbit;
|
|
|
|
/*
|
|
|
|
* Calculate the difference between the value there
|
|
|
|
* and what we're looking for.
|
|
|
|
*/
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = (incore ^ want) & mask)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different. Mark where we are and return.
|
|
|
|
*/
|
|
|
|
i = bit - XFS_RTHIBIT(wdiff);
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start - i + 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
i = bit - firstbit + 1;
|
|
|
|
/*
|
|
|
|
* Go on to previous block if that's where the previous word is
|
|
|
|
* and we need the previous word.
|
|
|
|
*/
|
|
|
|
if (--word == -1 && i < len) {
|
|
|
|
/*
|
|
|
|
* If done with this block, get the previous one.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, --block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2023-10-16 09:46:08 -07:00
|
|
|
word = mp->m_blockwsize - 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* Starting on a word boundary, no partial word.
|
|
|
|
*/
|
|
|
|
i = 0;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Loop over whole words in buffers. When we use up one buffer
|
|
|
|
* we move on to the previous one.
|
|
|
|
*/
|
|
|
|
while (len - i >= XFS_NBWORD) {
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = incore ^ want)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, mark where we are and return.
|
|
|
|
*/
|
|
|
|
i += XFS_NBWORD - 1 - XFS_RTHIBIT(wdiff);
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start - i + 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
i += XFS_NBWORD;
|
|
|
|
/*
|
|
|
|
* Go on to previous block if that's where the previous word is
|
|
|
|
* and we need the previous word.
|
|
|
|
*/
|
|
|
|
if (--word == -1 && i < len) {
|
|
|
|
/*
|
|
|
|
* If done with this block, get the previous one.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, --block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2023-10-16 09:46:08 -07:00
|
|
|
word = mp->m_blockwsize - 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* If not ending on a word boundary, deal with the last
|
|
|
|
* (partial) word.
|
|
|
|
*/
|
|
|
|
if (len - i) {
|
|
|
|
/*
|
|
|
|
* Calculate first (leftmost) bit number to look at,
|
|
|
|
* and mask for all the relevant bits in this word.
|
|
|
|
*/
|
|
|
|
firstbit = XFS_NBWORD - (len - i);
|
|
|
|
mask = (((xfs_rtword_t)1 << (len - i)) - 1) << firstbit;
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = (incore ^ want) & mask)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, mark where we are and return.
|
|
|
|
*/
|
|
|
|
i += XFS_NBWORD - 1 - XFS_RTHIBIT(wdiff);
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start - i + 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
} else
|
|
|
|
i = len;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* No match, return that we scanned the whole area.
|
|
|
|
*/
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start - i + 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Searching forward from start to limit, find the first block whose
|
|
|
|
* allocated/free state is different from start's.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
xfs_rtfind_forw(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_rtxnum_t start, /* starting rtext to look at */
|
|
|
|
xfs_rtxnum_t limit, /* last rtext to look at */
|
|
|
|
xfs_rtxnum_t *rtx) /* out: start rtext found */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
|
|
|
int bit; /* bit number in the word */
|
|
|
|
xfs_fileoff_t block; /* bitmap block number */
|
|
|
|
int error;
|
|
|
|
xfs_rtxnum_t i; /* current bit number rel. to start */
|
|
|
|
xfs_rtxnum_t lastbit;/* last useful bit in the word */
|
|
|
|
xfs_rtxnum_t len; /* length of inspected area */
|
|
|
|
xfs_rtword_t mask; /* mask of relevant bits for value */
|
|
|
|
xfs_rtword_t want; /* mask for "good" values */
|
|
|
|
xfs_rtword_t wdiff; /* difference from wanted value */
|
|
|
|
xfs_rtword_t incore;
|
|
|
|
unsigned int word; /* word number in the buffer */
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute and read in starting bitmap block for starting block.
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
block = xfs_rtx_to_rbmblock(mp, start);
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Get the first word's index & point to it.
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
word = xfs_rtx_to_rbmword(mp, start);
|
2013-10-15 09:17:56 +11:00
|
|
|
bit = (int)(start & (XFS_NBWORD - 1));
|
|
|
|
len = limit - start + 1;
|
|
|
|
/*
|
|
|
|
* Compute match value, based on the bit at start: if 1 (free)
|
|
|
|
* then all-ones, else all-zeroes.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
want = (incore & ((xfs_rtword_t)1 << bit)) ? -1 : 0;
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* If the starting position is not word-aligned, deal with the
|
|
|
|
* partial word.
|
|
|
|
*/
|
|
|
|
if (bit) {
|
|
|
|
/*
|
|
|
|
* Calculate last (rightmost) bit number to look at,
|
|
|
|
* and mask for all the relevant bits in this word.
|
|
|
|
*/
|
|
|
|
lastbit = XFS_RTMIN(bit + len, XFS_NBWORD);
|
|
|
|
mask = (((xfs_rtword_t)1 << (lastbit - bit)) - 1) << bit;
|
|
|
|
/*
|
|
|
|
* Calculate the difference between the value there
|
|
|
|
* and what we're looking for.
|
|
|
|
*/
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = (incore ^ want) & mask)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different. Mark where we are and return.
|
|
|
|
*/
|
|
|
|
i = XFS_RTLOBIT(wdiff) - bit;
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start + i - 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
i = lastbit - bit;
|
|
|
|
/*
|
|
|
|
* Go on to next block if that's where the next word is
|
|
|
|
* and we need the next word.
|
|
|
|
*/
|
2023-10-16 09:46:08 -07:00
|
|
|
if (++word == mp->m_blockwsize && i < len) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* If done with this block, get the previous one.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, ++block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
word = 0;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* Starting on a word boundary, no partial word.
|
|
|
|
*/
|
|
|
|
i = 0;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Loop over whole words in buffers. When we use up one buffer
|
|
|
|
* we move on to the next one.
|
|
|
|
*/
|
|
|
|
while (len - i >= XFS_NBWORD) {
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = incore ^ want)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, mark where we are and return.
|
|
|
|
*/
|
|
|
|
i += XFS_RTLOBIT(wdiff);
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start + i - 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
i += XFS_NBWORD;
|
|
|
|
/*
|
|
|
|
* Go on to next block if that's where the next word is
|
|
|
|
* and we need the next word.
|
|
|
|
*/
|
2023-10-16 09:46:08 -07:00
|
|
|
if (++word == mp->m_blockwsize && i < len) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* If done with this block, get the next one.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, ++block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
word = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* If not ending on a word boundary, deal with the last
|
|
|
|
* (partial) word.
|
|
|
|
*/
|
|
|
|
if ((lastbit = len - i)) {
|
|
|
|
/*
|
|
|
|
* Calculate mask for all the relevant bits in this word.
|
|
|
|
*/
|
|
|
|
mask = ((xfs_rtword_t)1 << lastbit) - 1;
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = (incore ^ want) & mask)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, mark where we are and return.
|
|
|
|
*/
|
|
|
|
i += XFS_RTLOBIT(wdiff);
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start + i - 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
} else
|
|
|
|
i = len;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* No match, return that we scanned the whole area.
|
|
|
|
*/
|
2023-10-16 09:32:45 -07:00
|
|
|
*rtx = start + i - 1;
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2023-10-17 16:43:10 -07:00
|
|
|
/* Log rtsummary counter at @infoword. */
|
|
|
|
static inline void
|
|
|
|
xfs_trans_log_rtsummary(
|
2023-10-18 10:28:10 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
2023-10-17 16:43:10 -07:00
|
|
|
unsigned int infoword)
|
|
|
|
{
|
2023-10-18 10:28:10 -07:00
|
|
|
struct xfs_buf *bp = args->sumbp;
|
2023-10-17 16:43:10 -07:00
|
|
|
size_t first, last;
|
|
|
|
|
2023-10-18 10:28:10 -07:00
|
|
|
first = (void *)xfs_rsumblock_infoptr(args, infoword) - bp->b_addr;
|
2023-10-17 16:43:10 -07:00
|
|
|
last = first + sizeof(xfs_suminfo_t) - 1;
|
|
|
|
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_trans_log_buf(args->tp, bp, first, last);
|
2023-10-17 16:43:10 -07:00
|
|
|
}
|
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
2014-09-09 11:58:42 +10:00
|
|
|
* Read and/or modify the summary information for a given extent size,
|
2013-10-15 09:17:56 +11:00
|
|
|
* bitmap block combination.
|
|
|
|
* Keeps track of a current summary block, so we don't keep reading
|
|
|
|
* it from the buffer cache.
|
2014-09-09 11:58:42 +10:00
|
|
|
*
|
|
|
|
* Summary information is returned in *sum if specified.
|
|
|
|
* If no delta is specified, returns summary only.
|
2013-10-15 09:17:56 +11:00
|
|
|
*/
|
|
|
|
int
|
2014-09-09 11:58:42 +10:00
|
|
|
xfs_rtmodify_summary_int(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
int log, /* log2 of extent size */
|
|
|
|
xfs_fileoff_t bbno, /* bitmap block number */
|
|
|
|
int delta, /* change to make to summary info */
|
|
|
|
xfs_suminfo_t *sum) /* out: summary info for this block */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
|
|
|
int error;
|
|
|
|
xfs_fileoff_t sb; /* summary fsblock */
|
|
|
|
xfs_rtsumoff_t so; /* index into the summary file */
|
|
|
|
unsigned int infoword;
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute entry number in the summary file.
|
|
|
|
*/
|
2023-10-16 09:47:34 -07:00
|
|
|
so = xfs_rtsumoffs(mp, log, bbno);
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Compute the block number in the summary file.
|
|
|
|
*/
|
2023-10-16 09:47:34 -07:00
|
|
|
sb = xfs_rtsumoffs_to_block(mp, so);
|
2023-10-16 10:13:22 -07:00
|
|
|
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtsummary_read_buf(args, sb);
|
2023-10-16 10:13:22 -07:00
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
2014-09-09 11:58:42 +10:00
|
|
|
* Point to the summary information, modify/log it, and/or copy it out.
|
2013-10-15 09:17:56 +11:00
|
|
|
*/
|
2023-10-16 09:47:34 -07:00
|
|
|
infoword = xfs_rtsumoffs_to_infoword(mp, so);
|
2014-09-09 11:58:42 +10:00
|
|
|
if (delta) {
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_suminfo_t val = xfs_suminfo_add(args, infoword, delta);
|
2014-09-09 11:58:42 +10:00
|
|
|
|
xfs: cache minimum realtime summary level
The realtime summary is a two-dimensional array on disk, effectively:
u32 rsum[log2(number of realtime extents) + 1][number of blocks in the bitmap]
rsum[log][bbno] is the number of extents of size 2**log which start in
bitmap block bbno.
xfs_rtallocate_extent_near() uses xfs_rtany_summary() to check whether
rsum[log][bbno] != 0 for any log level. However, the summary array is
stored in row-major order (i.e., like an array in C), so all of these
entries are not adjacent, but rather spread across the entire summary
file. In the worst case (a full bitmap block), xfs_rtany_summary() has
to check every level.
This means that on a moderately-used realtime device, an allocation will
waste a lot of time finding, reading, and releasing buffers for the
realtime summary. In particular, one of our storage services (which runs
on servers with 8 very slow CPUs and 15 8 TB XFS realtime filesystems)
spends almost 5% of its CPU cycles in xfs_rtbuf_get() and
xfs_trans_brelse() called from xfs_rtany_summary().
One solution would be to also store the summary with the dimensions
swapped. However, this would require a disk format change to a very old
component of XFS.
Instead, we can cache the minimum size which contains any extents. We do
so lazily; rather than guaranteeing that the cache contains the precise
minimum, it always contains a loose lower bound which we tighten when we
read or update a summary block. This only uses a few kilobytes of memory
and is already serialized via the realtime bitmap and summary inode
locks, so the cost is minimal. With this change, the same workload only
spends 0.2% of its CPU cycles in the realtime allocator.
Signed-off-by: Omar Sandoval <osandov@fb.com>
Reviewed-by: Darrick J. Wong <darrick.wong@oracle.com>
Signed-off-by: Darrick J. Wong <darrick.wong@oracle.com>
2018-12-12 08:46:32 -08:00
|
|
|
if (mp->m_rsum_cache) {
|
2023-10-16 10:41:55 -07:00
|
|
|
if (val == 0 && log + 1 == mp->m_rsum_cache[bbno])
|
xfs: cache minimum realtime summary level
The realtime summary is a two-dimensional array on disk, effectively:
u32 rsum[log2(number of realtime extents) + 1][number of blocks in the bitmap]
rsum[log][bbno] is the number of extents of size 2**log which start in
bitmap block bbno.
xfs_rtallocate_extent_near() uses xfs_rtany_summary() to check whether
rsum[log][bbno] != 0 for any log level. However, the summary array is
stored in row-major order (i.e., like an array in C), so all of these
entries are not adjacent, but rather spread across the entire summary
file. In the worst case (a full bitmap block), xfs_rtany_summary() has
to check every level.
This means that on a moderately-used realtime device, an allocation will
waste a lot of time finding, reading, and releasing buffers for the
realtime summary. In particular, one of our storage services (which runs
on servers with 8 very slow CPUs and 15 8 TB XFS realtime filesystems)
spends almost 5% of its CPU cycles in xfs_rtbuf_get() and
xfs_trans_brelse() called from xfs_rtany_summary().
One solution would be to also store the summary with the dimensions
swapped. However, this would require a disk format change to a very old
component of XFS.
Instead, we can cache the minimum size which contains any extents. We do
so lazily; rather than guaranteeing that the cache contains the precise
minimum, it always contains a loose lower bound which we tighten when we
read or update a summary block. This only uses a few kilobytes of memory
and is already serialized via the realtime bitmap and summary inode
locks, so the cost is minimal. With this change, the same workload only
spends 0.2% of its CPU cycles in the realtime allocator.
Signed-off-by: Omar Sandoval <osandov@fb.com>
Reviewed-by: Darrick J. Wong <darrick.wong@oracle.com>
Signed-off-by: Darrick J. Wong <darrick.wong@oracle.com>
2018-12-12 08:46:32 -08:00
|
|
|
mp->m_rsum_cache[bbno] = log;
|
2023-10-16 10:41:55 -07:00
|
|
|
if (val != 0 && log >= mp->m_rsum_cache[bbno])
|
|
|
|
mp->m_rsum_cache[bbno] = log + 1;
|
xfs: cache minimum realtime summary level
The realtime summary is a two-dimensional array on disk, effectively:
u32 rsum[log2(number of realtime extents) + 1][number of blocks in the bitmap]
rsum[log][bbno] is the number of extents of size 2**log which start in
bitmap block bbno.
xfs_rtallocate_extent_near() uses xfs_rtany_summary() to check whether
rsum[log][bbno] != 0 for any log level. However, the summary array is
stored in row-major order (i.e., like an array in C), so all of these
entries are not adjacent, but rather spread across the entire summary
file. In the worst case (a full bitmap block), xfs_rtany_summary() has
to check every level.
This means that on a moderately-used realtime device, an allocation will
waste a lot of time finding, reading, and releasing buffers for the
realtime summary. In particular, one of our storage services (which runs
on servers with 8 very slow CPUs and 15 8 TB XFS realtime filesystems)
spends almost 5% of its CPU cycles in xfs_rtbuf_get() and
xfs_trans_brelse() called from xfs_rtany_summary().
One solution would be to also store the summary with the dimensions
swapped. However, this would require a disk format change to a very old
component of XFS.
Instead, we can cache the minimum size which contains any extents. We do
so lazily; rather than guaranteeing that the cache contains the precise
minimum, it always contains a loose lower bound which we tighten when we
read or update a summary block. This only uses a few kilobytes of memory
and is already serialized via the realtime bitmap and summary inode
locks, so the cost is minimal. With this change, the same workload only
spends 0.2% of its CPU cycles in the realtime allocator.
Signed-off-by: Omar Sandoval <osandov@fb.com>
Reviewed-by: Darrick J. Wong <darrick.wong@oracle.com>
Signed-off-by: Darrick J. Wong <darrick.wong@oracle.com>
2018-12-12 08:46:32 -08:00
|
|
|
}
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_trans_log_rtsummary(args, infoword);
|
2023-10-16 09:51:16 -07:00
|
|
|
if (sum)
|
|
|
|
*sum = val;
|
|
|
|
} else if (sum) {
|
2023-10-18 10:28:10 -07:00
|
|
|
*sum = xfs_suminfo_get(args, infoword);
|
2014-09-09 11:58:42 +10:00
|
|
|
}
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2014-09-09 11:58:42 +10:00
|
|
|
int
|
|
|
|
xfs_rtmodify_summary(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
int log, /* log2 of extent size */
|
|
|
|
xfs_fileoff_t bbno, /* bitmap block number */
|
2023-10-16 10:13:22 -07:00
|
|
|
int delta) /* in/out: summary block number */
|
2014-09-09 11:58:42 +10:00
|
|
|
{
|
2023-10-16 10:13:22 -07:00
|
|
|
return xfs_rtmodify_summary_int(args, log, bbno, delta, NULL);
|
2014-09-09 11:58:42 +10:00
|
|
|
}
|
|
|
|
|
2023-10-17 16:43:10 -07:00
|
|
|
/* Log rtbitmap block from the word @from to the byte before @next. */
|
|
|
|
static inline void
|
|
|
|
xfs_trans_log_rtbitmap(
|
2023-10-18 10:28:10 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
2023-10-17 16:43:10 -07:00
|
|
|
unsigned int from,
|
|
|
|
unsigned int next)
|
2014-09-09 11:58:42 +10:00
|
|
|
{
|
2023-10-18 10:28:10 -07:00
|
|
|
struct xfs_buf *bp = args->rbmbp;
|
2023-10-17 16:43:10 -07:00
|
|
|
size_t first, last;
|
|
|
|
|
2023-10-18 10:28:10 -07:00
|
|
|
first = (void *)xfs_rbmblock_wordptr(args, from) - bp->b_addr;
|
|
|
|
last = ((void *)xfs_rbmblock_wordptr(args, next) - 1) - bp->b_addr;
|
2023-10-17 16:43:10 -07:00
|
|
|
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_trans_log_buf(args->tp, bp, first, last);
|
2014-09-09 11:58:42 +10:00
|
|
|
}
|
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Set the given range of bitmap bits to the given value.
|
|
|
|
* Do whatever I/O and logging is required.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
xfs_rtmodify_range(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_rtxnum_t start, /* starting rtext to modify */
|
|
|
|
xfs_rtxlen_t len, /* length of extent to modify */
|
|
|
|
int val) /* 1 for free, 0 for allocated */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
|
|
|
int bit; /* bit number in the word */
|
|
|
|
xfs_fileoff_t block; /* bitmap block number */
|
|
|
|
int error;
|
|
|
|
int i; /* current bit number rel. to start */
|
|
|
|
int lastbit; /* last useful bit in word */
|
|
|
|
xfs_rtword_t mask; /* mask of relevant bits for value */
|
|
|
|
xfs_rtword_t incore;
|
|
|
|
unsigned int firstword; /* first word used in the buffer */
|
|
|
|
unsigned int word; /* word number in the buffer */
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute starting bitmap block number.
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
block = xfs_rtx_to_rbmblock(mp, start);
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Read the bitmap block, and point to its data.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Compute the starting word's address, and starting bit.
|
|
|
|
*/
|
2023-10-17 16:43:10 -07:00
|
|
|
firstword = word = xfs_rtx_to_rbmword(mp, start);
|
2013-10-15 09:17:56 +11:00
|
|
|
bit = (int)(start & (XFS_NBWORD - 1));
|
|
|
|
/*
|
|
|
|
* 0 (allocated) => all zeroes; 1 (free) => all ones.
|
|
|
|
*/
|
|
|
|
val = -val;
|
|
|
|
/*
|
|
|
|
* If not starting on a word boundary, deal with the first
|
|
|
|
* (partial) word.
|
|
|
|
*/
|
|
|
|
if (bit) {
|
|
|
|
/*
|
|
|
|
* Compute first bit not changed and mask of relevant bits.
|
|
|
|
*/
|
|
|
|
lastbit = XFS_RTMIN(bit + len, XFS_NBWORD);
|
|
|
|
mask = (((xfs_rtword_t)1 << (lastbit - bit)) - 1) << bit;
|
|
|
|
/*
|
|
|
|
* Set/clear the active bits.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (val)
|
2023-10-16 09:49:01 -07:00
|
|
|
incore |= mask;
|
2013-10-15 09:17:56 +11:00
|
|
|
else
|
2023-10-16 09:49:01 -07:00
|
|
|
incore &= ~mask;
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_rtbitmap_setword(args, word, incore);
|
2013-10-15 09:17:56 +11:00
|
|
|
i = lastbit - bit;
|
|
|
|
/*
|
|
|
|
* Go on to the next block if that's where the next word is
|
|
|
|
* and we need the next word.
|
|
|
|
*/
|
2023-10-16 09:46:08 -07:00
|
|
|
if (++word == mp->m_blockwsize && i < len) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Log the changed part of this block.
|
|
|
|
* Get the next one.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_trans_log_rtbitmap(args, firstword, word);
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, ++block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2023-10-17 16:43:10 -07:00
|
|
|
firstword = word = 0;
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* Starting on a word boundary, no partial word.
|
|
|
|
*/
|
|
|
|
i = 0;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Loop over whole words in buffers. When we use up one buffer
|
|
|
|
* we move on to the next one.
|
|
|
|
*/
|
|
|
|
while (len - i >= XFS_NBWORD) {
|
|
|
|
/*
|
|
|
|
* Set the word value correctly.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_rtbitmap_setword(args, word, val);
|
2013-10-15 09:17:56 +11:00
|
|
|
i += XFS_NBWORD;
|
|
|
|
/*
|
|
|
|
* Go on to the next block if that's where the next word is
|
|
|
|
* and we need the next word.
|
|
|
|
*/
|
2023-10-16 09:46:08 -07:00
|
|
|
if (++word == mp->m_blockwsize && i < len) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Log the changed part of this block.
|
|
|
|
* Get the next one.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_trans_log_rtbitmap(args, firstword, word);
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, ++block);
|
2023-10-16 09:54:19 -07:00
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2023-10-17 16:43:10 -07:00
|
|
|
firstword = word = 0;
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* If not ending on a word boundary, deal with the last
|
|
|
|
* (partial) word.
|
|
|
|
*/
|
|
|
|
if ((lastbit = len - i)) {
|
|
|
|
/*
|
|
|
|
* Compute a mask of relevant bits.
|
|
|
|
*/
|
|
|
|
mask = ((xfs_rtword_t)1 << lastbit) - 1;
|
|
|
|
/*
|
|
|
|
* Set/clear the active bits.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (val)
|
2023-10-16 09:49:01 -07:00
|
|
|
incore |= mask;
|
2013-10-15 09:17:56 +11:00
|
|
|
else
|
2023-10-16 09:49:01 -07:00
|
|
|
incore &= ~mask;
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_rtbitmap_setword(args, word, incore);
|
2023-10-17 16:43:10 -07:00
|
|
|
word++;
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Log any remaining changed bytes.
|
|
|
|
*/
|
2023-10-16 09:49:01 -07:00
|
|
|
if (word > firstword)
|
2023-10-18 10:28:10 -07:00
|
|
|
xfs_trans_log_rtbitmap(args, firstword, word);
|
2013-10-15 09:17:56 +11:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Mark an extent specified by start and len freed.
|
|
|
|
* Updates all the summary information as well as the bitmap.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
xfs_rtfree_range(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_rtxnum_t start, /* starting rtext to free */
|
2023-10-16 10:13:22 -07:00
|
|
|
xfs_rtxlen_t len) /* in/out: summary block number */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
|
|
|
xfs_rtxnum_t end; /* end of the freed extent */
|
|
|
|
int error; /* error value */
|
|
|
|
xfs_rtxnum_t postblock; /* first rtext freed > end */
|
|
|
|
xfs_rtxnum_t preblock; /* first rtext freed < start */
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
end = start + len - 1;
|
|
|
|
/*
|
|
|
|
* Modify the bitmap to mark this extent freed.
|
|
|
|
*/
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtmodify_range(args, start, len, 1);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error) {
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Assume we're freeing out of the middle of an allocated extent.
|
|
|
|
* We need to find the beginning and end of the extent so we can
|
|
|
|
* properly update the summary.
|
|
|
|
*/
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtfind_back(args, start, 0, &preblock);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error) {
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Find the next allocated block (end of allocated extent).
|
|
|
|
*/
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtfind_forw(args, end, mp->m_sb.sb_rextents - 1,
|
2023-10-16 10:13:22 -07:00
|
|
|
&postblock);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
/*
|
|
|
|
* If there are blocks not being freed at the front of the
|
|
|
|
* old extent, add summary data for them to be allocated.
|
|
|
|
*/
|
|
|
|
if (preblock < start) {
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtmodify_summary(args,
|
2023-10-16 10:13:22 -07:00
|
|
|
XFS_RTBLOCKLOG(start - preblock),
|
|
|
|
xfs_rtx_to_rbmblock(mp, preblock), -1);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error) {
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* If there are blocks not being freed at the end of the
|
|
|
|
* old extent, add summary data for them to be allocated.
|
|
|
|
*/
|
|
|
|
if (postblock > end) {
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtmodify_summary(args,
|
2023-10-16 10:13:22 -07:00
|
|
|
XFS_RTBLOCKLOG(postblock - end),
|
|
|
|
xfs_rtx_to_rbmblock(mp, end + 1), -1);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error) {
|
|
|
|
return error;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Increment the summary information corresponding to the entire
|
|
|
|
* (new) free extent.
|
|
|
|
*/
|
2023-10-16 10:13:22 -07:00
|
|
|
return xfs_rtmodify_summary(args,
|
|
|
|
XFS_RTBLOCKLOG(postblock + 1 - preblock),
|
|
|
|
xfs_rtx_to_rbmblock(mp, preblock), 1);
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Check that the given range is either all allocated (val = 0) or
|
|
|
|
* all free (val = 1).
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
xfs_rtcheck_range(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_rtxnum_t start, /* starting rtext number of extent */
|
|
|
|
xfs_rtxlen_t len, /* length of extent */
|
|
|
|
int val, /* 1 for free, 0 for allocated */
|
|
|
|
xfs_rtxnum_t *new, /* out: first rtext not matching */
|
|
|
|
int *stat) /* out: 1 for matches, 0 for not */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = args->mp;
|
|
|
|
int bit; /* bit number in the word */
|
|
|
|
xfs_fileoff_t block; /* bitmap block number */
|
|
|
|
int error;
|
|
|
|
xfs_rtxnum_t i; /* current bit number rel. to start */
|
|
|
|
xfs_rtxnum_t lastbit; /* last useful bit in word */
|
|
|
|
xfs_rtword_t mask; /* mask of relevant bits for value */
|
|
|
|
xfs_rtword_t wdiff; /* difference from wanted value */
|
|
|
|
xfs_rtword_t incore;
|
|
|
|
unsigned int word; /* word number in the buffer */
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute starting bitmap block number
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
block = xfs_rtx_to_rbmblock(mp, start);
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Read the bitmap block.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Compute the starting word's address, and starting bit.
|
|
|
|
*/
|
2023-10-16 09:44:13 -07:00
|
|
|
word = xfs_rtx_to_rbmword(mp, start);
|
2013-10-15 09:17:56 +11:00
|
|
|
bit = (int)(start & (XFS_NBWORD - 1));
|
|
|
|
/*
|
|
|
|
* 0 (allocated) => all zero's; 1 (free) => all one's.
|
|
|
|
*/
|
|
|
|
val = -val;
|
|
|
|
/*
|
|
|
|
* If not starting on a word boundary, deal with the first
|
|
|
|
* (partial) word.
|
|
|
|
*/
|
|
|
|
if (bit) {
|
|
|
|
/*
|
|
|
|
* Compute first bit not examined.
|
|
|
|
*/
|
|
|
|
lastbit = XFS_RTMIN(bit + len, XFS_NBWORD);
|
|
|
|
/*
|
|
|
|
* Mask of relevant bits.
|
|
|
|
*/
|
|
|
|
mask = (((xfs_rtword_t)1 << (lastbit - bit)) - 1) << bit;
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = (incore ^ val) & mask)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, compute first wrong bit and return.
|
|
|
|
*/
|
|
|
|
i = XFS_RTLOBIT(wdiff) - bit;
|
|
|
|
*new = start + i;
|
|
|
|
*stat = 0;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
i = lastbit - bit;
|
|
|
|
/*
|
|
|
|
* Go on to next block if that's where the next word is
|
|
|
|
* and we need the next word.
|
|
|
|
*/
|
2023-10-16 09:46:08 -07:00
|
|
|
if (++word == mp->m_blockwsize && i < len) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* If done with this block, get the next one.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, ++block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
word = 0;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
/*
|
|
|
|
* Starting on a word boundary, no partial word.
|
|
|
|
*/
|
|
|
|
i = 0;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Loop over whole words in buffers. When we use up one buffer
|
|
|
|
* we move on to the next one.
|
|
|
|
*/
|
|
|
|
while (len - i >= XFS_NBWORD) {
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = incore ^ val)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, compute first wrong bit and return.
|
|
|
|
*/
|
|
|
|
i += XFS_RTLOBIT(wdiff);
|
|
|
|
*new = start + i;
|
|
|
|
*stat = 0;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
i += XFS_NBWORD;
|
|
|
|
/*
|
|
|
|
* Go on to next block if that's where the next word is
|
|
|
|
* and we need the next word.
|
|
|
|
*/
|
2023-10-16 09:46:08 -07:00
|
|
|
if (++word == mp->m_blockwsize && i < len) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* If done with this block, get the next one.
|
|
|
|
*/
|
2023-10-18 10:19:41 -07:00
|
|
|
error = xfs_rtbitmap_read_buf(args, ++block);
|
|
|
|
if (error)
|
2013-10-15 09:17:56 +11:00
|
|
|
return error;
|
2023-10-16 09:46:53 -07:00
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
word = 0;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* If not ending on a word boundary, deal with the last
|
|
|
|
* (partial) word.
|
|
|
|
*/
|
|
|
|
if ((lastbit = len - i)) {
|
|
|
|
/*
|
|
|
|
* Mask of relevant bits.
|
|
|
|
*/
|
|
|
|
mask = ((xfs_rtword_t)1 << lastbit) - 1;
|
|
|
|
/*
|
|
|
|
* Compute difference between actual and desired value.
|
|
|
|
*/
|
2023-10-18 10:28:10 -07:00
|
|
|
incore = xfs_rtbitmap_getword(args, word);
|
2023-10-16 09:49:01 -07:00
|
|
|
if ((wdiff = (incore ^ val) & mask)) {
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Different, compute first wrong bit and return.
|
|
|
|
*/
|
|
|
|
i += XFS_RTLOBIT(wdiff);
|
|
|
|
*new = start + i;
|
|
|
|
*stat = 0;
|
|
|
|
return 0;
|
|
|
|
} else
|
|
|
|
i = len;
|
|
|
|
}
|
|
|
|
/*
|
|
|
|
* Successful, return.
|
|
|
|
*/
|
|
|
|
*new = start + i;
|
|
|
|
*stat = 1;
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
#ifdef DEBUG
|
|
|
|
/*
|
|
|
|
* Check that the given extent (block range) is allocated already.
|
|
|
|
*/
|
2023-10-16 09:54:19 -07:00
|
|
|
STATIC int
|
2013-10-15 09:17:56 +11:00
|
|
|
xfs_rtcheck_alloc_range(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args *args,
|
|
|
|
xfs_rtxnum_t start, /* starting rtext number of extent */
|
|
|
|
xfs_rtxlen_t len) /* length of extent */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
xfs_rtxnum_t new; /* dummy for xfs_rtcheck_range */
|
|
|
|
int stat;
|
|
|
|
int error;
|
2013-10-15 09:17:56 +11:00
|
|
|
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtcheck_range(args, start, len, 0, &new, &stat);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
ASSERT(stat);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
#else
|
2023-10-16 09:54:19 -07:00
|
|
|
#define xfs_rtcheck_alloc_range(a,b,l) (0)
|
2013-10-15 09:17:56 +11:00
|
|
|
#endif
|
|
|
|
/*
|
|
|
|
* Free an extent in the realtime subvolume. Length is expressed in
|
|
|
|
* realtime extents, as is the block number.
|
|
|
|
*/
|
2023-10-16 09:54:19 -07:00
|
|
|
int
|
2013-10-15 09:17:56 +11:00
|
|
|
xfs_rtfree_extent(
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_trans *tp, /* transaction pointer */
|
|
|
|
xfs_rtxnum_t start, /* starting rtext number to free */
|
|
|
|
xfs_rtxlen_t len) /* length of extent freed */
|
2013-10-15 09:17:56 +11:00
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_mount *mp = tp->t_mountp;
|
|
|
|
struct xfs_rtalloc_args args = {
|
|
|
|
.mp = mp,
|
|
|
|
.tp = tp,
|
|
|
|
};
|
|
|
|
int error;
|
2023-11-08 13:22:16 -08:00
|
|
|
struct timespec64 atime;
|
2013-10-15 09:17:56 +11:00
|
|
|
|
|
|
|
ASSERT(mp->m_rbmip->i_itemp != NULL);
|
|
|
|
ASSERT(xfs_isilocked(mp->m_rbmip, XFS_ILOCK_EXCL));
|
|
|
|
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtcheck_alloc_range(&args, start, len);
|
2013-10-15 09:17:56 +11:00
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Free the range of realtime blocks.
|
|
|
|
*/
|
2023-10-16 10:13:22 -07:00
|
|
|
error = xfs_rtfree_range(&args, start, len);
|
|
|
|
if (error)
|
|
|
|
goto out;
|
|
|
|
|
2013-10-15 09:17:56 +11:00
|
|
|
/*
|
|
|
|
* Mark more blocks free in the superblock.
|
|
|
|
*/
|
|
|
|
xfs_trans_mod_sb(tp, XFS_TRANS_SB_FREXTENTS, (long)len);
|
|
|
|
/*
|
|
|
|
* If we've now freed all the blocks, reset the file sequence
|
|
|
|
* number to 0.
|
|
|
|
*/
|
|
|
|
if (tp->t_frextents_delta + mp->m_sb.sb_frextents ==
|
|
|
|
mp->m_sb.sb_rextents) {
|
2021-03-29 11:11:44 -07:00
|
|
|
if (!(mp->m_rbmip->i_diflags & XFS_DIFLAG_NEWRTBM))
|
|
|
|
mp->m_rbmip->i_diflags |= XFS_DIFLAG_NEWRTBM;
|
2023-10-04 14:53:02 -04:00
|
|
|
|
|
|
|
atime = inode_get_atime(VFS_I(mp->m_rbmip));
|
2023-11-08 13:22:16 -08:00
|
|
|
atime.tv_sec = 0;
|
2023-10-04 14:53:02 -04:00
|
|
|
inode_set_atime_to_ts(VFS_I(mp->m_rbmip), atime);
|
2013-10-15 09:17:56 +11:00
|
|
|
xfs_trans_log_inode(tp, mp->m_rbmip, XFS_ILOG_CORE);
|
|
|
|
}
|
2023-10-16 10:13:22 -07:00
|
|
|
error = 0;
|
|
|
|
out:
|
|
|
|
xfs_rtbuf_cache_relse(&args);
|
|
|
|
return error;
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
2017-03-28 14:56:36 -07:00
|
|
|
|
2023-10-16 09:16:22 -07:00
|
|
|
/*
|
|
|
|
* Free some blocks in the realtime subvolume. rtbno and rtlen are in units of
|
|
|
|
* rt blocks, not rt extents; must be aligned to the rt extent size; and rtlen
|
|
|
|
* cannot exceed XFS_MAX_BMBT_EXTLEN.
|
|
|
|
*/
|
|
|
|
int
|
|
|
|
xfs_rtfree_blocks(
|
|
|
|
struct xfs_trans *tp,
|
|
|
|
xfs_fsblock_t rtbno,
|
|
|
|
xfs_filblks_t rtlen)
|
|
|
|
{
|
|
|
|
struct xfs_mount *mp = tp->t_mountp;
|
2023-10-16 09:32:45 -07:00
|
|
|
xfs_rtxnum_t start;
|
2023-10-16 09:16:22 -07:00
|
|
|
xfs_filblks_t len;
|
|
|
|
xfs_extlen_t mod;
|
|
|
|
|
|
|
|
ASSERT(rtlen <= XFS_MAX_BMBT_EXTLEN);
|
|
|
|
|
2023-10-16 09:37:07 -07:00
|
|
|
len = xfs_rtb_to_rtxrem(mp, rtlen, &mod);
|
2023-10-16 09:16:22 -07:00
|
|
|
if (mod) {
|
|
|
|
ASSERT(mod == 0);
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
|
2023-10-16 09:37:07 -07:00
|
|
|
start = xfs_rtb_to_rtxrem(mp, rtbno, &mod);
|
2023-10-16 09:16:22 -07:00
|
|
|
if (mod) {
|
|
|
|
ASSERT(mod == 0);
|
|
|
|
return -EIO;
|
|
|
|
}
|
|
|
|
|
2023-10-16 09:32:45 -07:00
|
|
|
return xfs_rtfree_extent(tp, start, len);
|
2013-10-15 09:17:56 +11:00
|
|
|
}
|
2017-03-28 14:56:36 -07:00
|
|
|
|
|
|
|
/* Find all the free records within a given range. */
|
|
|
|
int
|
|
|
|
xfs_rtalloc_query_range(
|
2022-04-12 06:49:41 +10:00
|
|
|
struct xfs_mount *mp,
|
2017-03-28 14:56:36 -07:00
|
|
|
struct xfs_trans *tp,
|
2021-08-10 17:00:30 -07:00
|
|
|
const struct xfs_rtalloc_rec *low_rec,
|
|
|
|
const struct xfs_rtalloc_rec *high_rec,
|
2017-03-28 14:56:36 -07:00
|
|
|
xfs_rtalloc_query_range_fn fn,
|
|
|
|
void *priv)
|
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args args = {
|
|
|
|
.mp = mp,
|
|
|
|
.tp = tp,
|
|
|
|
};
|
2017-03-28 14:56:36 -07:00
|
|
|
struct xfs_rtalloc_rec rec;
|
2023-10-16 09:32:45 -07:00
|
|
|
xfs_rtxnum_t rtstart;
|
|
|
|
xfs_rtxnum_t rtend;
|
|
|
|
xfs_rtxnum_t high_key;
|
2017-03-28 14:56:36 -07:00
|
|
|
int is_free;
|
|
|
|
int error = 0;
|
|
|
|
|
2018-05-31 09:12:10 -07:00
|
|
|
if (low_rec->ar_startext > high_rec->ar_startext)
|
2017-03-28 14:56:36 -07:00
|
|
|
return -EINVAL;
|
2018-05-31 09:12:10 -07:00
|
|
|
if (low_rec->ar_startext >= mp->m_sb.sb_rextents ||
|
|
|
|
low_rec->ar_startext == high_rec->ar_startext)
|
2017-03-28 14:56:36 -07:00
|
|
|
return 0;
|
2021-08-10 17:00:30 -07:00
|
|
|
|
|
|
|
high_key = min(high_rec->ar_startext, mp->m_sb.sb_rextents - 1);
|
2017-03-28 14:56:36 -07:00
|
|
|
|
|
|
|
/* Iterate the bitmap, looking for discrepancies. */
|
2018-05-31 09:12:10 -07:00
|
|
|
rtstart = low_rec->ar_startext;
|
2021-08-10 17:00:30 -07:00
|
|
|
while (rtstart <= high_key) {
|
2017-03-28 14:56:36 -07:00
|
|
|
/* Is the first block free? */
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtcheck_range(&args, rtstart, 1, 1, &rtend,
|
2017-03-28 14:56:36 -07:00
|
|
|
&is_free);
|
|
|
|
if (error)
|
|
|
|
break;
|
|
|
|
|
|
|
|
/* How long does the extent go for? */
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtfind_forw(&args, rtstart, high_key, &rtend);
|
2017-03-28 14:56:36 -07:00
|
|
|
if (error)
|
|
|
|
break;
|
|
|
|
|
|
|
|
if (is_free) {
|
2018-05-31 09:12:10 -07:00
|
|
|
rec.ar_startext = rtstart;
|
|
|
|
rec.ar_extcount = rtend - rtstart + 1;
|
2017-03-28 14:56:36 -07:00
|
|
|
|
2022-04-12 06:49:41 +10:00
|
|
|
error = fn(mp, tp, &rec, priv);
|
2017-03-28 14:56:36 -07:00
|
|
|
if (error)
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
rtstart = rtend + 1;
|
|
|
|
}
|
|
|
|
|
2023-10-16 10:13:22 -07:00
|
|
|
xfs_rtbuf_cache_relse(&args);
|
2017-03-28 14:56:36 -07:00
|
|
|
return error;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Find all the free records. */
|
|
|
|
int
|
|
|
|
xfs_rtalloc_query_all(
|
2022-04-12 06:49:41 +10:00
|
|
|
struct xfs_mount *mp,
|
2017-03-28 14:56:36 -07:00
|
|
|
struct xfs_trans *tp,
|
|
|
|
xfs_rtalloc_query_range_fn fn,
|
|
|
|
void *priv)
|
|
|
|
{
|
|
|
|
struct xfs_rtalloc_rec keys[2];
|
|
|
|
|
2018-05-31 09:12:10 -07:00
|
|
|
keys[0].ar_startext = 0;
|
2022-04-12 06:49:41 +10:00
|
|
|
keys[1].ar_startext = mp->m_sb.sb_rextents - 1;
|
2018-05-31 09:12:10 -07:00
|
|
|
keys[0].ar_extcount = keys[1].ar_extcount = 0;
|
2017-03-28 14:56:36 -07:00
|
|
|
|
2022-04-12 06:49:41 +10:00
|
|
|
return xfs_rtalloc_query_range(mp, tp, &keys[0], &keys[1], fn, priv);
|
2017-03-28 14:56:36 -07:00
|
|
|
}
|
2017-10-17 21:37:32 -07:00
|
|
|
|
2018-01-16 18:53:10 -08:00
|
|
|
/* Is the given extent all free? */
|
|
|
|
int
|
|
|
|
xfs_rtalloc_extent_is_free(
|
|
|
|
struct xfs_mount *mp,
|
|
|
|
struct xfs_trans *tp,
|
2023-10-16 09:32:45 -07:00
|
|
|
xfs_rtxnum_t start,
|
2023-10-16 09:31:11 -07:00
|
|
|
xfs_rtxlen_t len,
|
2018-01-16 18:53:10 -08:00
|
|
|
bool *is_free)
|
|
|
|
{
|
2023-10-16 09:54:19 -07:00
|
|
|
struct xfs_rtalloc_args args = {
|
|
|
|
.mp = mp,
|
|
|
|
.tp = tp,
|
|
|
|
};
|
2023-10-16 09:32:45 -07:00
|
|
|
xfs_rtxnum_t end;
|
2018-01-16 18:53:10 -08:00
|
|
|
int matches;
|
|
|
|
int error;
|
|
|
|
|
2023-10-16 09:54:19 -07:00
|
|
|
error = xfs_rtcheck_range(&args, start, len, 1, &end, &matches);
|
2023-10-16 10:13:22 -07:00
|
|
|
xfs_rtbuf_cache_relse(&args);
|
2018-01-16 18:53:10 -08:00
|
|
|
if (error)
|
|
|
|
return error;
|
|
|
|
|
|
|
|
*is_free = matches;
|
|
|
|
return 0;
|
|
|
|
}
|
2023-10-16 09:48:20 -07:00
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute the number of rtbitmap blocks needed to track the given number of rt
|
|
|
|
* extents.
|
|
|
|
*/
|
|
|
|
xfs_filblks_t
|
|
|
|
xfs_rtbitmap_blockcount(
|
|
|
|
struct xfs_mount *mp,
|
|
|
|
xfs_rtbxlen_t rtextents)
|
|
|
|
{
|
|
|
|
return howmany_64(rtextents, NBBY * mp->m_sb.sb_blocksize);
|
|
|
|
}
|
|
|
|
|
xfs: make rextslog computation consistent with mkfs
There's a weird discrepancy in xfsprogs dating back to the creation of
the Linux port -- if there are zero rt extents, mkfs will set
sb_rextents and sb_rextslog both to zero:
sbp->sb_rextslog =
(uint8_t)(rtextents ?
libxfs_highbit32((unsigned int)rtextents) : 0);
However, that's not the check that xfs_repair uses for nonzero rtblocks:
if (sb->sb_rextslog !=
libxfs_highbit32((unsigned int)sb->sb_rextents))
The difference here is that xfs_highbit32 returns -1 if its argument is
zero. Unfortunately, this means that in the weird corner case of a
realtime volume shorter than 1 rt extent, xfs_repair will immediately
flag a freshly formatted filesystem as corrupt. Because mkfs has been
writing ondisk artifacts like this for decades, we have to accept that
as "correct". TBH, zero rextslog for zero rtextents makes more sense to
me anyway.
Regrettably, the superblock verifier checks created in commit copied
xfs_repair even though mkfs has been writing out such filesystems for
ages. Fix the superblock verifier to accept what mkfs spits out; the
userspace version of this patch will have to fix xfs_repair as well.
Note that the new helper leaves the zeroday bug where the upper 32 bits
of sb_rextents is ripped off and fed to highbit32. This leads to a
seriously undersized rt summary file, which immediately breaks mkfs:
$ hugedisk.sh foo /dev/sdc $(( 0x100000080 * 4096))B
$ /sbin/mkfs.xfs -f /dev/sda -m rmapbt=0,reflink=0 -r rtdev=/dev/mapper/foo
meta-data=/dev/sda isize=512 agcount=4, agsize=1298176 blks
= sectsz=512 attr=2, projid32bit=1
= crc=1 finobt=1, sparse=1, rmapbt=0
= reflink=0 bigtime=1 inobtcount=1 nrext64=1
data = bsize=4096 blocks=5192704, imaxpct=25
= sunit=0 swidth=0 blks
naming =version 2 bsize=4096 ascii-ci=0, ftype=1
log =internal log bsize=4096 blocks=16384, version=2
= sectsz=512 sunit=0 blks, lazy-count=1
realtime =/dev/mapper/foo extsz=4096 blocks=4294967424, rtextents=4294967424
Discarding blocks...Done.
mkfs.xfs: Error initializing the realtime space [117 - Structure needs cleaning]
The next patch will drop support for rt volumes with fewer than 1 or
more than 2^32-1 rt extents, since they've clearly been broken forever.
Fixes: f8e566c0f5e1f ("xfs: validate the realtime geometry in xfs_validate_sb_common")
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Christoph Hellwig <hch@lst.de>
2023-12-01 09:17:40 -08:00
|
|
|
/*
|
|
|
|
* Compute the maximum level number of the realtime summary file, as defined by
|
2023-12-03 09:19:44 -08:00
|
|
|
* mkfs. The historic use of highbit32 on a 64-bit quantity prohibited correct
|
|
|
|
* use of rt volumes with more than 2^32 extents.
|
xfs: make rextslog computation consistent with mkfs
There's a weird discrepancy in xfsprogs dating back to the creation of
the Linux port -- if there are zero rt extents, mkfs will set
sb_rextents and sb_rextslog both to zero:
sbp->sb_rextslog =
(uint8_t)(rtextents ?
libxfs_highbit32((unsigned int)rtextents) : 0);
However, that's not the check that xfs_repair uses for nonzero rtblocks:
if (sb->sb_rextslog !=
libxfs_highbit32((unsigned int)sb->sb_rextents))
The difference here is that xfs_highbit32 returns -1 if its argument is
zero. Unfortunately, this means that in the weird corner case of a
realtime volume shorter than 1 rt extent, xfs_repair will immediately
flag a freshly formatted filesystem as corrupt. Because mkfs has been
writing ondisk artifacts like this for decades, we have to accept that
as "correct". TBH, zero rextslog for zero rtextents makes more sense to
me anyway.
Regrettably, the superblock verifier checks created in commit copied
xfs_repair even though mkfs has been writing out such filesystems for
ages. Fix the superblock verifier to accept what mkfs spits out; the
userspace version of this patch will have to fix xfs_repair as well.
Note that the new helper leaves the zeroday bug where the upper 32 bits
of sb_rextents is ripped off and fed to highbit32. This leads to a
seriously undersized rt summary file, which immediately breaks mkfs:
$ hugedisk.sh foo /dev/sdc $(( 0x100000080 * 4096))B
$ /sbin/mkfs.xfs -f /dev/sda -m rmapbt=0,reflink=0 -r rtdev=/dev/mapper/foo
meta-data=/dev/sda isize=512 agcount=4, agsize=1298176 blks
= sectsz=512 attr=2, projid32bit=1
= crc=1 finobt=1, sparse=1, rmapbt=0
= reflink=0 bigtime=1 inobtcount=1 nrext64=1
data = bsize=4096 blocks=5192704, imaxpct=25
= sunit=0 swidth=0 blks
naming =version 2 bsize=4096 ascii-ci=0, ftype=1
log =internal log bsize=4096 blocks=16384, version=2
= sectsz=512 sunit=0 blks, lazy-count=1
realtime =/dev/mapper/foo extsz=4096 blocks=4294967424, rtextents=4294967424
Discarding blocks...Done.
mkfs.xfs: Error initializing the realtime space [117 - Structure needs cleaning]
The next patch will drop support for rt volumes with fewer than 1 or
more than 2^32-1 rt extents, since they've clearly been broken forever.
Fixes: f8e566c0f5e1f ("xfs: validate the realtime geometry in xfs_validate_sb_common")
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Christoph Hellwig <hch@lst.de>
2023-12-01 09:17:40 -08:00
|
|
|
*/
|
|
|
|
uint8_t
|
|
|
|
xfs_compute_rextslog(
|
|
|
|
xfs_rtbxlen_t rtextents)
|
|
|
|
{
|
2023-12-03 09:19:44 -08:00
|
|
|
if (!rtextents)
|
|
|
|
return 0;
|
|
|
|
return xfs_highbit64(rtextents);
|
xfs: make rextslog computation consistent with mkfs
There's a weird discrepancy in xfsprogs dating back to the creation of
the Linux port -- if there are zero rt extents, mkfs will set
sb_rextents and sb_rextslog both to zero:
sbp->sb_rextslog =
(uint8_t)(rtextents ?
libxfs_highbit32((unsigned int)rtextents) : 0);
However, that's not the check that xfs_repair uses for nonzero rtblocks:
if (sb->sb_rextslog !=
libxfs_highbit32((unsigned int)sb->sb_rextents))
The difference here is that xfs_highbit32 returns -1 if its argument is
zero. Unfortunately, this means that in the weird corner case of a
realtime volume shorter than 1 rt extent, xfs_repair will immediately
flag a freshly formatted filesystem as corrupt. Because mkfs has been
writing ondisk artifacts like this for decades, we have to accept that
as "correct". TBH, zero rextslog for zero rtextents makes more sense to
me anyway.
Regrettably, the superblock verifier checks created in commit copied
xfs_repair even though mkfs has been writing out such filesystems for
ages. Fix the superblock verifier to accept what mkfs spits out; the
userspace version of this patch will have to fix xfs_repair as well.
Note that the new helper leaves the zeroday bug where the upper 32 bits
of sb_rextents is ripped off and fed to highbit32. This leads to a
seriously undersized rt summary file, which immediately breaks mkfs:
$ hugedisk.sh foo /dev/sdc $(( 0x100000080 * 4096))B
$ /sbin/mkfs.xfs -f /dev/sda -m rmapbt=0,reflink=0 -r rtdev=/dev/mapper/foo
meta-data=/dev/sda isize=512 agcount=4, agsize=1298176 blks
= sectsz=512 attr=2, projid32bit=1
= crc=1 finobt=1, sparse=1, rmapbt=0
= reflink=0 bigtime=1 inobtcount=1 nrext64=1
data = bsize=4096 blocks=5192704, imaxpct=25
= sunit=0 swidth=0 blks
naming =version 2 bsize=4096 ascii-ci=0, ftype=1
log =internal log bsize=4096 blocks=16384, version=2
= sectsz=512 sunit=0 blks, lazy-count=1
realtime =/dev/mapper/foo extsz=4096 blocks=4294967424, rtextents=4294967424
Discarding blocks...Done.
mkfs.xfs: Error initializing the realtime space [117 - Structure needs cleaning]
The next patch will drop support for rt volumes with fewer than 1 or
more than 2^32-1 rt extents, since they've clearly been broken forever.
Fixes: f8e566c0f5e1f ("xfs: validate the realtime geometry in xfs_validate_sb_common")
Signed-off-by: Darrick J. Wong <djwong@kernel.org>
Reviewed-by: Christoph Hellwig <hch@lst.de>
2023-12-01 09:17:40 -08:00
|
|
|
}
|
|
|
|
|
2023-10-16 09:48:20 -07:00
|
|
|
/*
|
|
|
|
* Compute the number of rtbitmap words needed to populate every block of a
|
|
|
|
* bitmap that is large enough to track the given number of rt extents.
|
|
|
|
*/
|
|
|
|
unsigned long long
|
|
|
|
xfs_rtbitmap_wordcount(
|
|
|
|
struct xfs_mount *mp,
|
|
|
|
xfs_rtbxlen_t rtextents)
|
|
|
|
{
|
|
|
|
xfs_filblks_t blocks;
|
|
|
|
|
|
|
|
blocks = xfs_rtbitmap_blockcount(mp, rtextents);
|
|
|
|
return XFS_FSB_TO_B(mp, blocks) >> XFS_WORDLOG;
|
|
|
|
}
|
2023-10-16 09:50:34 -07:00
|
|
|
|
|
|
|
/* Compute the number of rtsummary blocks needed to track the given rt space. */
|
|
|
|
xfs_filblks_t
|
|
|
|
xfs_rtsummary_blockcount(
|
|
|
|
struct xfs_mount *mp,
|
|
|
|
unsigned int rsumlevels,
|
|
|
|
xfs_extlen_t rbmblocks)
|
|
|
|
{
|
|
|
|
unsigned long long rsumwords;
|
|
|
|
|
|
|
|
rsumwords = (unsigned long long)rsumlevels * rbmblocks;
|
|
|
|
return XFS_B_TO_FSB(mp, rsumwords << XFS_WORDLOG);
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Compute the number of rtsummary info words needed to populate every block of
|
|
|
|
* a summary file that is large enough to track the given rt space.
|
|
|
|
*/
|
|
|
|
unsigned long long
|
|
|
|
xfs_rtsummary_wordcount(
|
|
|
|
struct xfs_mount *mp,
|
|
|
|
unsigned int rsumlevels,
|
|
|
|
xfs_extlen_t rbmblocks)
|
|
|
|
{
|
|
|
|
xfs_filblks_t blocks;
|
|
|
|
|
|
|
|
blocks = xfs_rtsummary_blockcount(mp, rsumlevels, rbmblocks);
|
|
|
|
return XFS_FSB_TO_B(mp, blocks) >> XFS_WORDLOG;
|
|
|
|
}
|