2017-03-16 22:18:50 -08:00
|
|
|
// SPDX-License-Identifier: GPL-2.0
|
|
|
|
/*
|
|
|
|
* bcache sysfs interfaces
|
|
|
|
*
|
|
|
|
* Copyright 2010, 2011 Kent Overstreet <kent.overstreet@gmail.com>
|
|
|
|
* Copyright 2012 Google, Inc.
|
|
|
|
*/
|
|
|
|
|
|
|
|
#ifndef NO_BCACHEFS_SYSFS
|
|
|
|
|
|
|
|
#include "bcachefs.h"
|
2018-10-06 00:46:55 -04:00
|
|
|
#include "alloc_background.h"
|
2021-12-25 21:21:46 -05:00
|
|
|
#include "alloc_foreground.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "sysfs.h"
|
|
|
|
#include "btree_cache.h"
|
|
|
|
#include "btree_io.h"
|
|
|
|
#include "btree_iter.h"
|
2020-06-15 19:53:46 -04:00
|
|
|
#include "btree_key_cache.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "btree_update.h"
|
2024-07-11 16:30:41 -04:00
|
|
|
#include "btree_update_interior.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "btree_gc.h"
|
|
|
|
#include "buckets.h"
|
2019-12-19 15:07:51 -05:00
|
|
|
#include "clock.h"
|
2024-01-06 21:01:47 -05:00
|
|
|
#include "compress.h"
|
2024-02-24 21:09:51 -05:00
|
|
|
#include "disk_accounting.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "disk_groups.h"
|
2018-11-01 15:13:19 -04:00
|
|
|
#include "ec.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "inode.h"
|
|
|
|
#include "journal.h"
|
2024-04-13 22:43:11 -04:00
|
|
|
#include "journal_reclaim.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "keylist.h"
|
|
|
|
#include "move.h"
|
2023-03-01 23:10:39 -05:00
|
|
|
#include "movinggc.h"
|
2022-12-14 20:52:11 -05:00
|
|
|
#include "nocow_locking.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "opts.h"
|
|
|
|
#include "rebalance.h"
|
|
|
|
#include "replicas.h"
|
|
|
|
#include "super-io.h"
|
|
|
|
#include "tests.h"
|
|
|
|
|
|
|
|
#include <linux/blkdev.h>
|
|
|
|
#include <linux/sort.h>
|
|
|
|
#include <linux/sched/clock.h>
|
|
|
|
|
|
|
|
#include "util.h"
|
|
|
|
|
|
|
|
/*
 * SYSFS_OPS(type) - define the sysfs_ops table `type_sysfs_ops`.
 *
 * The table points at type##_show and type##_store, i.e. the handlers
 * emitted by SHOW(type) and STORE(type) below.
 */
#define SYSFS_OPS(type)							\
const struct sysfs_ops type ## _sysfs_ops = {				\
	.store	= type ## _store,					\
	.show	= type ## _show,					\
}
|
|
|
|
|
|
|
|
/*
 * SHOW(fn) - emit the sysfs ->show() wrapper for @fn and open the definition
 * of fn##_to_text(out, kobj, attr); the braces that follow SHOW(fn) become
 * the body of fn##_to_text().
 *
 * The generated fn##_show():
 *  - renders into a temporary printbuf via fn##_to_text(),
 *  - appends a newline if the output is non-empty and does not end in one,
 *  - turns a zero return with a failed printbuf allocation into -ENOMEM,
 *  - on success copies at most PAGE_SIZE - 1 bytes into @buf and returns the
 *    number of bytes copied,
 *  - passes the final return value through bch2_err_class().
 */
#define SHOW(fn)							\
static ssize_t fn ## _to_text(struct printbuf *,			\
			      struct kobject *, struct attribute *);	\
									\
static ssize_t fn ## _show(struct kobject *kobj, struct attribute *attr,\
			   char *buf)					\
{									\
	struct printbuf text = PRINTBUF;				\
	ssize_t ret = fn ## _to_text(&text, kobj, attr);		\
									\
	if (text.pos && text.buf[text.pos - 1] != '\n')			\
		prt_newline(&text);					\
									\
	if (!ret) {							\
		if (text.allocation_failure) {				\
			ret = -ENOMEM;					\
		} else {						\
			ret = min_t(size_t, text.pos, PAGE_SIZE - 1);	\
			memcpy(buf, text.buf, ret);			\
		}							\
	}								\
									\
	printbuf_exit(&text);						\
	return bch2_err_class(ret);					\
}									\
									\
static ssize_t fn ## _to_text(struct printbuf *out, struct kobject *kobj,\
			      struct attribute *attr)
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
/*
 * STORE(fn) - emit the sysfs ->store() wrapper for @fn and open the
 * definition of fn##_store_inner(kobj, attr, buf, size); the braces that
 * follow STORE(fn) become the body of fn##_store_inner().
 *
 * fn##_store() simply forwards to fn##_store_inner() and passes the result
 * through bch2_err_class().
 */
#define STORE(fn)							\
static ssize_t fn ## _store_inner(struct kobject *, struct attribute *,\
				  const char *, size_t);		\
									\
static ssize_t fn ## _store(struct kobject *kobj, struct attribute *attr,\
			    const char *buf, size_t size)		\
{									\
	ssize_t ret = fn ## _store_inner(kobj, attr, buf, size);	\
									\
	return bch2_err_class(ret);					\
}									\
									\
static ssize_t fn ## _store_inner(struct kobject *kobj, struct attribute *attr,\
				  const char *buf, size_t size)
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
/* Declare a file-local `struct attribute sysfs_<name>` with the given mode. */
#define __sysfs_attribute(_name, _mode)					\
	static struct attribute sysfs_##_name = {			\
		.name	= #_name,					\
		.mode	= _mode,					\
	}

/* Shorthands: write-only (0200), read-only (0444), read-write (0644). */
#define write_attribute(n)	__sysfs_attribute(n, 0200)
#define read_attribute(n)	__sysfs_attribute(n, 0444)
#define rw_attribute(n)		__sysfs_attribute(n, 0644)
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
/*
 * For use inside a SHOW() body (needs `attr` and `out` in scope): when the
 * attribute being read is sysfs_<file>, print the formatted value followed
 * by a newline.
 */
#define sysfs_printf(file, fmt, ...)					\
do {									\
	if (&sysfs_ ## file == attr) {					\
		prt_printf(out, fmt "\n", __VA_ARGS__);			\
	}								\
} while (0)
|
|
|
|
|
|
|
|
/*
 * For use inside a SHOW() body (needs `attr` and `out` in scope): when the
 * attribute being read is sysfs_<file>, print @var via snprint().
 */
#define sysfs_print(file, var)						\
do {									\
	if (&sysfs_ ## file == attr) {					\
		snprint(out, var);					\
	}								\
} while (0)
|
|
|
|
|
|
|
|
/*
 * For use inside a SHOW() body (needs `attr` and `out` in scope): when the
 * attribute being read is sysfs_<file>, print @val in human readable form.
 */
#define sysfs_hprint(file, val)						\
do {									\
	if (&sysfs_ ## file == attr) {					\
		prt_human_readable_s64(out, val);			\
	}								\
} while (0)
|
|
|
|
|
|
|
|
/*
 * For use inside a STORE() body (needs `attr`, `buf` and `size` in scope):
 * when the attribute being written is sysfs_<file>, parse @buf into @var and
 * return from the enclosing function - the parse error if there was one,
 * otherwise @size.
 */
#define sysfs_strtoul(file, var)					\
do {									\
	if (&sysfs_ ## file == attr) {					\
		ssize_t _ret = strtoul_safe(buf, var);			\
									\
		return _ret ? _ret : (ssize_t) size;			\
	}								\
} while (0)
|
|
|
|
|
|
|
|
/*
 * Like sysfs_strtoul(), but parses with strtoul_safe_clamp() using the
 * bounds @min and @max. Returns from the enclosing function when the
 * attribute being written is sysfs_<file>.
 */
#define sysfs_strtoul_clamp(file, var, min, max)			\
do {									\
	if (&sysfs_ ## file == attr) {					\
		ssize_t _ret = strtoul_safe_clamp(buf, var, min, max);	\
									\
		return _ret ? _ret : (ssize_t) size;			\
	}								\
} while (0)
|
|
|
|
|
|
|
|
/*
 * Parse @cp as a base-10 unsigned long and evaluate to the parsed value.
 *
 * NOTE: on a parse error this *returns from the enclosing function* with the
 * kstrtoul() error code, so it must not be used while the caller holds
 * anything that has to be released on the way out.
 */
#define strtoul_or_return(cp)						\
({									\
	unsigned long _val;						\
	int _err = kstrtoul(cp, 10, &_val);				\
									\
	if (_err)							\
		return _err;						\
	_val;								\
})
|
|
|
|
|
|
|
|
write_attribute(trigger_gc);
|
2022-04-07 18:38:16 -04:00
|
|
|
write_attribute(trigger_discards);
|
2022-06-13 19:34:17 -04:00
|
|
|
write_attribute(trigger_invalidates);
|
2024-04-13 22:43:11 -04:00
|
|
|
write_attribute(trigger_journal_flush);
|
2024-06-28 21:40:00 -04:00
|
|
|
write_attribute(trigger_journal_writes);
|
2024-04-20 14:49:22 -04:00
|
|
|
write_attribute(trigger_btree_cache_shrink);
|
|
|
|
write_attribute(trigger_btree_key_cache_shrink);
|
2024-07-11 16:11:45 -04:00
|
|
|
write_attribute(trigger_freelist_wakeup);
|
2021-04-13 15:00:40 -04:00
|
|
|
rw_attribute(gc_gens_pos);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
read_attribute(uuid);
|
|
|
|
read_attribute(minor);
|
2023-11-26 17:05:02 -05:00
|
|
|
read_attribute(flags);
|
2017-03-16 22:18:50 -08:00
|
|
|
read_attribute(bucket_size);
|
|
|
|
read_attribute(first_bucket);
|
|
|
|
read_attribute(nbuckets);
|
2022-05-25 16:11:56 +12:00
|
|
|
rw_attribute(durability);
|
2023-10-25 16:29:37 -04:00
|
|
|
read_attribute(io_done);
|
|
|
|
read_attribute(io_errors);
|
|
|
|
write_attribute(io_errors_reset);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
read_attribute(io_latency_read);
|
|
|
|
read_attribute(io_latency_write);
|
|
|
|
read_attribute(io_latency_stats_read);
|
|
|
|
read_attribute(io_latency_stats_write);
|
|
|
|
read_attribute(congested);
|
|
|
|
|
2022-10-28 17:08:41 -04:00
|
|
|
read_attribute(btree_write_stats);
|
2021-03-31 21:07:37 -04:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
read_attribute(btree_cache_size);
|
|
|
|
read_attribute(compression_stats);
|
|
|
|
read_attribute(journal_debug);
|
2020-11-19 20:13:30 -05:00
|
|
|
read_attribute(btree_cache);
|
2020-06-15 19:53:46 -04:00
|
|
|
read_attribute(btree_key_cache);
|
2024-07-11 16:30:41 -04:00
|
|
|
read_attribute(btree_reserve_cache);
|
2020-07-06 20:18:13 -04:00
|
|
|
read_attribute(stripes_heap);
|
2021-07-12 23:52:49 -04:00
|
|
|
read_attribute(open_buckets);
|
2023-02-28 23:08:48 -05:00
|
|
|
read_attribute(open_buckets_partial);
|
2022-10-31 16:13:05 -04:00
|
|
|
read_attribute(write_points);
|
2022-12-07 18:41:21 +13:00
|
|
|
read_attribute(nocow_lock_table);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2023-02-09 12:21:45 -05:00
|
|
|
#ifdef BCH_WRITE_REF_DEBUG
|
|
|
|
read_attribute(write_refs);
|
|
|
|
|
2023-07-06 22:47:42 -04:00
|
|
|
static const char * const bch2_write_refs[] = {
|
2023-02-09 12:21:45 -05:00
|
|
|
#define x(n) #n,
|
|
|
|
BCH_WRITE_REFS()
|
|
|
|
#undef x
|
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
|
|
|
static void bch2_write_refs_to_text(struct printbuf *out, struct bch_fs *c)
|
|
|
|
{
|
|
|
|
bch2_printbuf_tabstop_push(out, 24);
|
|
|
|
|
2024-04-10 16:08:24 -04:00
|
|
|
for (unsigned i = 0; i < ARRAY_SIZE(c->writes); i++)
|
|
|
|
prt_printf(out, "%s\t%li\n", bch2_write_refs[i], atomic_long_read(&c->writes[i]));
|
2023-02-09 12:21:45 -05:00
|
|
|
}
|
|
|
|
#endif
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
read_attribute(internal_uuid);
|
2023-05-30 14:41:50 -04:00
|
|
|
read_attribute(disk_groups);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
read_attribute(has_data);
|
|
|
|
read_attribute(alloc_debug);
|
2024-02-24 19:58:07 -05:00
|
|
|
read_attribute(accounting);
|
2024-02-23 17:23:41 -05:00
|
|
|
read_attribute(usage_base);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-03-15 21:36:33 +13:00
|
|
|
#define x(t, n, ...) read_attribute(t);
|
|
|
|
BCH_PERSISTENT_COUNTERS()
|
|
|
|
#undef x
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
rw_attribute(discard);
|
|
|
|
rw_attribute(label);
|
|
|
|
|
|
|
|
rw_attribute(copy_gc_enabled);
|
2021-04-13 14:45:55 -04:00
|
|
|
read_attribute(copy_gc_wait);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
rw_attribute(rebalance_enabled);
|
|
|
|
sysfs_pd_controller_attribute(rebalance);
|
bcachefs: rebalance_work
This adds a new btree, rebalance_work, to eliminate scanning required
for finding extents that need work done on them in the background - i.e.
for the background_target and background_compression options.
rebalance_work is a bitset btree, where a KEY_TYPE_set corresponds to an
extent in the extents or reflink btree at the same pos.
A new extent field is added, bch_extent_rebalance, which indicates that
this extent has work that needs to be done in the background - and which
options to use. This allows per-inode options to be propagated to
indirect extents - at least in some circumstances. In this patch,
changing IO options on a file will not propagate the new options to
indirect extents pointed to by that file.
Updating (setting/clearing) the rebalance_work btree is done by the
extent trigger, which looks at the bch_extent_rebalance field.
Scanning is still required after changing IO path options - either just
for a given inode, or for the whole filesystem. We indicate that
scanning is required by adding a KEY_TYPE_cookie key to the
rebalance_work btree: the cookie counter is so that we can detect that
scanning is still required when an option has been flipped mid-way
through an existing scan.
Future possible work:
- Propagate options to indirect extents when being changed
- Add other IO path options - nr_replicas, ec, to rebalance_work so
they can be applied in the background when they change
- Add a counter, for bcachefs fs usage output, showing the pending
amount of rebalance work: we'll probably want to do this after the
disk space accounting rewrite (moving it to a new btree)
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2023-10-20 13:33:14 -04:00
|
|
|
read_attribute(rebalance_status);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2018-11-01 15:13:19 -04:00
|
|
|
read_attribute(new_stripes);
|
|
|
|
|
2019-12-19 15:07:51 -05:00
|
|
|
read_attribute(io_timers_read);
|
|
|
|
read_attribute(io_timers_write);
|
|
|
|
|
2023-03-11 20:38:46 -05:00
|
|
|
read_attribute(moving_ctxts);
|
2021-07-23 13:57:19 -06:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
#ifdef CONFIG_BCACHEFS_TESTS
|
|
|
|
write_attribute(perf_test);
|
|
|
|
#endif /* CONFIG_BCACHEFS_TESTS */
|
|
|
|
|
|
|
|
#define x(_name) \
|
|
|
|
static struct attribute sysfs_time_stat_##_name = \
|
2024-08-19 15:33:38 -04:00
|
|
|
{ .name = #_name, .mode = 0644 };
|
2017-03-16 22:18:50 -08:00
|
|
|
BCH_TIME_STATS()
|
|
|
|
#undef x
|
|
|
|
|
|
|
|
static struct attribute sysfs_state_rw = {
|
|
|
|
.name = "state",
|
2022-10-22 15:59:53 -04:00
|
|
|
.mode = 0444,
|
2017-03-16 22:18:50 -08:00
|
|
|
};
|
|
|
|
|
|
|
|
static size_t bch2_btree_cache_size(struct bch_fs *c)
|
|
|
|
{
|
bcachefs: Rework btree node pinning
In backpointers fsck, we do a seqential scan of one btree, and check
references to another: extents <-> backpointers
Checking references generates random lookups, so we want to pin that
btree in memory (or only a range, if it doesn't fit in ram).
Previously, this was done with a simple check in the shrinker - "if
btree node is in range being pinned, don't free it" - but this generated
OOMs, as our shrinker wasn't well behaved if there was less memory
available than expected.
Instead, we now have two different shrinkers and lru lists; the second
shrinker being for pinned nodes, with seeks set much higher than normal
- so they can still be freed if necessary, but we'll prefer not to.
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2024-09-04 20:49:37 -04:00
|
|
|
struct btree_cache *bc = &c->btree_cache;
|
2017-03-16 22:18:50 -08:00
|
|
|
size_t ret = 0;
|
|
|
|
struct btree *b;
|
|
|
|
|
bcachefs: Rework btree node pinning
In backpointers fsck, we do a seqential scan of one btree, and check
references to another: extents <-> backpointers
Checking references generates random lookups, so we want to pin that
btree in memory (or only a range, if it doesn't fit in ram).
Previously, this was done with a simple check in the shrinker - "if
btree node is in range being pinned, don't free it" - but this generated
OOMs, as our shrinker wasn't well behaved if there was less memory
available than expected.
Instead, we now have two different shrinkers and lru lists; the second
shrinker being for pinned nodes, with seeks set much higher than normal
- so they can still be freed if necessary, but we'll prefer not to.
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2024-09-04 20:49:37 -04:00
|
|
|
mutex_lock(&bc->lock);
|
|
|
|
list_for_each_entry(b, &bc->live[0].list, list)
|
2024-01-16 13:29:59 -05:00
|
|
|
ret += btree_buf_bytes(b);
|
bcachefs: Rework btree node pinning
In backpointers fsck, we do a seqential scan of one btree, and check
references to another: extents <-> backpointers
Checking references generates random lookups, so we want to pin that
btree in memory (or only a range, if it doesn't fit in ram).
Previously, this was done with a simple check in the shrinker - "if
btree node is in range being pinned, don't free it" - but this generated
OOMs, as our shrinker wasn't well behaved if there was less memory
available than expected.
Instead, we now have two different shrinkers and lru lists; the second
shrinker being for pinned nodes, with seeks set much higher than normal
- so they can still be freed if necessary, but we'll prefer not to.
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2024-09-04 20:49:37 -04:00
|
|
|
list_for_each_entry(b, &bc->live[1].list, list)
|
|
|
|
ret += btree_buf_bytes(b);
|
|
|
|
list_for_each_entry(b, &bc->freeable, list)
|
|
|
|
ret += btree_buf_bytes(b);
|
|
|
|
mutex_unlock(&bc->lock);
|
2017-03-16 22:18:50 -08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2020-07-25 17:06:11 -04:00
|
|
|
static int bch2_compression_stats_to_text(struct printbuf *out, struct bch_fs *c)
|
2017-03-16 22:18:50 -08:00
|
|
|
{
|
2024-02-24 21:09:51 -05:00
|
|
|
prt_str(out, "type");
|
2023-11-24 23:40:08 -05:00
|
|
|
printbuf_tabstop_push(out, 12);
|
|
|
|
printbuf_tabstop_push(out, 16);
|
|
|
|
printbuf_tabstop_push(out, 16);
|
|
|
|
printbuf_tabstop_push(out, 24);
|
2024-04-10 16:08:24 -04:00
|
|
|
prt_printf(out, "type\tcompressed\runcompressed\raverage extent size\r\n");
|
2023-11-24 23:40:08 -05:00
|
|
|
|
2024-02-24 21:09:51 -05:00
|
|
|
for (unsigned i = 1; i < BCH_COMPRESSION_TYPE_NR; i++) {
|
|
|
|
struct disk_accounting_pos a = {
|
|
|
|
.type = BCH_DISK_ACCOUNTING_compression,
|
|
|
|
.compression.type = i,
|
|
|
|
};
|
|
|
|
struct bpos p = disk_accounting_pos_to_bpos(&a);
|
|
|
|
u64 v[3];
|
|
|
|
bch2_accounting_mem_read(c, p, v, ARRAY_SIZE(v));
|
|
|
|
|
|
|
|
u64 nr_extents = v[0];
|
|
|
|
u64 sectors_uncompressed = v[1];
|
|
|
|
u64 sectors_compressed = v[2];
|
|
|
|
|
2024-01-06 21:01:47 -05:00
|
|
|
bch2_prt_compression_type(out, i);
|
2023-11-24 23:40:08 -05:00
|
|
|
prt_tab(out);
|
|
|
|
|
2024-02-24 21:09:51 -05:00
|
|
|
prt_human_readable_u64(out, sectors_compressed << 9);
|
2023-11-24 23:40:08 -05:00
|
|
|
prt_tab_rjust(out);
|
|
|
|
|
2024-02-24 21:09:51 -05:00
|
|
|
prt_human_readable_u64(out, sectors_uncompressed << 9);
|
2023-11-24 23:40:08 -05:00
|
|
|
prt_tab_rjust(out);
|
|
|
|
|
2024-02-24 21:09:51 -05:00
|
|
|
prt_human_readable_u64(out, nr_extents
|
2024-09-05 16:59:29 +00:00
|
|
|
? div64_u64(sectors_uncompressed << 9, nr_extents)
|
2023-11-24 23:40:08 -05:00
|
|
|
: 0);
|
|
|
|
prt_tab_rjust(out);
|
|
|
|
prt_newline(out);
|
|
|
|
}
|
|
|
|
|
2020-07-25 17:06:11 -04:00
|
|
|
return 0;
|
2018-11-01 15:13:19 -04:00
|
|
|
}
|
|
|
|
|
2021-05-23 17:04:13 -04:00
|
|
|
static void bch2_gc_gens_pos_to_text(struct printbuf *out, struct bch_fs *c)
|
2021-04-13 15:00:40 -04:00
|
|
|
{
|
2023-10-19 22:49:08 -04:00
|
|
|
prt_printf(out, "%s: ", bch2_btree_id_str(c->gc_gens_btree));
|
2021-04-13 15:00:40 -04:00
|
|
|
bch2_bpos_to_text(out, c->gc_gens_pos);
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_printf(out, "\n");
|
2021-04-13 15:00:40 -04:00
|
|
|
}
|
|
|
|
|
2024-02-23 17:23:41 -05:00
|
|
|
static void bch2_fs_usage_base_to_text(struct printbuf *out, struct bch_fs *c)
|
|
|
|
{
|
|
|
|
struct bch_fs_usage_base b = {};
|
|
|
|
|
|
|
|
acc_u64s_percpu(&b.hidden, &c->usage->hidden, sizeof(b) / sizeof(u64));
|
|
|
|
|
|
|
|
prt_printf(out, "hidden:\t\t%llu\n", b.hidden);
|
|
|
|
prt_printf(out, "btree:\t\t%llu\n", b.btree);
|
|
|
|
prt_printf(out, "data:\t\t%llu\n", b.data);
|
|
|
|
prt_printf(out, "cached:\t%llu\n", b.cached);
|
|
|
|
prt_printf(out, "reserved:\t\t%llu\n", b.reserved);
|
|
|
|
prt_printf(out, "nr_inodes:\t%llu\n", b.nr_inodes);
|
|
|
|
}
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
SHOW(bch2_fs)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, kobj);
|
|
|
|
|
|
|
|
sysfs_print(minor, c->minor);
|
|
|
|
sysfs_printf(internal_uuid, "%pU", c->sb.uuid.b);
|
|
|
|
|
2023-11-26 17:05:02 -05:00
|
|
|
if (attr == &sysfs_flags)
|
|
|
|
prt_bitflags(out, bch2_fs_flag_strs, c->flags);
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
sysfs_hprint(btree_cache_size, bch2_btree_cache_size(c));
|
2022-10-28 17:08:41 -04:00
|
|
|
|
|
|
|
if (attr == &sysfs_btree_write_stats)
|
|
|
|
bch2_btree_write_stats_to_text(out, c);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_gc_gens_pos)
|
|
|
|
bch2_gc_gens_pos_to_text(out, c);
|
2021-04-13 15:00:40 -04:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
sysfs_printf(copy_gc_enabled, "%i", c->copy_gc_enabled);
|
|
|
|
|
|
|
|
sysfs_printf(rebalance_enabled, "%i", c->rebalance.enabled);
|
|
|
|
sysfs_pd_controller_show(rebalance, &c->rebalance.pd); /* XXX */
|
2023-03-01 23:10:39 -05:00
|
|
|
|
|
|
|
if (attr == &sysfs_copy_gc_wait)
|
|
|
|
bch2_copygc_wait_to_text(out, c);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
bcachefs: rebalance_work
This adds a new btree, rebalance_work, to eliminate scanning required
for finding extents that need work done on them in the background - i.e.
for the background_target and background_compression options.
rebalance_work is a bitset btree, where a KEY_TYPE_set corresponds to an
extent in the extents or reflink btree at the same pos.
A new extent field is added, bch_extent_rebalance, which indicates that
this extent has work that needs to be done in the background - and which
options to use. This allows per-inode options to be propagated to
indirect extents - at least in some circumstances. In this patch,
changing IO options on a file will not propagate the new options to
indirect extents pointed to by that file.
Updating (setting/clearing) the rebalance_work btree is done by the
extent trigger, which looks at the bch_extent_rebalance field.
Scanning is still requrired after changing IO path options - either just
for a given inode, or for the whole filesystem. We indicate that
scanning is required by adding a KEY_TYPE_cookie key to the
rebalance_work btree: the cookie counter is so that we can detect that
scanning is still required when an option has been flipped mid-way
through an existing scan.
Future possible work:
- Propagate options to indirect extents when being changed
- Add other IO path options - nr_replicas, ec, to rebalance_work so
they can be applied in the background when they change
- Add a counter, for bcachefs fs usage output, showing the pending
amount of rebalance work: we'll probably want to do this after the
disk space accounting rewrite (moving it to a new btree)
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2023-10-20 13:33:14 -04:00
|
|
|
if (attr == &sysfs_rebalance_status)
|
|
|
|
bch2_rebalance_status_to_text(out, c);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
/* Debugging: */
|
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_journal_debug)
|
|
|
|
bch2_journal_debug_to_text(out, &c->journal);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_btree_cache)
|
2022-09-30 16:37:15 +13:00
|
|
|
bch2_btree_cache_to_text(out, &c->btree_cache);
|
2020-11-19 20:13:30 -05:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_btree_key_cache)
|
|
|
|
bch2_btree_key_cache_to_text(out, &c->btree_key_cache);
|
2020-06-15 19:53:46 -04:00
|
|
|
|
2024-07-11 16:30:41 -04:00
|
|
|
if (attr == &sysfs_btree_reserve_cache)
|
|
|
|
bch2_btree_reserve_cache_to_text(out, c);
|
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_stripes_heap)
|
|
|
|
bch2_stripes_heap_to_text(out, c);
|
2020-07-06 20:18:13 -04:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_open_buckets)
|
2024-08-06 21:02:34 -04:00
|
|
|
bch2_open_buckets_to_text(out, c, NULL);
|
2021-07-12 23:52:49 -04:00
|
|
|
|
2023-02-28 23:08:48 -05:00
|
|
|
if (attr == &sysfs_open_buckets_partial)
|
|
|
|
bch2_open_buckets_partial_to_text(out, c);
|
|
|
|
|
2022-10-31 16:13:05 -04:00
|
|
|
if (attr == &sysfs_write_points)
|
|
|
|
bch2_write_points_to_text(out, c);
|
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_compression_stats)
|
|
|
|
bch2_compression_stats_to_text(out, c);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_new_stripes)
|
|
|
|
bch2_new_stripes_to_text(out, c);
|
2018-11-01 15:13:19 -04:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_io_timers_read)
|
|
|
|
bch2_io_timers_to_text(out, &c->io_clock[READ]);
|
2019-12-19 15:07:51 -05:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_io_timers_write)
|
|
|
|
bch2_io_timers_to_text(out, &c->io_clock[WRITE]);
|
|
|
|
|
2023-03-11 20:38:46 -05:00
|
|
|
if (attr == &sysfs_moving_ctxts)
|
|
|
|
bch2_fs_moving_ctxts_to_text(out, c);
|
2021-07-23 13:57:19 -06:00
|
|
|
|
2023-02-09 12:21:45 -05:00
|
|
|
#ifdef BCH_WRITE_REF_DEBUG
|
|
|
|
if (attr == &sysfs_write_refs)
|
|
|
|
bch2_write_refs_to_text(out, c);
|
|
|
|
#endif
|
|
|
|
|
2022-12-14 20:52:11 -05:00
|
|
|
if (attr == &sysfs_nocow_lock_table)
|
|
|
|
bch2_nocow_locks_to_text(out, &c->nocow_locks);
|
2022-12-07 18:41:21 +13:00
|
|
|
|
2023-05-30 14:41:50 -04:00
|
|
|
if (attr == &sysfs_disk_groups)
|
|
|
|
bch2_disk_groups_to_text(out, c);
|
|
|
|
|
2024-04-16 00:11:33 -04:00
|
|
|
if (attr == &sysfs_alloc_debug)
|
2024-05-03 14:49:23 -04:00
|
|
|
bch2_fs_alloc_debug_to_text(out, c);
|
2024-04-16 00:11:33 -04:00
|
|
|
|
2024-02-24 19:58:07 -05:00
|
|
|
if (attr == &sysfs_accounting)
|
|
|
|
bch2_fs_accounting_to_text(out, c);
|
|
|
|
|
2024-02-23 17:23:41 -05:00
|
|
|
if (attr == &sysfs_usage_base)
|
|
|
|
bch2_fs_usage_base_to_text(out, c);
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2020-06-15 14:58:47 -04:00
|
|
|
STORE(bch2_fs)
|
2017-03-16 22:18:50 -08:00
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, kobj);
|
|
|
|
|
|
|
|
if (attr == &sysfs_copy_gc_enabled) {
|
|
|
|
ssize_t ret = strtoul_safe(buf, c->copy_gc_enabled)
|
|
|
|
?: (ssize_t) size;
|
|
|
|
|
2020-07-11 16:28:54 -04:00
|
|
|
if (c->copygc_thread)
|
|
|
|
wake_up_process(c->copygc_thread);
|
2017-03-16 22:18:50 -08:00
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (attr == &sysfs_rebalance_enabled) {
|
|
|
|
ssize_t ret = strtoul_safe(buf, c->rebalance.enabled)
|
|
|
|
?: (ssize_t) size;
|
|
|
|
|
|
|
|
rebalance_wakeup(c);
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
sysfs_pd_controller_store(rebalance, &c->rebalance.pd);
|
|
|
|
|
|
|
|
/* Debugging: */
|
|
|
|
|
2023-11-26 17:05:02 -05:00
|
|
|
if (!test_bit(BCH_FS_started, &c->flags))
|
2017-03-16 22:18:50 -08:00
|
|
|
return -EPERM;
|
|
|
|
|
|
|
|
/* Debugging: */
|
|
|
|
|
2024-04-13 22:43:11 -04:00
|
|
|
if (!bch2_write_ref_tryget(c, BCH_WRITE_REF_sysfs))
|
2021-12-24 04:51:10 -05:00
|
|
|
return -EROFS;
|
|
|
|
|
2024-04-20 14:49:22 -04:00
|
|
|
if (attr == &sysfs_trigger_btree_cache_shrink) {
|
bcachefs: Rework btree node pinning
In backpointers fsck, we do a seqential scan of one btree, and check
references to another: extents <-> backpointers
Checking references generates random lookups, so we want to pin that
btree in memory (or only a range, if it doesn't fit in ram).
Previously, this was done with a simple check in the shrinker - "if
btree node is in range being pinned, don't free it" - but this generated
OOMs, as our shrinker wasn't well behaved if there was less memory
available than expected.
Instead, we now have two different shrinkers and lru lists; the second
shrinker being for pinned nodes, with seeks set much higher than normal
- so they can still be freed if necessary, but we'll prefer not to.
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2024-09-04 20:49:37 -04:00
|
|
|
struct btree_cache *bc = &c->btree_cache;
|
2021-12-24 04:51:10 -05:00
|
|
|
struct shrink_control sc;
|
|
|
|
|
|
|
|
sc.gfp_mask = GFP_KERNEL;
|
|
|
|
sc.nr_to_scan = strtoul_or_return(buf);
|
bcachefs: Rework btree node pinning
In backpointers fsck, we do a seqential scan of one btree, and check
references to another: extents <-> backpointers
Checking references generates random lookups, so we want to pin that
btree in memory (or only a range, if it doesn't fit in ram).
Previously, this was done with a simple check in the shrinker - "if
btree node is in range being pinned, don't free it" - but this generated
OOMs, as our shrinker wasn't well behaved if there was less memory
available than expected.
Instead, we now have two different shrinkers and lru lists; the second
shrinker being for pinned nodes, with seeks set much higher than normal
- so they can still be freed if necessary, but we'll prefer not to.
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2024-09-04 20:49:37 -04:00
|
|
|
bc->live[0].shrink->scan_objects(bc->live[0].shrink, &sc);
|
2021-12-24 04:51:10 -05:00
|
|
|
}
|
|
|
|
|
2024-04-20 14:49:22 -04:00
|
|
|
if (attr == &sysfs_trigger_btree_key_cache_shrink) {
|
|
|
|
struct shrink_control sc;
|
|
|
|
|
|
|
|
sc.gfp_mask = GFP_KERNEL;
|
|
|
|
sc.nr_to_scan = strtoul_or_return(buf);
|
2024-09-05 21:18:57 -04:00
|
|
|
c->btree_key_cache.shrink->scan_objects(c->btree_key_cache.shrink, &sc);
|
2024-04-20 14:49:22 -04:00
|
|
|
}
|
2022-09-17 15:20:13 -04:00
|
|
|
|
2024-04-06 00:11:01 -04:00
|
|
|
if (attr == &sysfs_trigger_gc)
|
2020-06-15 15:10:54 -04:00
|
|
|
bch2_gc_gens(c);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-04-07 18:38:16 -04:00
|
|
|
if (attr == &sysfs_trigger_discards)
|
|
|
|
bch2_do_discards(c);
|
|
|
|
|
2022-06-13 19:34:17 -04:00
|
|
|
if (attr == &sysfs_trigger_invalidates)
|
|
|
|
bch2_do_invalidates(c);
|
|
|
|
|
2024-04-13 22:43:11 -04:00
|
|
|
if (attr == &sysfs_trigger_journal_flush) {
|
|
|
|
bch2_journal_flush_all_pins(&c->journal);
|
|
|
|
bch2_journal_meta(&c->journal);
|
|
|
|
}
|
|
|
|
|
2024-06-28 21:40:00 -04:00
|
|
|
if (attr == &sysfs_trigger_journal_writes)
|
|
|
|
bch2_journal_do_writes(&c->journal);
|
|
|
|
|
2024-07-11 16:11:45 -04:00
|
|
|
if (attr == &sysfs_trigger_freelist_wakeup)
|
|
|
|
closure_wake_up(&c->freelist_wait);
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
#ifdef CONFIG_BCACHEFS_TESTS
|
|
|
|
if (attr == &sysfs_perf_test) {
|
|
|
|
char *tmp = kstrdup(buf, GFP_KERNEL), *p = tmp;
|
|
|
|
char *test = strsep(&p, " \t\n");
|
|
|
|
char *nr_str = strsep(&p, " \t\n");
|
|
|
|
char *threads_str = strsep(&p, " \t\n");
|
|
|
|
unsigned threads;
|
|
|
|
u64 nr;
|
|
|
|
int ret = -EINVAL;
|
|
|
|
|
|
|
|
if (threads_str &&
|
|
|
|
!(ret = kstrtouint(threads_str, 10, &threads)) &&
|
|
|
|
!(ret = bch2_strtoull_h(nr_str, &nr)))
|
2020-12-01 12:23:55 -05:00
|
|
|
ret = bch2_btree_perf_test(c, test, nr, threads);
|
2017-03-16 22:18:50 -08:00
|
|
|
kfree(tmp);
|
2020-12-01 12:23:55 -05:00
|
|
|
|
|
|
|
if (ret)
|
|
|
|
size = ret;
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
#endif
|
2024-04-13 22:43:11 -04:00
|
|
|
bch2_write_ref_put(c, BCH_WRITE_REF_sysfs);
|
2017-03-16 22:18:50 -08:00
|
|
|
return size;
|
|
|
|
}
|
|
|
|
SYSFS_OPS(bch2_fs);
|
|
|
|
|
|
|
|
struct attribute *bch2_fs_files[] = {
|
|
|
|
&sysfs_minor,
|
|
|
|
&sysfs_btree_cache_size,
|
2022-10-28 17:08:41 -04:00
|
|
|
&sysfs_btree_write_stats,
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2024-07-31 23:39:49 -04:00
|
|
|
&sysfs_rebalance_status,
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
&sysfs_compression_stats,
|
|
|
|
|
|
|
|
#ifdef CONFIG_BCACHEFS_TESTS
|
|
|
|
&sysfs_perf_test,
|
|
|
|
#endif
|
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
2022-03-15 21:36:33 +13:00
|
|
|
/* counters dir */
|
|
|
|
|
|
|
|
SHOW(bch2_fs_counters)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, counters_kobj);
|
|
|
|
u64 counter = 0;
|
|
|
|
u64 counter_since_mount = 0;
|
|
|
|
|
2023-02-03 21:01:40 -05:00
|
|
|
printbuf_tabstop_push(out, 32);
|
|
|
|
|
2022-03-15 21:36:33 +13:00
|
|
|
#define x(t, ...) \
|
|
|
|
if (attr == &sysfs_##t) { \
|
|
|
|
counter = percpu_u64_get(&c->counters[BCH_COUNTER_##t]);\
|
|
|
|
counter_since_mount = counter - c->counters_on_mount[BCH_COUNTER_##t];\
|
2024-04-10 16:08:24 -04:00
|
|
|
prt_printf(out, "since mount:\t"); \
|
2023-03-30 18:49:02 -04:00
|
|
|
prt_human_readable_u64(out, counter_since_mount); \
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_newline(out); \
|
2022-03-15 21:36:33 +13:00
|
|
|
\
|
2024-04-10 16:08:24 -04:00
|
|
|
prt_printf(out, "since filesystem creation:\t"); \
|
2023-03-30 18:49:02 -04:00
|
|
|
prt_human_readable_u64(out, counter); \
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_newline(out); \
|
2022-03-15 21:36:33 +13:00
|
|
|
}
|
|
|
|
BCH_PERSISTENT_COUNTERS()
|
|
|
|
#undef x
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
 * The counter attributes are all declared with read_attribute(); this store
 * handler only exists so that SYSFS_OPS(bch2_fs_counters) has a ->store to
 * reference. It accepts nothing and returns 0.
 */
STORE(bch2_fs_counters)
{
	return 0;
}
|
|
|
|
|
|
|
|
SYSFS_OPS(bch2_fs_counters);
|
|
|
|
|
|
|
|
struct attribute *bch2_fs_counters_files[] = {
|
|
|
|
#define x(t, ...) \
|
|
|
|
&sysfs_##t,
|
|
|
|
BCH_PERSISTENT_COUNTERS()
|
|
|
|
#undef x
|
|
|
|
NULL
|
|
|
|
};
|
2017-03-16 22:18:50 -08:00
|
|
|
/* internal dir - just a wrapper */
|
|
|
|
|
|
|
|
SHOW(bch2_fs_internal)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, internal);
|
2022-10-22 15:59:53 -04:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
return bch2_fs_to_text(out, &c->kobj, attr);
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
STORE(bch2_fs_internal)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, internal);
|
2022-10-22 15:59:53 -04:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
return bch2_fs_store(&c->kobj, attr, buf, size);
|
|
|
|
}
|
|
|
|
SYSFS_OPS(bch2_fs_internal);
|
|
|
|
|
|
|
|
struct attribute *bch2_fs_internal_files[] = {
|
2023-11-26 17:05:02 -05:00
|
|
|
&sysfs_flags,
|
2017-03-16 22:18:50 -08:00
|
|
|
&sysfs_journal_debug,
|
2020-11-19 20:13:30 -05:00
|
|
|
&sysfs_btree_cache,
|
2020-06-15 19:53:46 -04:00
|
|
|
&sysfs_btree_key_cache,
|
2024-07-11 16:30:41 -04:00
|
|
|
&sysfs_btree_reserve_cache,
|
2021-12-14 14:24:04 -05:00
|
|
|
&sysfs_new_stripes,
|
2020-07-06 20:18:13 -04:00
|
|
|
&sysfs_stripes_heap,
|
2021-07-12 23:52:49 -04:00
|
|
|
&sysfs_open_buckets,
|
2023-02-28 23:08:48 -05:00
|
|
|
&sysfs_open_buckets_partial,
|
2022-10-31 16:13:05 -04:00
|
|
|
&sysfs_write_points,
|
2023-02-09 12:21:45 -05:00
|
|
|
#ifdef BCH_WRITE_REF_DEBUG
|
|
|
|
&sysfs_write_refs,
|
|
|
|
#endif
|
2022-12-07 18:41:21 +13:00
|
|
|
&sysfs_nocow_lock_table,
|
2021-12-14 14:24:04 -05:00
|
|
|
&sysfs_io_timers_read,
|
|
|
|
&sysfs_io_timers_write,
|
|
|
|
|
|
|
|
&sysfs_trigger_gc,
|
2022-04-07 18:38:16 -04:00
|
|
|
&sysfs_trigger_discards,
|
2022-06-13 19:34:17 -04:00
|
|
|
&sysfs_trigger_invalidates,
|
2024-04-13 22:43:11 -04:00
|
|
|
&sysfs_trigger_journal_flush,
|
2024-06-28 21:40:00 -04:00
|
|
|
&sysfs_trigger_journal_writes,
|
2024-04-20 14:49:22 -04:00
|
|
|
&sysfs_trigger_btree_cache_shrink,
|
|
|
|
&sysfs_trigger_btree_key_cache_shrink,
|
2024-07-11 16:11:45 -04:00
|
|
|
&sysfs_trigger_freelist_wakeup,
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2021-04-13 15:00:40 -04:00
|
|
|
&sysfs_gc_gens_pos,
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
&sysfs_copy_gc_enabled,
|
2021-04-13 14:45:55 -04:00
|
|
|
&sysfs_copy_gc_wait,
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
&sysfs_rebalance_enabled,
|
|
|
|
sysfs_pd_controller_files(rebalance),
|
|
|
|
|
2023-03-11 20:38:46 -05:00
|
|
|
&sysfs_moving_ctxts,
|
2021-07-23 13:57:19 -06:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
&sysfs_internal_uuid,
|
2023-05-30 14:41:50 -04:00
|
|
|
|
|
|
|
&sysfs_disk_groups,
|
2024-04-16 00:11:33 -04:00
|
|
|
&sysfs_alloc_debug,
|
2024-02-24 19:58:07 -05:00
|
|
|
&sysfs_accounting,
|
2024-02-23 17:23:41 -05:00
|
|
|
&sysfs_usage_base,
|
2017-03-16 22:18:50 -08:00
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
|
|
|
/* options */
|
|
|
|
|
|
|
|
SHOW(bch2_fs_opts_dir)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, opts_dir);
|
|
|
|
const struct bch_option *opt = container_of(attr, struct bch_option, attr);
|
|
|
|
int id = opt - bch2_opt_table;
|
|
|
|
u64 v = bch2_opt_get_by_id(&c->opts, id);
|
|
|
|
|
2022-03-05 12:01:16 -05:00
|
|
|
bch2_opt_to_text(out, c, c->disk_sb.sb, opt, v, OPT_SHOW_FULL_LIST);
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_char(out, '\n');
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
return 0;
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
STORE(bch2_fs_opts_dir)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, opts_dir);
|
|
|
|
const struct bch_option *opt = container_of(attr, struct bch_option, attr);
|
|
|
|
int ret, id = opt - bch2_opt_table;
|
|
|
|
char *tmp;
|
|
|
|
u64 v;
|
|
|
|
|
2022-03-06 15:15:41 -05:00
|
|
|
/*
|
|
|
|
* We don't need to take c->writes for correctness, but it eliminates an
|
|
|
|
* unsightly error message in the dmesg log when we're RO:
|
|
|
|
*/
|
2023-02-09 12:21:45 -05:00
|
|
|
if (unlikely(!bch2_write_ref_tryget(c, BCH_WRITE_REF_sysfs)))
|
2022-03-06 15:15:41 -05:00
|
|
|
return -EROFS;
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
tmp = kstrdup(buf, GFP_KERNEL);
|
2022-03-06 15:15:41 -05:00
|
|
|
if (!tmp) {
|
|
|
|
ret = -ENOMEM;
|
|
|
|
goto err;
|
|
|
|
}
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-03-21 00:15:38 -04:00
|
|
|
ret = bch2_opt_parse(c, opt, strim(tmp), &v, NULL);
|
2017-03-16 22:18:50 -08:00
|
|
|
kfree(tmp);
|
|
|
|
|
|
|
|
if (ret < 0)
|
2022-03-06 15:15:41 -05:00
|
|
|
goto err;
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2018-11-12 18:30:55 -05:00
|
|
|
ret = bch2_opt_check_may_set(c, id, v);
|
|
|
|
if (ret < 0)
|
2022-03-06 15:15:41 -05:00
|
|
|
goto err;
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2024-07-15 19:26:46 -04:00
|
|
|
bch2_opt_set_sb(c, NULL, opt, v);
|
2017-03-16 22:18:50 -08:00
|
|
|
bch2_opt_set_by_id(&c->opts, id, v);
|
|
|
|
|
2024-01-16 16:20:21 -05:00
|
|
|
if (v &&
|
|
|
|
(id == Opt_background_target ||
|
|
|
|
id == Opt_background_compression ||
|
|
|
|
(id == Opt_compression && !c->opts.background_compression)))
|
bcachefs: rebalance_work
This adds a new btree, rebalance_work, to eliminate scanning required
for finding extents that need work done on them in the background - i.e.
for the background_target and background_compression options.
rebalance_work is a bitset btree, where a KEY_TYPE_set corresponds to an
extent in the extents or reflink btree at the same pos.
A new extent field is added, bch_extent_rebalance, which indicates that
this extent has work that needs to be done in the background - and which
options to use. This allows per-inode options to be propagated to
indirect extents - at least in some circumstances. In this patch,
changing IO options on a file will not propagate the new options to
indirect extents pointed to by that file.
Updating (setting/clearing) the rebalance_work btree is done by the
extent trigger, which looks at the bch_extent_rebalance field.
Scanning is still requrired after changing IO path options - either just
for a given inode, or for the whole filesystem. We indicate that
scanning is required by adding a KEY_TYPE_cookie key to the
rebalance_work btree: the cookie counter is so that we can detect that
scanning is still required when an option has been flipped mid-way
through an existing scan.
Future possible work:
- Propagate options to indirect extents when being changed
- Add other IO path options - nr_replicas, ec, to rebalance_work so
they can be applied in the background when they change
- Add a counter, for bcachefs fs usage output, showing the pending
amount of rebalance work: we'll probably want to do this after the
disk space accounting rewrite (moving it to a new btree)
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2023-10-20 13:33:14 -04:00
|
|
|
bch2_set_rebalance_needs_scan(c, 0);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2022-03-06 15:15:41 -05:00
|
|
|
ret = size;
|
|
|
|
err:
|
2023-02-09 12:21:45 -05:00
|
|
|
bch2_write_ref_put(c, BCH_WRITE_REF_sysfs);
|
2022-03-06 15:15:41 -05:00
|
|
|
return ret;
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
/* Defines bch2_fs_opts_dir_sysfs_ops (a const struct sysfs_ops) via SYSFS_OPS(). */
SYSFS_OPS(bch2_fs_opts_dir);
|
|
|
|
|
|
|
|
/*
 * Static attribute list for the options directory: empty apart from the NULL
 * terminator.  Option files are instead created one by one with
 * sysfs_create_file() in bch2_opts_create_sysfs_files() — presumably on the
 * opts_dir kobject; confirm at the caller.
 */
struct attribute *bch2_fs_opts_dir_files[] = { NULL };
|
|
|
|
|
|
|
|
int bch2_opts_create_sysfs_files(struct kobject *kobj)
|
|
|
|
{
|
|
|
|
const struct bch_option *i;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
for (i = bch2_opt_table;
|
|
|
|
i < bch2_opt_table + bch2_opts_nr;
|
|
|
|
i++) {
|
2021-12-14 14:24:41 -05:00
|
|
|
if (!(i->flags & OPT_FS))
|
2017-03-16 22:18:50 -08:00
|
|
|
continue;
|
|
|
|
|
|
|
|
ret = sysfs_create_file(kobj, &i->attr);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
/* time stats */
|
|
|
|
|
|
|
|
SHOW(bch2_fs_time_stats)
|
|
|
|
{
|
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, time_stats);
|
|
|
|
|
2020-07-25 17:06:11 -04:00
|
|
|
#define x(name) \
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_time_stat_##name) \
|
|
|
|
bch2_time_stats_to_text(out, &c->times[BCH_TIME_##name]);
|
2017-03-16 22:18:50 -08:00
|
|
|
BCH_TIME_STATS()
|
|
|
|
#undef x
|
|
|
|
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
STORE(bch2_fs_time_stats)
|
|
|
|
{
|
2024-08-19 15:33:38 -04:00
|
|
|
struct bch_fs *c = container_of(kobj, struct bch_fs, time_stats);
|
|
|
|
|
|
|
|
#define x(name) \
|
|
|
|
if (attr == &sysfs_time_stat_##name) \
|
|
|
|
bch2_time_stats_reset(&c->times[BCH_TIME_##name]);
|
|
|
|
BCH_TIME_STATS()
|
|
|
|
#undef x
|
2017-03-16 22:18:50 -08:00
|
|
|
return size;
|
|
|
|
}
|
|
|
|
/* Defines bch2_fs_time_stats_sysfs_ops (a const struct sysfs_ops) via SYSFS_OPS(). */
SYSFS_OPS(bch2_fs_time_stats);
|
|
|
|
|
|
|
|
struct attribute *bch2_fs_time_stats_files[] = {
|
|
|
|
#define x(name) \
|
|
|
|
&sysfs_time_stat_##name,
|
|
|
|
BCH_TIME_STATS()
|
|
|
|
#undef x
|
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
|
|
|
/*
 * Names of the two I/O directions, indexed by direction (0 = read,
 * 1 = write), followed by a NULL terminator.
 */
static const char * const bch2_rw[] = {
	[0] = "read",
	[1] = "write",
	[2] = NULL
};
|
|
|
|
|
2023-10-25 16:29:37 -04:00
|
|
|
static void dev_io_done_to_text(struct printbuf *out, struct bch_dev *ca)
|
2017-03-16 22:18:50 -08:00
|
|
|
{
|
2019-02-06 11:42:13 -05:00
|
|
|
int rw, i;
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
for (rw = 0; rw < 2; rw++) {
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_printf(out, "%s:\n", bch2_rw[rw]);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2019-02-06 11:42:13 -05:00
|
|
|
for (i = 1; i < BCH_DATA_NR; i++)
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_printf(out, "%-12s:%12llu\n",
|
2024-01-06 20:57:43 -05:00
|
|
|
bch2_data_type_str(i),
|
2019-02-06 11:42:13 -05:00
|
|
|
percpu_u64_get(&ca->io_done->sectors[rw][i]) << 9);
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
SHOW(bch2_dev)
|
|
|
|
{
|
|
|
|
struct bch_dev *ca = container_of(kobj, struct bch_dev, kobj);
|
|
|
|
struct bch_fs *c = ca->fs;
|
|
|
|
|
|
|
|
sysfs_printf(uuid, "%pU\n", ca->uuid.b);
|
|
|
|
|
|
|
|
sysfs_print(bucket_size, bucket_bytes(ca));
|
|
|
|
sysfs_print(first_bucket, ca->mi.first_bucket);
|
|
|
|
sysfs_print(nbuckets, ca->mi.nbuckets);
|
|
|
|
sysfs_print(durability, ca->mi.durability);
|
|
|
|
sysfs_print(discard, ca->mi.discard);
|
|
|
|
|
|
|
|
if (attr == &sysfs_label) {
|
2023-10-22 11:12:14 -04:00
|
|
|
if (ca->mi.group)
|
|
|
|
bch2_disk_path_to_text(out, c, ca->mi.group - 1);
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_char(out, '\n');
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (attr == &sysfs_has_data) {
|
2024-01-06 20:57:43 -05:00
|
|
|
prt_bitflags(out, __bch2_data_types, bch2_dev_has_data(c, ca));
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_char(out, '\n');
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
if (attr == &sysfs_state_rw) {
|
2023-02-03 21:01:40 -05:00
|
|
|
prt_string_option(out, bch2_member_states, ca->mi.state);
|
|
|
|
prt_char(out, '\n');
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
2023-10-25 16:29:37 -04:00
|
|
|
if (attr == &sysfs_io_done)
|
|
|
|
dev_io_done_to_text(out, ca);
|
|
|
|
|
|
|
|
if (attr == &sysfs_io_errors)
|
|
|
|
bch2_dev_io_errors_to_text(out, ca);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
sysfs_print(io_latency_read, atomic64_read(&ca->cur_latency[READ]));
|
|
|
|
sysfs_print(io_latency_write, atomic64_read(&ca->cur_latency[WRITE]));
|
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_io_latency_stats_read)
|
2024-02-01 12:41:42 -08:00
|
|
|
bch2_time_stats_to_text(out, &ca->io_latency[READ].stats);
|
2022-02-25 13:18:19 -05:00
|
|
|
|
|
|
|
if (attr == &sysfs_io_latency_stats_write)
|
2024-02-01 12:41:42 -08:00
|
|
|
bch2_time_stats_to_text(out, &ca->io_latency[WRITE].stats);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
sysfs_printf(congested, "%u%%",
|
|
|
|
clamp(atomic_read(&ca->congested), 0, CONGESTED_MAX)
|
|
|
|
* 100 / CONGESTED_MAX);
|
|
|
|
|
2022-02-25 13:18:19 -05:00
|
|
|
if (attr == &sysfs_alloc_debug)
|
2024-05-03 14:49:23 -04:00
|
|
|
bch2_dev_alloc_debug_to_text(out, ca);
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2024-08-06 21:02:34 -04:00
|
|
|
if (attr == &sysfs_open_buckets)
|
|
|
|
bch2_open_buckets_to_text(out, c, ca);
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
STORE(bch2_dev)
|
|
|
|
{
|
|
|
|
struct bch_dev *ca = container_of(kobj, struct bch_dev, kobj);
|
|
|
|
struct bch_fs *c = ca->fs;
|
|
|
|
|
|
|
|
if (attr == &sysfs_discard) {
|
|
|
|
bool v = strtoul_or_return(buf);
|
|
|
|
|
2024-07-15 19:26:46 -04:00
|
|
|
bch2_opt_set_sb(c, ca, bch2_opt_table + Opt_discard, v);
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
2022-05-25 16:11:56 +12:00
|
|
|
if (attr == &sysfs_durability) {
|
|
|
|
u64 v = strtoul_or_return(buf);
|
|
|
|
|
2024-07-15 19:54:51 -04:00
|
|
|
bch2_opt_set_sb(c, ca, bch2_opt_table + Opt_durability, v);
|
2022-05-25 16:11:56 +12:00
|
|
|
}
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
if (attr == &sysfs_label) {
|
|
|
|
char *tmp;
|
|
|
|
int ret;
|
|
|
|
|
|
|
|
tmp = kstrdup(buf, GFP_KERNEL);
|
|
|
|
if (!tmp)
|
|
|
|
return -ENOMEM;
|
|
|
|
|
|
|
|
ret = bch2_dev_group_set(c, ca, strim(tmp));
|
|
|
|
kfree(tmp);
|
|
|
|
if (ret)
|
|
|
|
return ret;
|
|
|
|
}
|
|
|
|
|
2023-10-25 16:29:37 -04:00
|
|
|
if (attr == &sysfs_io_errors_reset)
|
|
|
|
bch2_dev_errors_reset(ca);
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
return size;
|
|
|
|
}
|
|
|
|
/* Defines bch2_dev_sysfs_ops (a const struct sysfs_ops) via SYSFS_OPS(). */
SYSFS_OPS(bch2_dev);
|
|
|
|
|
|
|
|
struct attribute *bch2_dev_files[] = {
|
|
|
|
&sysfs_uuid,
|
|
|
|
&sysfs_bucket_size,
|
|
|
|
&sysfs_first_bucket,
|
|
|
|
&sysfs_nbuckets,
|
|
|
|
&sysfs_durability,
|
|
|
|
|
|
|
|
/* settings: */
|
|
|
|
&sysfs_discard,
|
|
|
|
&sysfs_state_rw,
|
|
|
|
&sysfs_label,
|
|
|
|
|
|
|
|
&sysfs_has_data,
|
2023-10-25 16:29:37 -04:00
|
|
|
&sysfs_io_done,
|
|
|
|
&sysfs_io_errors,
|
|
|
|
&sysfs_io_errors_reset,
|
2017-03-16 22:18:50 -08:00
|
|
|
|
|
|
|
&sysfs_io_latency_read,
|
|
|
|
&sysfs_io_latency_write,
|
|
|
|
&sysfs_io_latency_stats_read,
|
|
|
|
&sysfs_io_latency_stats_write,
|
|
|
|
&sysfs_congested,
|
|
|
|
|
|
|
|
/* debug: */
|
|
|
|
&sysfs_alloc_debug,
|
2024-08-06 21:02:34 -04:00
|
|
|
&sysfs_open_buckets,
|
2017-03-16 22:18:50 -08:00
|
|
|
NULL
|
|
|
|
};
|
|
|
|
|
|
|
|
#endif /* NO_BCACHEFS_SYSFS */
|