2017-03-16 22:18:50 -08:00
|
|
|
/* SPDX-License-Identifier: GPL-2.0 */
|
|
|
|
#ifndef _BCACHEFS_IO_H
|
|
|
|
#define _BCACHEFS_IO_H
|
|
|
|
|
|
|
|
#include "checksum.h"
|
2020-12-17 15:08:58 -05:00
|
|
|
#include "bkey_buf.h"
|
2017-03-16 22:18:50 -08:00
|
|
|
#include "io_types.h"
|
|
|
|
|
|
|
|
#define to_wbio(_bio) \
|
|
|
|
container_of((_bio), struct bch_write_bio, bio)
|
|
|
|
|
|
|
|
#define to_rbio(_bio) \
|
|
|
|
container_of((_bio), struct bch_read_bio, bio)
|
|
|
|
|
|
|
|
void bch2_bio_free_pages_pool(struct bch_fs *, struct bio *);
|
|
|
|
void bch2_bio_alloc_pages_pool(struct bch_fs *, struct bio *, size_t);
|
|
|
|
|
|
|
|
#ifndef CONFIG_BCACHEFS_NO_LATENCY_ACCT
|
|
|
|
void bch2_latency_acct(struct bch_dev *, u64, int);
|
|
|
|
#else
|
|
|
|
static inline void bch2_latency_acct(struct bch_dev *ca, u64 submit_time, int rw) {}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
void bch2_submit_wbio_replicas(struct bch_write_bio *, struct bch_fs *,
|
|
|
|
enum bch_data_type, const struct bkey_i *);
|
|
|
|
|
|
|
|
#define BLK_STS_REMOVED ((__force blk_status_t)128)
|
|
|
|
|
2020-07-21 13:34:22 -04:00
|
|
|
const char *bch2_blk_status_to_str(blk_status_t);
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
enum bch_write_flags {
|
2022-10-28 23:57:01 -04:00
|
|
|
__BCH_WRITE_ALLOC_NOWAIT,
|
|
|
|
__BCH_WRITE_CACHED,
|
|
|
|
__BCH_WRITE_FLUSH,
|
|
|
|
__BCH_WRITE_DATA_ENCODED,
|
|
|
|
__BCH_WRITE_PAGES_STABLE,
|
|
|
|
__BCH_WRITE_PAGES_OWNED,
|
|
|
|
__BCH_WRITE_ONLY_SPECIFIED_DEVS,
|
|
|
|
__BCH_WRITE_WROTE_DATA_INLINE,
|
|
|
|
__BCH_WRITE_FROM_INTERNAL,
|
|
|
|
__BCH_WRITE_CHECK_ENOSPC,
|
|
|
|
__BCH_WRITE_MOVE,
|
|
|
|
__BCH_WRITE_JOURNAL_SEQ_PTR,
|
|
|
|
__BCH_WRITE_SKIP_CLOSURE_PUT,
|
|
|
|
__BCH_WRITE_DONE,
|
2017-03-16 22:18:50 -08:00
|
|
|
};
|
|
|
|
|
2022-10-28 23:57:01 -04:00
|
|
|
#define BCH_WRITE_ALLOC_NOWAIT (1U << __BCH_WRITE_ALLOC_NOWAIT)
|
|
|
|
#define BCH_WRITE_CACHED (1U << __BCH_WRITE_CACHED)
|
|
|
|
#define BCH_WRITE_FLUSH (1U << __BCH_WRITE_FLUSH)
|
|
|
|
#define BCH_WRITE_DATA_ENCODED (1U << __BCH_WRITE_DATA_ENCODED)
|
|
|
|
#define BCH_WRITE_PAGES_STABLE (1U << __BCH_WRITE_PAGES_STABLE)
|
|
|
|
#define BCH_WRITE_PAGES_OWNED (1U << __BCH_WRITE_PAGES_OWNED)
|
|
|
|
#define BCH_WRITE_ONLY_SPECIFIED_DEVS (1U << __BCH_WRITE_ONLY_SPECIFIED_DEVS)
|
|
|
|
#define BCH_WRITE_WROTE_DATA_INLINE (1U << __BCH_WRITE_WROTE_DATA_INLINE)
|
|
|
|
#define BCH_WRITE_FROM_INTERNAL (1U << __BCH_WRITE_FROM_INTERNAL)
|
|
|
|
#define BCH_WRITE_CHECK_ENOSPC (1U << __BCH_WRITE_CHECK_ENOSPC)
|
|
|
|
#define BCH_WRITE_MOVE (1U << __BCH_WRITE_MOVE)
|
|
|
|
|
|
|
|
/* Internal: */
|
|
|
|
#define BCH_WRITE_JOURNAL_SEQ_PTR (1U << __BCH_WRITE_JOURNAL_SEQ_PTR)
|
|
|
|
#define BCH_WRITE_SKIP_CLOSURE_PUT (1U << __BCH_WRITE_SKIP_CLOSURE_PUT)
|
|
|
|
#define BCH_WRITE_DONE (1U << __BCH_WRITE_DONE)
|
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
static inline u64 *op_journal_seq(struct bch_write_op *op)
|
|
|
|
{
|
|
|
|
return (op->flags & BCH_WRITE_JOURNAL_SEQ_PTR)
|
|
|
|
? op->journal_seq_p : &op->journal_seq;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline void op_journal_seq_set(struct bch_write_op *op, u64 *journal_seq)
|
|
|
|
{
|
|
|
|
op->journal_seq_p = journal_seq;
|
|
|
|
op->flags |= BCH_WRITE_JOURNAL_SEQ_PTR;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline struct workqueue_struct *index_update_wq(struct bch_write_op *op)
|
|
|
|
{
|
|
|
|
return op->alloc_reserve == RESERVE_MOVINGGC
|
|
|
|
? op->c->copygc_wq
|
2021-05-22 17:37:25 -04:00
|
|
|
: op->c->btree_update_wq;
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
bcachefs: Change when we allow overwrites
Originally, we'd check for -ENOSPC when getting a disk reservation
whenever the new extent took up more space on disk than the old extent.
Erasure coding screwed this up, because with erasure coding writes are
initially replicated, and then in the background the extra replicas are
dropped when the stripe is created. This means that with erasure coding
enabled, writes will always take up more space on disk than the data
they're overwriting - but, according to posix, overwrites aren't
supposed to return ENOSPC.
So, in this patch we fudge things: if the new extent has more replicas
than the _effective_ replicas of the old extent, or if the old extent is
compressed and the new one isn't, we check for ENOSPC when getting the
disk reservation - otherwise, we don't.
Signed-off-by: Kent Overstreet <kent.overstreet@gmail.com>
Signed-off-by: Kent Overstreet <kent.overstreet@linux.dev>
2020-12-14 21:59:33 -05:00
|
|
|
int bch2_sum_sector_overwrites(struct btree_trans *, struct btree_iter *,
|
|
|
|
struct bkey_i *, bool *, bool *, s64 *, s64 *);
|
2021-03-12 20:30:39 -05:00
|
|
|
int bch2_extent_update(struct btree_trans *, subvol_inum,
|
|
|
|
struct btree_iter *, struct bkey_i *,
|
|
|
|
struct disk_reservation *, u64 *, u64, s64 *, bool);
|
|
|
|
|
2019-10-10 12:47:22 -04:00
|
|
|
int bch2_fpunch_at(struct btree_trans *, struct btree_iter *,
|
2021-03-12 20:30:39 -05:00
|
|
|
subvol_inum, u64, u64 *, s64 *);
|
|
|
|
int bch2_fpunch(struct bch_fs *c, subvol_inum, u64, u64, u64 *, s64 *);
|
2019-10-10 12:47:22 -04:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
static inline void bch2_write_op_init(struct bch_write_op *op, struct bch_fs *c,
|
|
|
|
struct bch_io_opts opts)
|
|
|
|
{
|
|
|
|
op->c = c;
|
2019-11-01 21:16:51 -04:00
|
|
|
op->end_io = NULL;
|
2017-03-16 22:18:50 -08:00
|
|
|
op->flags = 0;
|
|
|
|
op->written = 0;
|
|
|
|
op->error = 0;
|
|
|
|
op->csum_type = bch2_data_checksum_type(c, opts.data_checksum);
|
|
|
|
op->compression_type = bch2_compression_opt_to_type[opts.compression];
|
|
|
|
op->nr_replicas = 0;
|
|
|
|
op->nr_replicas_required = c->opts.data_replicas_required;
|
|
|
|
op->alloc_reserve = RESERVE_NONE;
|
2020-01-29 13:05:04 -05:00
|
|
|
op->incompressible = 0;
|
2018-10-06 04:12:42 -04:00
|
|
|
op->open_buckets.nr = 0;
|
2017-03-16 22:18:50 -08:00
|
|
|
op->devs_have.nr = 0;
|
|
|
|
op->target = 0;
|
|
|
|
op->opts = opts;
|
2021-03-12 20:30:39 -05:00
|
|
|
op->subvol = 0;
|
2017-03-16 22:18:50 -08:00
|
|
|
op->pos = POS_MAX;
|
|
|
|
op->version = ZERO_VERSION;
|
|
|
|
op->write_point = (struct write_point_specifier) { 0 };
|
|
|
|
op->res = (struct disk_reservation) { 0 };
|
|
|
|
op->journal_seq = 0;
|
2019-10-09 12:50:39 -04:00
|
|
|
op->new_i_size = U64_MAX;
|
|
|
|
op->i_sectors_delta = 0;
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
void bch2_write(struct closure *);
|
|
|
|
|
|
|
|
static inline struct bch_write_bio *wbio_init(struct bio *bio)
|
|
|
|
{
|
|
|
|
struct bch_write_bio *wbio = to_wbio(bio);
|
|
|
|
|
|
|
|
memset(&wbio->wbio, 0, sizeof(wbio->wbio));
|
|
|
|
return wbio;
|
|
|
|
}
|
|
|
|
|
|
|
|
struct bch_devs_mask;
|
|
|
|
struct cache_promote_op;
|
2018-10-02 11:03:39 -04:00
|
|
|
struct extent_ptr_decoded;
|
2017-03-16 22:18:50 -08:00
|
|
|
|
2019-08-22 16:07:37 -04:00
|
|
|
int __bch2_read_indirect_extent(struct btree_trans *, unsigned *,
|
2020-12-17 15:08:58 -05:00
|
|
|
struct bkey_buf *);
|
2019-08-22 16:07:37 -04:00
|
|
|
|
|
|
|
static inline int bch2_read_indirect_extent(struct btree_trans *trans,
|
2021-03-14 21:30:08 -04:00
|
|
|
enum btree_id *data_btree,
|
2019-08-22 16:07:37 -04:00
|
|
|
unsigned *offset_into_extent,
|
2020-12-17 15:08:58 -05:00
|
|
|
struct bkey_buf *k)
|
2019-08-22 16:07:37 -04:00
|
|
|
{
|
2021-03-14 21:30:08 -04:00
|
|
|
if (k->k->k.type != KEY_TYPE_reflink_p)
|
|
|
|
return 0;
|
|
|
|
|
|
|
|
*data_btree = BTREE_ID_reflink;
|
|
|
|
return __bch2_read_indirect_extent(trans, offset_into_extent, k);
|
2019-08-22 16:07:37 -04:00
|
|
|
}
|
2019-08-16 09:59:56 -04:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
enum bch_read_flags {
|
|
|
|
BCH_READ_RETRY_IF_STALE = 1 << 0,
|
|
|
|
BCH_READ_MAY_PROMOTE = 1 << 1,
|
|
|
|
BCH_READ_USER_MAPPED = 1 << 2,
|
|
|
|
BCH_READ_NODECODE = 1 << 3,
|
|
|
|
BCH_READ_LAST_FRAGMENT = 1 << 4,
|
|
|
|
|
|
|
|
/* internal: */
|
|
|
|
BCH_READ_MUST_BOUNCE = 1 << 5,
|
|
|
|
BCH_READ_MUST_CLONE = 1 << 6,
|
|
|
|
BCH_READ_IN_RETRY = 1 << 7,
|
|
|
|
};
|
|
|
|
|
2020-10-16 21:39:16 -04:00
|
|
|
int __bch2_read_extent(struct btree_trans *, struct bch_read_bio *,
|
2021-03-14 21:30:08 -04:00
|
|
|
struct bvec_iter, struct bpos, enum btree_id,
|
|
|
|
struct bkey_s_c, unsigned,
|
2019-07-09 12:56:43 -04:00
|
|
|
struct bch_io_failures *, unsigned);
|
|
|
|
|
2020-10-16 21:39:16 -04:00
|
|
|
static inline void bch2_read_extent(struct btree_trans *trans,
|
2021-03-14 21:30:08 -04:00
|
|
|
struct bch_read_bio *rbio, struct bpos read_pos,
|
|
|
|
enum btree_id data_btree, struct bkey_s_c k,
|
|
|
|
unsigned offset_into_extent, unsigned flags)
|
2017-03-16 22:18:50 -08:00
|
|
|
{
|
2021-03-14 21:30:08 -04:00
|
|
|
__bch2_read_extent(trans, rbio, rbio->bio.bi_iter, read_pos,
|
|
|
|
data_btree, k, offset_into_extent, NULL, flags);
|
2017-03-16 22:18:50 -08:00
|
|
|
}
|
|
|
|
|
2021-03-12 20:29:28 -05:00
|
|
|
void __bch2_read(struct bch_fs *, struct bch_read_bio *, struct bvec_iter,
|
2021-03-12 20:30:39 -05:00
|
|
|
subvol_inum, struct bch_io_failures *, unsigned flags);
|
2021-03-12 20:29:28 -05:00
|
|
|
|
|
|
|
static inline void bch2_read(struct bch_fs *c, struct bch_read_bio *rbio,
|
2021-03-12 20:30:39 -05:00
|
|
|
subvol_inum inum)
|
2021-03-12 20:29:28 -05:00
|
|
|
{
|
|
|
|
struct bch_io_failures failed = { .nr = 0 };
|
|
|
|
|
|
|
|
BUG_ON(rbio->_state);
|
|
|
|
|
|
|
|
rbio->c = c;
|
|
|
|
rbio->start_time = local_clock();
|
2021-03-12 20:30:39 -05:00
|
|
|
rbio->subvol = inum.subvol;
|
2021-03-12 20:29:28 -05:00
|
|
|
|
2021-03-12 20:30:39 -05:00
|
|
|
__bch2_read(c, rbio, rbio->bio.bi_iter, inum, &failed,
|
2021-03-12 20:29:28 -05:00
|
|
|
BCH_READ_RETRY_IF_STALE|
|
|
|
|
BCH_READ_MAY_PROMOTE|
|
|
|
|
BCH_READ_USER_MAPPED);
|
|
|
|
}
|
2019-07-09 12:56:43 -04:00
|
|
|
|
2017-03-16 22:18:50 -08:00
|
|
|
static inline struct bch_read_bio *rbio_init(struct bio *bio,
|
|
|
|
struct bch_io_opts opts)
|
|
|
|
{
|
|
|
|
struct bch_read_bio *rbio = to_rbio(bio);
|
|
|
|
|
|
|
|
rbio->_state = 0;
|
|
|
|
rbio->promote = NULL;
|
|
|
|
rbio->opts = opts;
|
|
|
|
return rbio;
|
|
|
|
}
|
|
|
|
|
|
|
|
void bch2_fs_io_exit(struct bch_fs *);
|
|
|
|
int bch2_fs_io_init(struct bch_fs *);
|
|
|
|
|
|
|
|
#endif /* _BCACHEFS_IO_H */
|