Update bcachefs sources to 2e8463c770 bcachefs: Rework lru btree

This commit is contained in:
Kent Overstreet 2022-12-19 18:31:44 -05:00
parent b6fca67693
commit 177f05106c
7 changed files with 90 additions and 129 deletions

View File

@ -1 +1 @@
c801fa69f0e35d0e203af95fc59240f96a04d107 2e8463c770e9f1e2269e0fc9f64d044424758f4f

View File

@ -915,8 +915,9 @@ int bch2_trans_mark_alloc(struct btree_trans *trans,
new_lru = alloc_lru_idx(*new_a); new_lru = alloc_lru_idx(*new_a);
if (old_lru != new_lru) { if (old_lru != new_lru) {
ret = bch2_lru_change(trans, new->k.p.inode, new->k.p.offset, ret = bch2_lru_change(trans, new->k.p.inode,
old_lru, &new_lru, old); bucket_to_u64(new->k.p),
old_lru, new_lru);
if (ret) if (ret)
return ret; return ret;
@ -1540,7 +1541,7 @@ static int bch2_check_alloc_to_lru_ref(struct btree_trans *trans,
" %s", " %s",
(printbuf_reset(&buf), (printbuf_reset(&buf),
bch2_bkey_val_to_text(&buf, c, alloc_k), buf.buf)) || bch2_bkey_val_to_text(&buf, c, alloc_k), buf.buf)) ||
fsck_err_on(k.k->type != KEY_TYPE_lru || fsck_err_on(k.k->type != KEY_TYPE_set ||
le64_to_cpu(bkey_s_c_to_lru(k).v->idx) != alloc_k.k->p.offset, c, le64_to_cpu(bkey_s_c_to_lru(k).v->idx) != alloc_k.k->p.offset, c,
"incorrect/missing lru entry\n" "incorrect/missing lru entry\n"
" %s\n" " %s\n"
@ -1553,8 +1554,8 @@ static int bch2_check_alloc_to_lru_ref(struct btree_trans *trans,
ret = bch2_lru_set(trans, ret = bch2_lru_set(trans,
alloc_k.k->p.inode, alloc_k.k->p.inode,
alloc_k.k->p.offset, bucket_to_u64(alloc_k.k->p),
&read_time); read_time);
if (ret) if (ret)
goto err; goto err;
@ -1762,51 +1763,34 @@ void bch2_do_discards(struct bch_fs *c)
} }
static int invalidate_one_bucket(struct btree_trans *trans, static int invalidate_one_bucket(struct btree_trans *trans,
struct btree_iter *lru_iter, struct bkey_s_c k, struct btree_iter *lru_iter,
unsigned dev_idx, s64 *nr_to_invalidate) struct bpos bucket,
s64 *nr_to_invalidate)
{ {
struct bch_fs *c = trans->c; struct bch_fs *c = trans->c;
struct btree_iter alloc_iter = { NULL }; struct btree_iter alloc_iter = { NULL };
struct bkey_i_alloc_v4 *a; struct bkey_i_alloc_v4 *a;
struct bpos bucket;
struct printbuf buf = PRINTBUF; struct printbuf buf = PRINTBUF;
unsigned cached_sectors; unsigned cached_sectors;
int ret = 0; int ret = 0;
if (*nr_to_invalidate <= 0 || k.k->p.inode != dev_idx) if (*nr_to_invalidate <= 0)
return 1; return 1;
if (k.k->type != KEY_TYPE_lru) {
prt_printf(&buf, "non lru key in lru btree:\n ");
bch2_bkey_val_to_text(&buf, c, k);
if (!test_bit(BCH_FS_CHECK_LRUS_DONE, &c->flags)) {
bch_err(c, "%s", buf.buf);
} else {
bch2_trans_inconsistent(trans, "%s", buf.buf);
ret = -EINVAL;
}
goto out;
}
bucket = POS(dev_idx, le64_to_cpu(bkey_s_c_to_lru(k).v->idx));
a = bch2_trans_start_alloc_update(trans, &alloc_iter, bucket); a = bch2_trans_start_alloc_update(trans, &alloc_iter, bucket);
ret = PTR_ERR_OR_ZERO(a); ret = PTR_ERR_OR_ZERO(a);
if (ret) if (ret)
goto out; goto out;
if (k.k->p.offset != alloc_lru_idx(a->v)) { if (lru_pos_time(lru_iter->pos) != alloc_lru_idx(a->v)) {
prt_printf(&buf, "alloc key does not point back to lru entry when invalidating bucket:\n "); prt_printf(&buf, "alloc key does not point back to lru entry when invalidating bucket:\n ");
bch2_bkey_val_to_text(&buf, c, bkey_i_to_s_c(&a->k_i)); bch2_bpos_to_text(&buf, lru_iter->pos);
prt_printf(&buf, "\n "); prt_printf(&buf, "\n ");
bch2_bkey_val_to_text(&buf, c, k); bch2_bkey_val_to_text(&buf, c, bkey_i_to_s_c(&a->k_i));
if (!test_bit(BCH_FS_CHECK_LRUS_DONE, &c->flags)) { bch_err(c, "%s", buf.buf);
bch_err(c, "%s", buf.buf); if (test_bit(BCH_FS_CHECK_LRUS_DONE, &c->flags)) {
} else { bch2_inconsistent_error(c);
bch2_trans_inconsistent(trans, "%s", buf.buf);
ret = -EINVAL; ret = -EINVAL;
} }
@ -1857,9 +1841,13 @@ static void bch2_do_invalidates_work(struct work_struct *work)
s64 nr_to_invalidate = s64 nr_to_invalidate =
should_invalidate_buckets(ca, bch2_dev_usage_read(ca)); should_invalidate_buckets(ca, bch2_dev_usage_read(ca));
ret = for_each_btree_key2(&trans, iter, BTREE_ID_lru, ret = for_each_btree_key2_upto(&trans, iter, BTREE_ID_lru,
POS(ca->dev_idx, 0), BTREE_ITER_INTENT, k, lru_pos(ca->dev_idx, 0, 0),
invalidate_one_bucket(&trans, &iter, k, ca->dev_idx, &nr_to_invalidate)); lru_pos(ca->dev_idx, U64_MAX, LRU_TIME_MAX),
BTREE_ITER_INTENT, k,
invalidate_one_bucket(&trans, &iter,
u64_to_bucket(k.k->p.offset),
&nr_to_invalidate));
if (ret < 0) { if (ret < 0) {
percpu_ref_put(&ca->ref); percpu_ref_put(&ca->ref);

View File

@ -1557,7 +1557,8 @@ struct bch_sb_field_journal_seq_blacklist {
x(backpointers, 22) \ x(backpointers, 22) \
x(inode_v3, 23) \ x(inode_v3, 23) \
x(unwritten_extents, 24) \ x(unwritten_extents, 24) \
x(bucket_gens, 25) x(bucket_gens, 25) \
x(lru_v2, 26)
enum bcachefs_metadata_version { enum bcachefs_metadata_version {
bcachefs_metadata_version_min = 9, bcachefs_metadata_version_min = 9,

View File

@ -186,7 +186,7 @@ static unsigned bch2_key_types_allowed[] = {
(1U << KEY_TYPE_snapshot), (1U << KEY_TYPE_snapshot),
[BKEY_TYPE_lru] = [BKEY_TYPE_lru] =
(1U << KEY_TYPE_deleted)| (1U << KEY_TYPE_deleted)|
(1U << KEY_TYPE_lru), (1U << KEY_TYPE_set),
[BKEY_TYPE_freespace] = [BKEY_TYPE_freespace] =
(1U << KEY_TYPE_deleted)| (1U << KEY_TYPE_deleted)|
(1U << KEY_TYPE_set), (1U << KEY_TYPE_set),

View File

@ -8,6 +8,7 @@
#include "lru.h" #include "lru.h"
#include "recovery.h" #include "recovery.h"
/* KEY_TYPE_lru is obsolete: */
int bch2_lru_invalid(const struct bch_fs *c, struct bkey_s_c k, int bch2_lru_invalid(const struct bch_fs *c, struct bkey_s_c k,
int rw, struct printbuf *err) int rw, struct printbuf *err)
{ {
@ -30,101 +31,57 @@ void bch2_lru_to_text(struct printbuf *out, struct bch_fs *c,
prt_printf(out, "idx %llu", le64_to_cpu(lru->idx)); prt_printf(out, "idx %llu", le64_to_cpu(lru->idx));
} }
int bch2_lru_delete(struct btree_trans *trans, u64 id, u64 idx, u64 time, static int __bch2_lru_set(struct btree_trans *trans, u16 lru_id,
struct bkey_s_c orig_k) u64 dev_bucket, u64 time, unsigned key_type)
{ {
struct btree_iter iter; struct btree_iter iter;
struct bkey_s_c k; struct bkey_i *k;
u64 existing_idx;
struct printbuf buf = PRINTBUF;
int ret = 0; int ret = 0;
if (!time) if (!time)
return 0; return 0;
k = bch2_trans_kmalloc_nomemzero(trans, sizeof(*k));
ret = PTR_ERR_OR_ZERO(k);
if (unlikely(ret))
return ret;
bkey_init(&k->k);
k->k.type = key_type;
k->k.p = lru_pos(lru_id, dev_bucket, time);
EBUG_ON(lru_pos_id(k->k.p) != lru_id);
EBUG_ON(lru_pos_time(k->k.p) != time);
EBUG_ON(k->k.p.offset != dev_bucket);
bch2_trans_iter_init(trans, &iter, BTREE_ID_lru, bch2_trans_iter_init(trans, &iter, BTREE_ID_lru,
POS(id, time), k->k.p, BTREE_ITER_INTENT);
BTREE_ITER_INTENT|
BTREE_ITER_WITH_UPDATES);
k = bch2_btree_iter_peek_slot(&iter);
ret = bkey_err(k);
if (ret)
goto err;
if (k.k->type != KEY_TYPE_lru) { ret = bch2_btree_iter_traverse(&iter) ?:
bch2_bkey_val_to_text(&buf, trans->c, orig_k); bch2_btree_delete_at(trans, &iter, 0);
bch2_trans_inconsistent(trans,
"pointer to nonexistent lru %llu:%llu\n%s",
id, time, buf.buf);
ret = -EIO;
goto err;
}
existing_idx = le64_to_cpu(bkey_s_c_to_lru(k).v->idx);
if (existing_idx != idx) {
bch2_bkey_val_to_text(&buf, trans->c, orig_k);
bch2_trans_inconsistent(trans,
"lru %llu:%llu with wrong backpointer: got %llu, should be %llu\n%s",
id, time, existing_idx, idx, buf.buf);
ret = -EIO;
goto err;
}
ret = bch2_btree_delete_at(trans, &iter, 0);
err:
bch2_trans_iter_exit(trans, &iter);
printbuf_exit(&buf);
return ret;
}
int bch2_lru_set(struct btree_trans *trans, u64 lru_id, u64 idx, u64 *time)
{
struct btree_iter iter;
struct bkey_s_c k;
struct bkey_i_lru *lru;
int ret = 0;
if (!*time)
return 0;
for_each_btree_key_norestart(trans, iter, BTREE_ID_lru,
POS(lru_id, *time),
BTREE_ITER_SLOTS|
BTREE_ITER_INTENT|
BTREE_ITER_WITH_UPDATES, k, ret)
if (bkey_deleted(k.k))
break;
if (ret)
goto err;
BUG_ON(iter.pos.inode != lru_id);
*time = iter.pos.offset;
lru = bch2_bkey_alloc(trans, &iter, lru);
ret = PTR_ERR_OR_ZERO(lru);
if (ret)
goto err;
lru->v.idx = cpu_to_le64(idx);
ret = bch2_trans_update(trans, &iter, &lru->k_i, 0);
if (ret)
goto err;
err:
bch2_trans_iter_exit(trans, &iter); bch2_trans_iter_exit(trans, &iter);
return ret; return ret;
} }
int bch2_lru_change(struct btree_trans *trans, u64 id, u64 idx, int bch2_lru_del(struct btree_trans *trans, u16 lru_id, u64 dev_bucket, u64 time)
u64 old_time, u64 *new_time,
struct bkey_s_c k)
{ {
if (old_time == *new_time) return __bch2_lru_set(trans, lru_id, dev_bucket, time, KEY_TYPE_deleted);
}
int bch2_lru_set(struct btree_trans *trans, u16 lru_id, u64 dev_bucket, u64 time)
{
return __bch2_lru_set(trans, lru_id, dev_bucket, time, KEY_TYPE_set);
}
int bch2_lru_change(struct btree_trans *trans,
u16 lru_id, u64 dev_bucket,
u64 old_time, u64 new_time)
{
if (old_time == new_time)
return 0; return 0;
return bch2_lru_delete(trans, id, idx, old_time, k) ?: return bch2_lru_del(trans, lru_id, dev_bucket, old_time) ?:
bch2_lru_set(trans, id, idx, new_time); bch2_lru_set(trans, lru_id, dev_bucket, new_time);
} }
static int bch2_check_lru_key(struct btree_trans *trans, static int bch2_check_lru_key(struct btree_trans *trans,
@ -138,12 +95,9 @@ static int bch2_check_lru_key(struct btree_trans *trans,
const struct bch_alloc_v4 *a; const struct bch_alloc_v4 *a;
struct printbuf buf1 = PRINTBUF; struct printbuf buf1 = PRINTBUF;
struct printbuf buf2 = PRINTBUF; struct printbuf buf2 = PRINTBUF;
struct bpos alloc_pos; struct bpos alloc_pos = u64_to_bucket(lru_k.k->p.offset);
int ret; int ret;
alloc_pos = POS(lru_k.k->p.inode,
le64_to_cpu(bkey_s_c_to_lru(lru_k).v->idx));
if (fsck_err_on(!bch2_dev_bucket_exists(c, alloc_pos), c, if (fsck_err_on(!bch2_dev_bucket_exists(c, alloc_pos), c,
"lru key points to nonexistent device:bucket %llu:%llu", "lru key points to nonexistent device:bucket %llu:%llu",
alloc_pos.inode, alloc_pos.offset)) alloc_pos.inode, alloc_pos.offset))
@ -157,7 +111,8 @@ static int bch2_check_lru_key(struct btree_trans *trans,
a = bch2_alloc_to_v4(k, &a_convert); a = bch2_alloc_to_v4(k, &a_convert);
if (fsck_err_on(a->data_type != BCH_DATA_cached || if (fsck_err_on(k.k->type != KEY_TYPE_set ||
a->data_type != BCH_DATA_cached ||
a->io_time[READ] != lru_k.k->p.offset, c, a->io_time[READ] != lru_k.k->p.offset, c,
"incorrect lru entry %s\n" "incorrect lru entry %s\n"
" for %s", " for %s",

View File

@ -2,6 +2,26 @@
#ifndef _BCACHEFS_LRU_H #ifndef _BCACHEFS_LRU_H
#define _BCACHEFS_LRU_H #define _BCACHEFS_LRU_H
/*
 * Layout of the inode field of an lru btree position (see lru_pos()):
 * the low LRU_TIME_BITS bits hold the time, the bits above hold the lru id.
 * LRU_TIME_MAX is the largest time value that fits in that low field.
 */
#define LRU_TIME_BITS	48
#define LRU_TIME_MAX	(~(~0ULL << LRU_TIME_BITS))
/*
 * Build the btree position for an lru entry.
 *
 * The inode field packs @lru_id into the bits above LRU_TIME_BITS and @time
 * into the low LRU_TIME_BITS bits; @dev_bucket becomes the offset field.
 *
 * @time must not exceed LRU_TIME_MAX; this is checked with EBUG_ON()
 * (presumably a debug-build-only assertion - confirm against its definition).
 */
static inline struct bpos lru_pos(u16 lru_id, u64 dev_bucket, u64 time)
{
	u64 packed_inode;

	EBUG_ON(time > LRU_TIME_MAX);

	/* Widen before shifting so the 16-bit id lands above the time field. */
	packed_inode = (u64) lru_id << LRU_TIME_BITS;
	packed_inode |= time;

	return POS(packed_inode, dev_bucket);
}
/*
 * Extract the lru id from an lru btree position: the bits of the inode
 * field that sit above the LRU_TIME_BITS-wide time field.
 */
static inline u64 lru_pos_id(struct bpos pos)
{
	u64 id = pos.inode;

	id >>= LRU_TIME_BITS;
	return id;
}
/*
 * Extract the time from an lru btree position: the low LRU_TIME_BITS bits
 * of the inode field.
 */
static inline u64 lru_pos_time(struct bpos pos)
{
	/* All-ones in the low LRU_TIME_BITS bits, zero above. */
	const u64 time_mask = ~(~0ULL << LRU_TIME_BITS);

	return pos.inode & time_mask;
}
int bch2_lru_invalid(const struct bch_fs *, struct bkey_s_c, int, struct printbuf *); int bch2_lru_invalid(const struct bch_fs *, struct bkey_s_c, int, struct printbuf *);
void bch2_lru_to_text(struct printbuf *, struct bch_fs *, struct bkey_s_c); void bch2_lru_to_text(struct printbuf *, struct bch_fs *, struct bkey_s_c);
@ -10,9 +30,9 @@ void bch2_lru_to_text(struct printbuf *, struct bch_fs *, struct bkey_s_c);
.val_to_text = bch2_lru_to_text, \ .val_to_text = bch2_lru_to_text, \
}) })
int bch2_lru_delete(struct btree_trans *, u64, u64, u64, struct bkey_s_c); int bch2_lru_del(struct btree_trans *, u16, u64, u64);
int bch2_lru_set(struct btree_trans *, u64, u64, u64 *); int bch2_lru_set(struct btree_trans *, u16, u64, u64);
int bch2_lru_change(struct btree_trans *, u64, u64, u64, u64 *, struct bkey_s_c); int bch2_lru_change(struct btree_trans *, u16, u64, u64, u64);
int bch2_check_lrus(struct bch_fs *); int bch2_check_lrus(struct bch_fs *);

View File

@ -1094,14 +1094,11 @@ int bch2_fs_recovery(struct bch_fs *c)
} }
if (!c->opts.nochanges) { if (!c->opts.nochanges) {
if (c->sb.version < bcachefs_metadata_version_backpointers) { if (c->sb.version < bcachefs_metadata_version_lru_v2) {
bch_info(c, "version prior to backpointers, upgrade and fsck required"); bch_info(c, "version prior to backpointers, upgrade and fsck required");
c->opts.version_upgrade = true; c->opts.version_upgrade = true;
c->opts.fsck = true; c->opts.fsck = true;
c->opts.fix_errors = FSCK_OPT_YES; c->opts.fix_errors = FSCK_OPT_YES;
} else if (c->sb.version < bcachefs_metadata_version_inode_v3) {
bch_info(c, "version prior to inode_v3, upgrade required");
c->opts.version_upgrade = true;
} }
} }