1 /* SPDX-License-Identifier: GPL-2.0 */
2 #ifndef _BCACHEFS_BTREE_IO_H
3 #define _BCACHEFS_BTREE_IO_H
5 #include "bkey_methods.h"
7 #include "btree_locking.h"
16 struct btree_node_read_all;
/* Report whether the BTREE_NODE_dirty bit is currently set in @b->flags. */
18 static inline bool btree_node_dirty(struct btree *b)
20 return test_bit(BTREE_NODE_dirty, &b->flags);
/*
 * Set BTREE_NODE_dirty in @b->flags.
 *
 * The c->btree_cache.dirty counter is incremented only when the bit was
 * previously clear, so marking an already-dirty node does not count it twice.
 */
23 static inline void set_btree_node_dirty(struct bch_fs *c, struct btree *b)
25 if (!test_and_set_bit(BTREE_NODE_dirty, &b->flags))
26 atomic_inc(&c->btree_cache.dirty);
/*
 * Clear BTREE_NODE_dirty in @b->flags.
 *
 * The c->btree_cache.dirty counter is decremented only when the bit was
 * actually set beforehand, mirroring set_btree_node_dirty().
 */
29 static inline void clear_btree_node_dirty(struct bch_fs *c, struct btree *b)
31 if (test_and_clear_bit(BTREE_NODE_dirty, &b->flags))
32 atomic_dec(&c->btree_cache.dirty);
/*
 * Per-read state for a btree node read.
 *
 * NOTE(review): only the members visible in this view are annotated; the
 * struct may declare further members.
 */
35 struct btree_read_bio {
/* Pointer to a struct btree_node_read_all; presumably set for multi-replica reads - confirm. */
38 struct btree_node_read_all *ra;
/* Single-bit flag; presumably records that a device I/O reference is held - confirm. */
40 unsigned have_ioref:1;
/* Decoded extent pointer; presumably the replica chosen for this read - confirm. */
42 struct extent_ptr_decoded pick;
/* Work item embedded in the bio state. */
43 struct work_struct work;
/*
 * Per-write state for a btree node write.
 *
 * NOTE(review): only the members visible in this view are annotated; the
 * struct may declare further members.
 */
47 struct btree_write_bio {
/* Work item embedded in the bio state. */
48 struct work_struct work;
/* Padded key storage sized for BKEY_BTREE_PTR_VAL_U64s_MAX value u64s. */
49 __BKEY_PADDED(key, BKEY_BTREE_PTR_VAL_U64s_MAX);
/* Embedded write bio. */
52 struct bch_write_bio wbio;
/*
 * Release the write-in-flight bit on @b and wake anyone waiting on it.
 *
 * Counterpart of btree_node_io_lock(): the caller is expected to own the
 * write_in_flight bit on entry.
 */
55 static inline void btree_node_io_unlock(struct btree *b)
/* Debug assertion: unlocking a node that is not marked in flight is a bug. */
57 EBUG_ON(!btree_node_write_in_flight(b));
58 clear_btree_node_write_in_flight(b);
/* Wake waiters sleeping in wait_on_bit_io()/wait_on_bit_lock_io() on this bit. */
59 wake_up_bit(&b->flags, BTREE_NODE_write_in_flight);
/*
 * Acquire the BTREE_NODE_write_in_flight bit of @b->flags as a bit lock,
 * sleeping uninterruptibly (accounted as I/O wait) until it can be taken.
 */
62 static inline void btree_node_io_lock(struct btree *b)
64 wait_on_bit_lock_io(&b->flags, BTREE_NODE_write_in_flight,
65 TASK_UNINTERRUPTIBLE);
/*
 * Sleep uninterruptibly (accounted as I/O wait) until the
 * BTREE_NODE_write_in_flight bit of @b->flags is clear. Unlike
 * btree_node_io_lock(), this does not take the bit.
 */
68 static inline void btree_node_wait_on_io(struct btree *b)
70 wait_on_bit_io(&b->flags, BTREE_NODE_write_in_flight,
71 TASK_UNINTERRUPTIBLE);
/*
 * Return true when @b is currently allowed to be written:
 *  - its write_blocked list is empty, and
 *  - either nothing has been written to it yet (b->written == 0) or
 *    b->will_make_reachable is unset.
 */
74 static inline bool btree_node_may_write(struct btree *b)
76 return list_empty_careful(&b->write_blocked) &&
77 (!b->written || !b->will_make_reachable);
/*
 * Declaration only; the definition is outside this header. The remaining
 * parameter list continues past this line. Within this header the function is
 * called with COMPACT_LAZY as its third argument.
 */
85 bool bch2_compact_whiteouts(struct bch_fs *, struct btree *,
/*
 * Heuristic for lazy compaction of one bset (referred to as t in the body;
 * its parameter declaration is on a continuation line).
 *
 * Returns true when the bset has more than 64 dead u64s and the dead u64s
 * make up more than a third of the bset's total u64s.
 */
88 static inline bool should_compact_bset_lazy(struct btree *b,
91 unsigned total_u64s = bset_u64s(t);
92 unsigned dead_u64s = bset_dead_u64s(b, t);
/* dead * 3 > total  <=>  dead fraction exceeds one third. */
94 return dead_u64s > 64 && dead_u64s * 3 > total_u64s;
/*
 * Run a COMPACT_LAZY whiteout compaction on @b if a bset of the node passes
 * should_compact_bset_lazy(); in that case the result of
 * bch2_compact_whiteouts() is returned.
 *
 * NOTE(review): how t is iterated and the value returned when no bset
 * qualifies are not visible in this view.
 */
97 static inline bool bch2_maybe_compact_whiteouts(struct bch_fs *c, struct btree *b)
102 if (should_compact_bset_lazy(b, t))
103 return bch2_compact_whiteouts(c, b, COMPACT_LAZY);
/*
 * Build the nonce used for a bset at the given offset.
 *
 * The four 32-bit words of the nonce are:
 *   [0] @offset, converted to little-endian
 *   [1] first 32-bit word of i->seq
 *   [2] second 32-bit word of i->seq
 *   [3] first 32-bit word of i->journal_seq, XORed with BCH_NONCE_BTREE
 */
108 static inline struct nonce btree_nonce(struct bset *i, unsigned offset)
110 return (struct nonce) {{
111 [0] = cpu_to_le32(offset),
112 [1] = ((__le32 *) &i->seq)[0],
113 [2] = ((__le32 *) &i->seq)[1],
114 [3] = ((__le32 *) &i->journal_seq)[0]^BCH_NONCE_BTREE,
/*
 * Encrypt a bset in place using the nonce derived from btree_nonce(i, offset)
 * and the checksum type recorded in the bset (BSET_CSUM_TYPE(i)).
 *
 * Two regions are passed to bch2_encrypt():
 *  1. a btree_node header region starting at bn->flags, where bn is the
 *     struct btree_node containing @i as its keys member; afterwards the
 *     nonce is advanced by that region's size rounded up to CHACHA_BLOCK_SIZE;
 *  2. the bset payload, from i->_data up to vstruct_end(i).
 *
 * NOTE(review): the condition guarding step 1 and the length argument of the
 * first bch2_encrypt() call are not visible in this view - presumably step 1
 * applies only to the first bset of a node; confirm against the full source.
 */
118 static inline void bset_encrypt(struct bch_fs *c, struct bset *i, unsigned offset)
120 struct nonce nonce = btree_nonce(i, offset);
123 struct btree_node *bn = container_of(i, struct btree_node, keys);
/* Byte distance from the flags member to the keys member of the node header. */
124 unsigned bytes = (void *) &bn->keys - (void *) &bn->flags;
126 bch2_encrypt(c, BSET_CSUM_TYPE(i), nonce, &bn->flags,
/* Skip the nonce past the header region, in whole CHACHA_BLOCK_SIZE units. */
129 nonce = nonce_add(nonce, round_up(bytes, CHACHA_BLOCK_SIZE));
132 bch2_encrypt(c, BSET_CSUM_TYPE(i), nonce, i->_data,
133 vstruct_end(i) - (void *) i->_data);
/*
 * Declarations only; the definitions are outside this header. The group
 * comments below are inferred from the function names.
 */
136 void bch2_btree_sort_into(struct bch_fs *, struct btree *, struct btree *);
138 void bch2_btree_node_drop_keys_outside_node(struct btree *);
140 void bch2_btree_build_aux_trees(struct btree *);
141 void bch2_btree_init_next(struct bch_fs *, struct btree *,
142 struct btree_iter *);
/* Read-side entry points (by name). */
144 int bch2_btree_node_read_done(struct bch_fs *, struct bch_dev *,
145 struct btree *, bool);
146 void bch2_btree_node_read(struct bch_fs *, struct btree *, bool);
147 int bch2_btree_root_read(struct bch_fs *, enum btree_id,
148 const struct bkey_i *, unsigned);
/* Write-side entry points (by name). */
150 void bch2_btree_complete_write(struct bch_fs *, struct btree *,
151 struct btree_write *);
152 void bch2_btree_write_error_work(struct work_struct *);
154 void __bch2_btree_node_write(struct bch_fs *, struct btree *);
155 bool bch2_btree_post_write_cleanup(struct bch_fs *, struct btree *);
/* Parameter list continues past this line; callers here pass a six_lock_type third. */
157 void bch2_btree_node_write(struct bch_fs *, struct btree *,
/*
 * Write out @b if it is flagged as needing a write and is allowed to be
 * written (btree_node_need_write() && btree_node_may_write()).
 *
 * @lock_held names the six lock type the caller holds on b->c.lock. If no
 * write is in flight, bch2_btree_node_write() is issued with that lock type.
 * Otherwise the lock is dropped, the in-flight I/O is waited for, and the
 * lock is retaken with the same type.
 *
 * NOTE(review): the start of the condition and the statements that end each
 * branch are not visible in this view - presumably this is a retry loop;
 * confirm against the full source.
 */
160 static inline void btree_node_write_if_need(struct bch_fs *c, struct btree *b,
161 enum six_lock_type lock_held)
164 btree_node_need_write(b) &&
165 btree_node_may_write(b)) {
166 if (!btree_node_write_in_flight(b)) {
167 bch2_btree_node_write(c, b, lock_held);
/* A write is already in flight: drop the lock so we do not hold it while sleeping. */
171 six_unlock_type(&b->c.lock, lock_held);
172 btree_node_wait_on_io(b);
173 btree_node_lock_type(c, b, lock_held);
/*
 * bch2_btree_node_write_cond(_c, _b, cond)
 *
 * Flag _b as needing a write and then call
 * btree_node_write_if_need(_c, _b, SIX_LOCK_read).
 *
 * (_b)->flags is sampled with READ_ONCE() and updated through a cmpxchg()
 * retry loop that ORs in the BTREE_NODE_need_write bit. On each pass the
 * macro tests whether the BTREE_NODE_dirty bit is clear or cond is false;
 * the action taken in that case is not visible in this view (presumably the
 * flag update is skipped - confirm).
 *
 * cond is evaluated inside the retry loop, so it may run more than once and
 * should be free of side effects.
 */
177 #define bch2_btree_node_write_cond(_c, _b, cond) \
179 unsigned long old, new, v = READ_ONCE((_b)->flags); \
184 if (!(old & (1 << BTREE_NODE_dirty)) || !(cond)) \
187 new |= (1 << BTREE_NODE_need_write); \
188 } while ((v = cmpxchg(&(_b)->flags, old, new)) != old); \
190 btree_node_write_if_need(_c, _b, SIX_LOCK_read); \
/*
 * Declarations only; the definitions are outside this header. By name, these
 * flush outstanding btree reads and writes for a filesystem and print the
 * dirty btree nodes into a printbuf - confirm against the definitions.
 */
193 void bch2_btree_flush_all_reads(struct bch_fs *);
194 void bch2_btree_flush_all_writes(struct bch_fs *);
195 void bch2_dirty_btree_nodes_to_text(struct printbuf *, struct bch_fs *);
/*
 * Adjust a bkey_format for metadata written by older on-disk versions.
 *
 * @level, @btree_id: which btree and node level the format belongs to
 * @version:          metadata version of the data being converted
 * @big_endian:       not referenced in the lines visible here
 * @write:            non-zero selects the first arm of the snapshot
 *                    field_offset ternary (that arm is not visible here)
 * @f:                format to modify in place
 */
197 static inline void compat_bformat(unsigned level, enum btree_id btree_id,
198 unsigned version, unsigned big_endian,
199 int write, struct bkey_format *f)
/* Before inode_btree_change, the inodes btree had INODE and OFFSET fields swapped. */
201 if (version < bcachefs_metadata_version_inode_btree_change &&
202 btree_id == BTREE_ID_inodes) {
203 swap(f->bits_per_field[BKEY_FIELD_INODE],
204 f->bits_per_field[BKEY_FIELD_OFFSET]);
205 swap(f->field_offset[BKEY_FIELD_INODE],
206 f->field_offset[BKEY_FIELD_OFFSET]);
/* Pre-snapshot versions: applies to interior nodes and to btrees that have snapshots. */
209 if (version < bcachefs_metadata_version_snapshot &&
210 (level || btree_type_has_snapshots(btree_id))) {
/* Mask with the low bits_per_field[SNAPSHOT] bits set, i.e. the largest packed value. */
212 ~(~0ULL << f->bits_per_field[BKEY_FIELD_SNAPSHOT]);
/* When write is zero the offset becomes U32_MAX - max_packed. */
214 f->field_offset[BKEY_FIELD_SNAPSHOT] = write
216 : U32_MAX - max_packed;
/*
 * Convert a single position between the on-disk layout of an older metadata
 * version and the current in-memory layout, in place.
 *
 * NOTE(review): the statement executed when @big_endian differs from
 * CPU_BIG_ENDIAN is not visible in this view - presumably a byte swap of *p;
 * confirm. @level and @write are not referenced in the lines visible here.
 */
220 static inline void compat_bpos(unsigned level, enum btree_id btree_id,
221 unsigned version, unsigned big_endian,
222 int write, struct bpos *p)
224 if (big_endian != CPU_BIG_ENDIAN)
/* Before inode_btree_change, the inodes btree stored inode and offset swapped. */
227 if (version < bcachefs_metadata_version_inode_btree_change &&
228 btree_id == BTREE_ID_inodes)
229 swap(p->inode, p->offset);
/*
 * Apply version compatibility fixups to the min_key/max_key of a btree node.
 *
 * Both keys are passed through compat_bpos(). Around that call there are two
 * pairs of adjustments; in each pair, one is placed before the call and its
 * inverse after it:
 *  - for versions before inode_btree_change on extents-type btrees, when
 *    min_key differs from POS_MIN: min_key is moved to its no-snapshot
 *    predecessor (before) or successor (after);
 *  - for versions before snapshot: max_key.snapshot is set to 0 (before) or
 *    U32_MAX (after).
 *
 * NOTE(review): each condition has a further operand that is not visible in
 * this view - presumably it selects the write or read direction so that only
 * one member of each pair runs; confirm against the full source.
 */
232 static inline void compat_btree_node(unsigned level, enum btree_id btree_id,
233 unsigned version, unsigned big_endian,
235 struct btree_node *bn)
237 if (version < bcachefs_metadata_version_inode_btree_change &&
238 btree_node_type_is_extents(btree_id) &&
239 bpos_cmp(bn->min_key, POS_MIN) &&
241 bn->min_key = bpos_nosnap_predecessor(bn->min_key);
243 if (version < bcachefs_metadata_version_snapshot &&
245 bn->max_key.snapshot = 0;
/* Endianness and inode/offset fixups, applied to both boundary keys. */
247 compat_bpos(level, btree_id, version, big_endian, write, &bn->min_key);
248 compat_bpos(level, btree_id, version, big_endian, write, &bn->max_key);
250 if (version < bcachefs_metadata_version_snapshot &&
252 bn->max_key.snapshot = U32_MAX;
254 if (version < bcachefs_metadata_version_inode_btree_change &&
255 btree_node_type_is_extents(btree_id) &&
256 bpos_cmp(bn->min_key, POS_MIN) &&
258 bn->min_key = bpos_nosnap_successor(bn->min_key);
261 #endif /* _BCACHEFS_BTREE_IO_H */