]> git.sesse.net Git - bcachefs-tools-debian/blob - libbcachefs/disk_groups.c
Update bcachefs sources to 7bf1ac0d46 bcachefs: Correctly initialize new buckets...
[bcachefs-tools-debian] / libbcachefs / disk_groups.c
1 // SPDX-License-Identifier: GPL-2.0
2 #include "bcachefs.h"
3 #include "disk_groups.h"
4 #include "sb-members.h"
5 #include "super-io.h"
6
7 #include <linux/sort.h>
8
9 static int group_cmp(const void *_l, const void *_r)
10 {
11         const struct bch_disk_group *l = _l;
12         const struct bch_disk_group *r = _r;
13
14         return ((BCH_GROUP_DELETED(l) > BCH_GROUP_DELETED(r)) -
15                 (BCH_GROUP_DELETED(l) < BCH_GROUP_DELETED(r))) ?:
16                 ((BCH_GROUP_PARENT(l) > BCH_GROUP_PARENT(r)) -
17                  (BCH_GROUP_PARENT(l) < BCH_GROUP_PARENT(r))) ?:
18                 strncmp(l->label, r->label, sizeof(l->label));
19 }
20
21 static int bch2_sb_disk_groups_validate(struct bch_sb *sb,
22                                         struct bch_sb_field *f,
23                                         struct printbuf *err)
24 {
25         struct bch_sb_field_disk_groups *groups =
26                 field_to_type(f, disk_groups);
27         struct bch_disk_group *g, *sorted = NULL;
28         unsigned nr_groups = disk_groups_nr(groups);
29         unsigned i, len;
30         int ret = 0;
31
32         for (i = 0; i < sb->nr_devices; i++) {
33                 struct bch_member m = bch2_sb_member_get(sb, i);
34                 unsigned group_id;
35
36                 if (!BCH_MEMBER_GROUP(&m))
37                         continue;
38
39                 group_id = BCH_MEMBER_GROUP(&m) - 1;
40
41                 if (group_id >= nr_groups) {
42                         prt_printf(err, "disk %u has invalid label %u (have %u)",
43                                    i, group_id, nr_groups);
44                         return -BCH_ERR_invalid_sb_disk_groups;
45                 }
46
47                 if (BCH_GROUP_DELETED(&groups->entries[group_id])) {
48                         prt_printf(err, "disk %u has deleted label %u", i, group_id);
49                         return -BCH_ERR_invalid_sb_disk_groups;
50                 }
51         }
52
53         if (!nr_groups)
54                 return 0;
55
56         for (i = 0; i < nr_groups; i++) {
57                 g = groups->entries + i;
58
59                 if (BCH_GROUP_DELETED(g))
60                         continue;
61
62                 len = strnlen(g->label, sizeof(g->label));
63                 if (!len) {
64                         prt_printf(err, "label %u empty", i);
65                         return -BCH_ERR_invalid_sb_disk_groups;
66                 }
67         }
68
69         sorted = kmalloc_array(nr_groups, sizeof(*sorted), GFP_KERNEL);
70         if (!sorted)
71                 return -BCH_ERR_ENOMEM_disk_groups_validate;
72
73         memcpy(sorted, groups->entries, nr_groups * sizeof(*sorted));
74         sort(sorted, nr_groups, sizeof(*sorted), group_cmp, NULL);
75
76         for (g = sorted; g + 1 < sorted + nr_groups; g++)
77                 if (!BCH_GROUP_DELETED(g) &&
78                     !group_cmp(&g[0], &g[1])) {
79                         prt_printf(err, "duplicate label %llu.%.*s",
80                                BCH_GROUP_PARENT(g),
81                                (int) sizeof(g->label), g->label);
82                         ret = -BCH_ERR_invalid_sb_disk_groups;
83                         goto err;
84                 }
85 err:
86         kfree(sorted);
87         return ret;
88 }
89
90 void bch2_disk_groups_to_text(struct printbuf *out, struct bch_fs *c)
91 {
92         struct bch_disk_groups_cpu *g;
93         struct bch_dev *ca;
94         int i;
95         unsigned iter;
96
97         out->atomic++;
98         rcu_read_lock();
99
100         g = rcu_dereference(c->disk_groups);
101         if (!g)
102                 goto out;
103
104         for (i = 0; i < g->nr; i++) {
105                 if (i)
106                         prt_printf(out, " ");
107
108                 if (g->entries[i].deleted) {
109                         prt_printf(out, "[deleted]");
110                         continue;
111                 }
112
113                 prt_printf(out, "[parent %d devs", g->entries[i].parent);
114                 for_each_member_device_rcu(ca, c, iter, &g->entries[i].devs)
115                         prt_printf(out, " %s", ca->name);
116                 prt_printf(out, "]");
117         }
118
119 out:
120         rcu_read_unlock();
121         out->atomic--;
122 }
123
124 static void bch2_sb_disk_groups_to_text(struct printbuf *out,
125                                         struct bch_sb *sb,
126                                         struct bch_sb_field *f)
127 {
128         struct bch_sb_field_disk_groups *groups =
129                 field_to_type(f, disk_groups);
130         struct bch_disk_group *g;
131         unsigned nr_groups = disk_groups_nr(groups);
132
133         for (g = groups->entries;
134              g < groups->entries + nr_groups;
135              g++) {
136                 if (g != groups->entries)
137                         prt_printf(out, " ");
138
139                 if (BCH_GROUP_DELETED(g))
140                         prt_printf(out, "[deleted]");
141                 else
142                         prt_printf(out, "[parent %llu name %s]",
143                                BCH_GROUP_PARENT(g), g->label);
144         }
145 }
146
147 const struct bch_sb_field_ops bch_sb_field_ops_disk_groups = {
148         .validate       = bch2_sb_disk_groups_validate,
149         .to_text        = bch2_sb_disk_groups_to_text
150 };
151
152 int bch2_sb_disk_groups_to_cpu(struct bch_fs *c)
153 {
154         struct bch_sb_field_disk_groups *groups;
155         struct bch_disk_groups_cpu *cpu_g, *old_g;
156         unsigned i, g, nr_groups;
157
158         lockdep_assert_held(&c->sb_lock);
159
160         groups          = bch2_sb_get_disk_groups(c->disk_sb.sb);
161         nr_groups       = disk_groups_nr(groups);
162
163         if (!groups)
164                 return 0;
165
166         cpu_g = kzalloc(sizeof(*cpu_g) +
167                         sizeof(cpu_g->entries[0]) * nr_groups, GFP_KERNEL);
168         if (!cpu_g)
169                 return -BCH_ERR_ENOMEM_disk_groups_to_cpu;
170
171         cpu_g->nr = nr_groups;
172
173         for (i = 0; i < nr_groups; i++) {
174                 struct bch_disk_group *src      = &groups->entries[i];
175                 struct bch_disk_group_cpu *dst  = &cpu_g->entries[i];
176
177                 dst->deleted    = BCH_GROUP_DELETED(src);
178                 dst->parent     = BCH_GROUP_PARENT(src);
179         }
180
181         for (i = 0; i < c->disk_sb.sb->nr_devices; i++) {
182                 struct bch_member m = bch2_sb_member_get(c->disk_sb.sb, i);
183                 struct bch_disk_group_cpu *dst;
184
185                 if (!bch2_member_exists(&m))
186                         continue;
187
188                 g = BCH_MEMBER_GROUP(&m);
189                 while (g) {
190                         dst = &cpu_g->entries[g - 1];
191                         __set_bit(i, dst->devs.d);
192                         g = dst->parent;
193                 }
194         }
195
196         old_g = rcu_dereference_protected(c->disk_groups,
197                                 lockdep_is_held(&c->sb_lock));
198         rcu_assign_pointer(c->disk_groups, cpu_g);
199         if (old_g)
200                 kfree_rcu(old_g, rcu);
201
202         return 0;
203 }
204
205 const struct bch_devs_mask *bch2_target_to_mask(struct bch_fs *c, unsigned target)
206 {
207         struct target t = target_decode(target);
208         struct bch_devs_mask *devs;
209
210         rcu_read_lock();
211
212         switch (t.type) {
213         case TARGET_NULL:
214                 devs = NULL;
215                 break;
216         case TARGET_DEV: {
217                 struct bch_dev *ca = t.dev < c->sb.nr_devices
218                         ? rcu_dereference(c->devs[t.dev])
219                         : NULL;
220                 devs = ca ? &ca->self : NULL;
221                 break;
222         }
223         case TARGET_GROUP: {
224                 struct bch_disk_groups_cpu *g = rcu_dereference(c->disk_groups);
225
226                 devs = g && t.group < g->nr && !g->entries[t.group].deleted
227                         ? &g->entries[t.group].devs
228                         : NULL;
229                 break;
230         }
231         default:
232                 BUG();
233         }
234
235         rcu_read_unlock();
236
237         return devs;
238 }
239
240 bool bch2_dev_in_target(struct bch_fs *c, unsigned dev, unsigned target)
241 {
242         struct target t = target_decode(target);
243
244         switch (t.type) {
245         case TARGET_NULL:
246                 return false;
247         case TARGET_DEV:
248                 return dev == t.dev;
249         case TARGET_GROUP: {
250                 struct bch_disk_groups_cpu *g;
251                 const struct bch_devs_mask *m;
252                 bool ret;
253
254                 rcu_read_lock();
255                 g = rcu_dereference(c->disk_groups);
256                 m = g && t.group < g->nr && !g->entries[t.group].deleted
257                         ? &g->entries[t.group].devs
258                         : NULL;
259
260                 ret = m ? test_bit(dev, m->d) : false;
261                 rcu_read_unlock();
262
263                 return ret;
264         }
265         default:
266                 BUG();
267         }
268 }
269
270 static int __bch2_disk_group_find(struct bch_sb_field_disk_groups *groups,
271                                   unsigned parent,
272                                   const char *name, unsigned namelen)
273 {
274         unsigned i, nr_groups = disk_groups_nr(groups);
275
276         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
277                 return -EINVAL;
278
279         for (i = 0; i < nr_groups; i++) {
280                 struct bch_disk_group *g = groups->entries + i;
281
282                 if (BCH_GROUP_DELETED(g))
283                         continue;
284
285                 if (!BCH_GROUP_DELETED(g) &&
286                     BCH_GROUP_PARENT(g) == parent &&
287                     strnlen(g->label, sizeof(g->label)) == namelen &&
288                     !memcmp(name, g->label, namelen))
289                         return i;
290         }
291
292         return -1;
293 }
294
295 static int __bch2_disk_group_add(struct bch_sb_handle *sb, unsigned parent,
296                                  const char *name, unsigned namelen)
297 {
298         struct bch_sb_field_disk_groups *groups =
299                 bch2_sb_get_disk_groups(sb->sb);
300         unsigned i, nr_groups = disk_groups_nr(groups);
301         struct bch_disk_group *g;
302
303         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
304                 return -EINVAL;
305
306         for (i = 0;
307              i < nr_groups && !BCH_GROUP_DELETED(&groups->entries[i]);
308              i++)
309                 ;
310
311         if (i == nr_groups) {
312                 unsigned u64s =
313                         (sizeof(struct bch_sb_field_disk_groups) +
314                          sizeof(struct bch_disk_group) * (nr_groups + 1)) /
315                         sizeof(u64);
316
317                 groups = bch2_sb_resize_disk_groups(sb, u64s);
318                 if (!groups)
319                         return -BCH_ERR_ENOSPC_disk_label_add;
320
321                 nr_groups = disk_groups_nr(groups);
322         }
323
324         BUG_ON(i >= nr_groups);
325
326         g = &groups->entries[i];
327
328         memcpy(g->label, name, namelen);
329         if (namelen < sizeof(g->label))
330                 g->label[namelen] = '\0';
331         SET_BCH_GROUP_DELETED(g, 0);
332         SET_BCH_GROUP_PARENT(g, parent);
333         SET_BCH_GROUP_DATA_ALLOWED(g, ~0);
334
335         return i;
336 }
337
338 int bch2_disk_path_find(struct bch_sb_handle *sb, const char *name)
339 {
340         struct bch_sb_field_disk_groups *groups =
341                 bch2_sb_get_disk_groups(sb->sb);
342         int v = -1;
343
344         do {
345                 const char *next = strchrnul(name, '.');
346                 unsigned len = next - name;
347
348                 if (*next == '.')
349                         next++;
350
351                 v = __bch2_disk_group_find(groups, v + 1, name, len);
352                 name = next;
353         } while (*name && v >= 0);
354
355         return v;
356 }
357
358 int bch2_disk_path_find_or_create(struct bch_sb_handle *sb, const char *name)
359 {
360         struct bch_sb_field_disk_groups *groups;
361         unsigned parent = 0;
362         int v = -1;
363
364         do {
365                 const char *next = strchrnul(name, '.');
366                 unsigned len = next - name;
367
368                 if (*next == '.')
369                         next++;
370
371                 groups = bch2_sb_get_disk_groups(sb->sb);
372
373                 v = __bch2_disk_group_find(groups, parent, name, len);
374                 if (v < 0)
375                         v = __bch2_disk_group_add(sb, parent, name, len);
376                 if (v < 0)
377                         return v;
378
379                 parent = v + 1;
380                 name = next;
381         } while (*name && v >= 0);
382
383         return v;
384 }
385
386 void bch2_disk_path_to_text(struct printbuf *out, struct bch_sb *sb, unsigned v)
387 {
388         struct bch_sb_field_disk_groups *groups =
389                 bch2_sb_get_disk_groups(sb);
390         struct bch_disk_group *g;
391         unsigned nr = 0;
392         u16 path[32];
393
394         while (1) {
395                 if (nr == ARRAY_SIZE(path))
396                         goto inval;
397
398                 if (v >= disk_groups_nr(groups))
399                         goto inval;
400
401                 g = groups->entries + v;
402
403                 if (BCH_GROUP_DELETED(g))
404                         goto inval;
405
406                 path[nr++] = v;
407
408                 if (!BCH_GROUP_PARENT(g))
409                         break;
410
411                 v = BCH_GROUP_PARENT(g) - 1;
412         }
413
414         while (nr) {
415                 v = path[--nr];
416                 g = groups->entries + v;
417
418                 prt_printf(out, "%.*s", (int) sizeof(g->label), g->label);
419                 if (nr)
420                         prt_printf(out, ".");
421         }
422         return;
423 inval:
424         prt_printf(out, "invalid label %u", v);
425 }
426
427 int __bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
428 {
429         struct bch_member *mi;
430         int ret, v = -1;
431
432         if (!strlen(name) || !strcmp(name, "none"))
433                 return 0;
434
435         v = bch2_disk_path_find_or_create(&c->disk_sb, name);
436         if (v < 0)
437                 return v;
438
439         ret = bch2_sb_disk_groups_to_cpu(c);
440         if (ret)
441                 return ret;
442
443         mi = bch2_members_v2_get_mut(c->disk_sb.sb, ca->dev_idx);
444         SET_BCH_MEMBER_GROUP(mi, v + 1);
445         return 0;
446 }
447
448 int bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
449 {
450         int ret;
451
452         mutex_lock(&c->sb_lock);
453         ret = __bch2_dev_group_set(c, ca, name) ?:
454                 bch2_write_super(c);
455         mutex_unlock(&c->sb_lock);
456
457         return ret;
458 }
459
460 int bch2_opt_target_parse(struct bch_fs *c, const char *val, u64 *res,
461                           struct printbuf *err)
462 {
463         struct bch_dev *ca;
464         int g;
465
466         if (!val)
467                 return -EINVAL;
468
469         if (!c)
470                 return 0;
471
472         if (!strlen(val) || !strcmp(val, "none")) {
473                 *res = 0;
474                 return 0;
475         }
476
477         /* Is it a device? */
478         ca = bch2_dev_lookup(c, val);
479         if (!IS_ERR(ca)) {
480                 *res = dev_to_target(ca->dev_idx);
481                 percpu_ref_put(&ca->ref);
482                 return 0;
483         }
484
485         mutex_lock(&c->sb_lock);
486         g = bch2_disk_path_find(&c->disk_sb, val);
487         mutex_unlock(&c->sb_lock);
488
489         if (g >= 0) {
490                 *res = group_to_target(g);
491                 return 0;
492         }
493
494         return -EINVAL;
495 }
496
497 void bch2_opt_target_to_text(struct printbuf *out,
498                              struct bch_fs *c,
499                              struct bch_sb *sb,
500                              u64 v)
501 {
502         struct target t = target_decode(v);
503
504         switch (t.type) {
505         case TARGET_NULL:
506                 prt_printf(out, "none");
507                 break;
508         case TARGET_DEV:
509                 if (c) {
510                         struct bch_dev *ca;
511
512                         rcu_read_lock();
513                         ca = t.dev < c->sb.nr_devices
514                                 ? rcu_dereference(c->devs[t.dev])
515                                 : NULL;
516
517                         if (ca && percpu_ref_tryget(&ca->io_ref)) {
518                                 prt_printf(out, "/dev/%pg", ca->disk_sb.bdev);
519                                 percpu_ref_put(&ca->io_ref);
520                         } else if (ca) {
521                                 prt_printf(out, "offline device %u", t.dev);
522                         } else {
523                                 prt_printf(out, "invalid device %u", t.dev);
524                         }
525
526                         rcu_read_unlock();
527                 } else {
528                         struct bch_member m = bch2_sb_member_get(sb, t.dev);
529
530                         if (bch2_dev_exists(sb, t.dev)) {
531                                 prt_printf(out, "Device ");
532                                 pr_uuid(out, m.uuid.b);
533                                 prt_printf(out, " (%u)", t.dev);
534                         } else {
535                                 prt_printf(out, "Bad device %u", t.dev);
536                         }
537                 }
538                 break;
539         case TARGET_GROUP:
540                 if (c) {
541                         mutex_lock(&c->sb_lock);
542                         bch2_disk_path_to_text(out, c->disk_sb.sb, t.group);
543                         mutex_unlock(&c->sb_lock);
544                 } else {
545                         bch2_disk_path_to_text(out, sb, t.group);
546                 }
547                 break;
548         default:
549                 BUG();
550         }
551 }