]> git.sesse.net Git - bcachefs-tools-debian/blob - libbcachefs/disk_groups.c
b292dbef799211ca71bf132152c9d9d5ff464d70
[bcachefs-tools-debian] / libbcachefs / disk_groups.c
1 // SPDX-License-Identifier: GPL-2.0
2 #include "bcachefs.h"
3 #include "disk_groups.h"
4 #include "sb-members.h"
5 #include "super-io.h"
6
7 #include <linux/sort.h>
8
9 static int group_cmp(const void *_l, const void *_r)
10 {
11         const struct bch_disk_group *l = _l;
12         const struct bch_disk_group *r = _r;
13
14         return ((BCH_GROUP_DELETED(l) > BCH_GROUP_DELETED(r)) -
15                 (BCH_GROUP_DELETED(l) < BCH_GROUP_DELETED(r))) ?:
16                 ((BCH_GROUP_PARENT(l) > BCH_GROUP_PARENT(r)) -
17                  (BCH_GROUP_PARENT(l) < BCH_GROUP_PARENT(r))) ?:
18                 strncmp(l->label, r->label, sizeof(l->label));
19 }
20
21 static int bch2_sb_disk_groups_validate(struct bch_sb *sb,
22                                         struct bch_sb_field *f,
23                                         struct printbuf *err)
24 {
25         struct bch_sb_field_disk_groups *groups =
26                 field_to_type(f, disk_groups);
27         struct bch_disk_group *g, *sorted = NULL;
28         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
29         unsigned nr_groups = disk_groups_nr(groups);
30         unsigned i, len;
31         int ret = 0;
32
33         for (i = 0; i < sb->nr_devices; i++) {
34                 struct bch_member *m = mi->members + i;
35                 unsigned group_id;
36
37                 if (!BCH_MEMBER_GROUP(m))
38                         continue;
39
40                 group_id = BCH_MEMBER_GROUP(m) - 1;
41
42                 if (group_id >= nr_groups) {
43                         prt_printf(err, "disk %u has invalid label %u (have %u)",
44                                    i, group_id, nr_groups);
45                         return -BCH_ERR_invalid_sb_disk_groups;
46                 }
47
48                 if (BCH_GROUP_DELETED(&groups->entries[group_id])) {
49                         prt_printf(err, "disk %u has deleted label %u", i, group_id);
50                         return -BCH_ERR_invalid_sb_disk_groups;
51                 }
52         }
53
54         if (!nr_groups)
55                 return 0;
56
57         for (i = 0; i < nr_groups; i++) {
58                 g = groups->entries + i;
59
60                 if (BCH_GROUP_DELETED(g))
61                         continue;
62
63                 len = strnlen(g->label, sizeof(g->label));
64                 if (!len) {
65                         prt_printf(err, "label %u empty", i);
66                         return -BCH_ERR_invalid_sb_disk_groups;
67                 }
68         }
69
70         sorted = kmalloc_array(nr_groups, sizeof(*sorted), GFP_KERNEL);
71         if (!sorted)
72                 return -BCH_ERR_ENOMEM_disk_groups_validate;
73
74         memcpy(sorted, groups->entries, nr_groups * sizeof(*sorted));
75         sort(sorted, nr_groups, sizeof(*sorted), group_cmp, NULL);
76
77         for (g = sorted; g + 1 < sorted + nr_groups; g++)
78                 if (!BCH_GROUP_DELETED(g) &&
79                     !group_cmp(&g[0], &g[1])) {
80                         prt_printf(err, "duplicate label %llu.%.*s",
81                                BCH_GROUP_PARENT(g),
82                                (int) sizeof(g->label), g->label);
83                         ret = -BCH_ERR_invalid_sb_disk_groups;
84                         goto err;
85                 }
86 err:
87         kfree(sorted);
88         return ret;
89 }
90
91 void bch2_disk_groups_to_text(struct printbuf *out, struct bch_fs *c)
92 {
93         struct bch_disk_groups_cpu *g;
94         struct bch_dev *ca;
95         int i;
96         unsigned iter;
97
98         out->atomic++;
99         rcu_read_lock();
100
101         g = rcu_dereference(c->disk_groups);
102         if (!g)
103                 goto out;
104
105         for (i = 0; i < g->nr; i++) {
106                 if (i)
107                         prt_printf(out, " ");
108
109                 if (g->entries[i].deleted) {
110                         prt_printf(out, "[deleted]");
111                         continue;
112                 }
113
114                 prt_printf(out, "[parent %d devs", g->entries[i].parent);
115                 for_each_member_device_rcu(ca, c, iter, &g->entries[i].devs)
116                         prt_printf(out, " %s", ca->name);
117                 prt_printf(out, "]");
118         }
119
120 out:
121         rcu_read_unlock();
122         out->atomic--;
123 }
124
125 static void bch2_sb_disk_groups_to_text(struct printbuf *out,
126                                         struct bch_sb *sb,
127                                         struct bch_sb_field *f)
128 {
129         struct bch_sb_field_disk_groups *groups =
130                 field_to_type(f, disk_groups);
131         struct bch_disk_group *g;
132         unsigned nr_groups = disk_groups_nr(groups);
133
134         for (g = groups->entries;
135              g < groups->entries + nr_groups;
136              g++) {
137                 if (g != groups->entries)
138                         prt_printf(out, " ");
139
140                 if (BCH_GROUP_DELETED(g))
141                         prt_printf(out, "[deleted]");
142                 else
143                         prt_printf(out, "[parent %llu name %s]",
144                                BCH_GROUP_PARENT(g), g->label);
145         }
146 }
147
148 const struct bch_sb_field_ops bch_sb_field_ops_disk_groups = {
149         .validate       = bch2_sb_disk_groups_validate,
150         .to_text        = bch2_sb_disk_groups_to_text
151 };
152
153 int bch2_sb_disk_groups_to_cpu(struct bch_fs *c)
154 {
155         struct bch_sb_field_members *mi;
156         struct bch_sb_field_disk_groups *groups;
157         struct bch_disk_groups_cpu *cpu_g, *old_g;
158         unsigned i, g, nr_groups;
159
160         lockdep_assert_held(&c->sb_lock);
161
162         mi              = bch2_sb_get_members(c->disk_sb.sb);
163         groups          = bch2_sb_get_disk_groups(c->disk_sb.sb);
164         nr_groups       = disk_groups_nr(groups);
165
166         if (!groups)
167                 return 0;
168
169         cpu_g = kzalloc(sizeof(*cpu_g) +
170                         sizeof(cpu_g->entries[0]) * nr_groups, GFP_KERNEL);
171         if (!cpu_g)
172                 return -BCH_ERR_ENOMEM_disk_groups_to_cpu;
173
174         cpu_g->nr = nr_groups;
175
176         for (i = 0; i < nr_groups; i++) {
177                 struct bch_disk_group *src      = &groups->entries[i];
178                 struct bch_disk_group_cpu *dst  = &cpu_g->entries[i];
179
180                 dst->deleted    = BCH_GROUP_DELETED(src);
181                 dst->parent     = BCH_GROUP_PARENT(src);
182         }
183
184         for (i = 0; i < c->disk_sb.sb->nr_devices; i++) {
185                 struct bch_member *m = mi->members + i;
186                 struct bch_disk_group_cpu *dst;
187
188                 if (!bch2_member_exists(m))
189                         continue;
190
191                 g = BCH_MEMBER_GROUP(m);
192                 while (g) {
193                         dst = &cpu_g->entries[g - 1];
194                         __set_bit(i, dst->devs.d);
195                         g = dst->parent;
196                 }
197         }
198
199         old_g = rcu_dereference_protected(c->disk_groups,
200                                 lockdep_is_held(&c->sb_lock));
201         rcu_assign_pointer(c->disk_groups, cpu_g);
202         if (old_g)
203                 kfree_rcu(old_g, rcu);
204
205         return 0;
206 }
207
208 const struct bch_devs_mask *bch2_target_to_mask(struct bch_fs *c, unsigned target)
209 {
210         struct target t = target_decode(target);
211         struct bch_devs_mask *devs;
212
213         rcu_read_lock();
214
215         switch (t.type) {
216         case TARGET_NULL:
217                 devs = NULL;
218                 break;
219         case TARGET_DEV: {
220                 struct bch_dev *ca = t.dev < c->sb.nr_devices
221                         ? rcu_dereference(c->devs[t.dev])
222                         : NULL;
223                 devs = ca ? &ca->self : NULL;
224                 break;
225         }
226         case TARGET_GROUP: {
227                 struct bch_disk_groups_cpu *g = rcu_dereference(c->disk_groups);
228
229                 devs = g && t.group < g->nr && !g->entries[t.group].deleted
230                         ? &g->entries[t.group].devs
231                         : NULL;
232                 break;
233         }
234         default:
235                 BUG();
236         }
237
238         rcu_read_unlock();
239
240         return devs;
241 }
242
243 bool bch2_dev_in_target(struct bch_fs *c, unsigned dev, unsigned target)
244 {
245         struct target t = target_decode(target);
246
247         switch (t.type) {
248         case TARGET_NULL:
249                 return false;
250         case TARGET_DEV:
251                 return dev == t.dev;
252         case TARGET_GROUP: {
253                 struct bch_disk_groups_cpu *g;
254                 const struct bch_devs_mask *m;
255                 bool ret;
256
257                 rcu_read_lock();
258                 g = rcu_dereference(c->disk_groups);
259                 m = g && t.group < g->nr && !g->entries[t.group].deleted
260                         ? &g->entries[t.group].devs
261                         : NULL;
262
263                 ret = m ? test_bit(dev, m->d) : false;
264                 rcu_read_unlock();
265
266                 return ret;
267         }
268         default:
269                 BUG();
270         }
271 }
272
273 static int __bch2_disk_group_find(struct bch_sb_field_disk_groups *groups,
274                                   unsigned parent,
275                                   const char *name, unsigned namelen)
276 {
277         unsigned i, nr_groups = disk_groups_nr(groups);
278
279         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
280                 return -EINVAL;
281
282         for (i = 0; i < nr_groups; i++) {
283                 struct bch_disk_group *g = groups->entries + i;
284
285                 if (BCH_GROUP_DELETED(g))
286                         continue;
287
288                 if (!BCH_GROUP_DELETED(g) &&
289                     BCH_GROUP_PARENT(g) == parent &&
290                     strnlen(g->label, sizeof(g->label)) == namelen &&
291                     !memcmp(name, g->label, namelen))
292                         return i;
293         }
294
295         return -1;
296 }
297
298 static int __bch2_disk_group_add(struct bch_sb_handle *sb, unsigned parent,
299                                  const char *name, unsigned namelen)
300 {
301         struct bch_sb_field_disk_groups *groups =
302                 bch2_sb_get_disk_groups(sb->sb);
303         unsigned i, nr_groups = disk_groups_nr(groups);
304         struct bch_disk_group *g;
305
306         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
307                 return -EINVAL;
308
309         for (i = 0;
310              i < nr_groups && !BCH_GROUP_DELETED(&groups->entries[i]);
311              i++)
312                 ;
313
314         if (i == nr_groups) {
315                 unsigned u64s =
316                         (sizeof(struct bch_sb_field_disk_groups) +
317                          sizeof(struct bch_disk_group) * (nr_groups + 1)) /
318                         sizeof(u64);
319
320                 groups = bch2_sb_resize_disk_groups(sb, u64s);
321                 if (!groups)
322                         return -BCH_ERR_ENOSPC_disk_label_add;
323
324                 nr_groups = disk_groups_nr(groups);
325         }
326
327         BUG_ON(i >= nr_groups);
328
329         g = &groups->entries[i];
330
331         memcpy(g->label, name, namelen);
332         if (namelen < sizeof(g->label))
333                 g->label[namelen] = '\0';
334         SET_BCH_GROUP_DELETED(g, 0);
335         SET_BCH_GROUP_PARENT(g, parent);
336         SET_BCH_GROUP_DATA_ALLOWED(g, ~0);
337
338         return i;
339 }
340
341 int bch2_disk_path_find(struct bch_sb_handle *sb, const char *name)
342 {
343         struct bch_sb_field_disk_groups *groups =
344                 bch2_sb_get_disk_groups(sb->sb);
345         int v = -1;
346
347         do {
348                 const char *next = strchrnul(name, '.');
349                 unsigned len = next - name;
350
351                 if (*next == '.')
352                         next++;
353
354                 v = __bch2_disk_group_find(groups, v + 1, name, len);
355                 name = next;
356         } while (*name && v >= 0);
357
358         return v;
359 }
360
361 int bch2_disk_path_find_or_create(struct bch_sb_handle *sb, const char *name)
362 {
363         struct bch_sb_field_disk_groups *groups;
364         unsigned parent = 0;
365         int v = -1;
366
367         do {
368                 const char *next = strchrnul(name, '.');
369                 unsigned len = next - name;
370
371                 if (*next == '.')
372                         next++;
373
374                 groups = bch2_sb_get_disk_groups(sb->sb);
375
376                 v = __bch2_disk_group_find(groups, parent, name, len);
377                 if (v < 0)
378                         v = __bch2_disk_group_add(sb, parent, name, len);
379                 if (v < 0)
380                         return v;
381
382                 parent = v + 1;
383                 name = next;
384         } while (*name && v >= 0);
385
386         return v;
387 }
388
389 void bch2_disk_path_to_text(struct printbuf *out, struct bch_sb *sb, unsigned v)
390 {
391         struct bch_sb_field_disk_groups *groups =
392                 bch2_sb_get_disk_groups(sb);
393         struct bch_disk_group *g;
394         unsigned nr = 0;
395         u16 path[32];
396
397         while (1) {
398                 if (nr == ARRAY_SIZE(path))
399                         goto inval;
400
401                 if (v >= disk_groups_nr(groups))
402                         goto inval;
403
404                 g = groups->entries + v;
405
406                 if (BCH_GROUP_DELETED(g))
407                         goto inval;
408
409                 path[nr++] = v;
410
411                 if (!BCH_GROUP_PARENT(g))
412                         break;
413
414                 v = BCH_GROUP_PARENT(g) - 1;
415         }
416
417         while (nr) {
418                 v = path[--nr];
419                 g = groups->entries + v;
420
421                 prt_printf(out, "%.*s", (int) sizeof(g->label), g->label);
422                 if (nr)
423                         prt_printf(out, ".");
424         }
425         return;
426 inval:
427         prt_printf(out, "invalid label %u", v);
428 }
429
430 int __bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
431 {
432         struct bch_member *mi;
433         int ret, v = -1;
434
435         if (!strlen(name) || !strcmp(name, "none"))
436                 return 0;
437
438         v = bch2_disk_path_find_or_create(&c->disk_sb, name);
439         if (v < 0)
440                 return v;
441
442         ret = bch2_sb_disk_groups_to_cpu(c);
443         if (ret)
444                 return ret;
445
446         mi = &bch2_sb_get_members(c->disk_sb.sb)->members[ca->dev_idx];
447         SET_BCH_MEMBER_GROUP(mi, v + 1);
448         return 0;
449 }
450
451 int bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
452 {
453         int ret;
454
455         mutex_lock(&c->sb_lock);
456         ret = __bch2_dev_group_set(c, ca, name) ?:
457                 bch2_write_super(c);
458         mutex_unlock(&c->sb_lock);
459
460         return ret;
461 }
462
463 int bch2_opt_target_parse(struct bch_fs *c, const char *val, u64 *res,
464                           struct printbuf *err)
465 {
466         struct bch_dev *ca;
467         int g;
468
469         if (!val)
470                 return -EINVAL;
471
472         if (!c)
473                 return 0;
474
475         if (!strlen(val) || !strcmp(val, "none")) {
476                 *res = 0;
477                 return 0;
478         }
479
480         /* Is it a device? */
481         ca = bch2_dev_lookup(c, val);
482         if (!IS_ERR(ca)) {
483                 *res = dev_to_target(ca->dev_idx);
484                 percpu_ref_put(&ca->ref);
485                 return 0;
486         }
487
488         mutex_lock(&c->sb_lock);
489         g = bch2_disk_path_find(&c->disk_sb, val);
490         mutex_unlock(&c->sb_lock);
491
492         if (g >= 0) {
493                 *res = group_to_target(g);
494                 return 0;
495         }
496
497         return -EINVAL;
498 }
499
500 void bch2_opt_target_to_text(struct printbuf *out,
501                              struct bch_fs *c,
502                              struct bch_sb *sb,
503                              u64 v)
504 {
505         struct target t = target_decode(v);
506
507         switch (t.type) {
508         case TARGET_NULL:
509                 prt_printf(out, "none");
510                 break;
511         case TARGET_DEV:
512                 if (c) {
513                         struct bch_dev *ca;
514
515                         rcu_read_lock();
516                         ca = t.dev < c->sb.nr_devices
517                                 ? rcu_dereference(c->devs[t.dev])
518                                 : NULL;
519
520                         if (ca && percpu_ref_tryget(&ca->io_ref)) {
521                                 prt_printf(out, "/dev/%pg", ca->disk_sb.bdev);
522                                 percpu_ref_put(&ca->io_ref);
523                         } else if (ca) {
524                                 prt_printf(out, "offline device %u", t.dev);
525                         } else {
526                                 prt_printf(out, "invalid device %u", t.dev);
527                         }
528
529                         rcu_read_unlock();
530                 } else {
531                         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
532                         struct bch_member *m = mi->members + t.dev;
533
534                         if (bch2_dev_exists(sb, mi, t.dev)) {
535                                 prt_printf(out, "Device ");
536                                 pr_uuid(out, m->uuid.b);
537                                 prt_printf(out, " (%u)", t.dev);
538                         } else {
539                                 prt_printf(out, "Bad device %u", t.dev);
540                         }
541                 }
542                 break;
543         case TARGET_GROUP:
544                 if (c) {
545                         mutex_lock(&c->sb_lock);
546                         bch2_disk_path_to_text(out, c->disk_sb.sb, t.group);
547                         mutex_unlock(&c->sb_lock);
548                 } else {
549                         bch2_disk_path_to_text(out, sb, t.group);
550                 }
551                 break;
552         default:
553                 BUG();
554         }
555 }