]> git.sesse.net Git - bcachefs-tools-debian/blob - libbcachefs/disk_groups.c
Update bcachefs sources to 070ec8d07b bcachefs: Snapshot depth, skiplist fields
[bcachefs-tools-debian] / libbcachefs / disk_groups.c
1 // SPDX-License-Identifier: GPL-2.0
2 #include "bcachefs.h"
3 #include "disk_groups.h"
4 #include "super-io.h"
5
6 #include <linux/sort.h>
7
8 static int group_cmp(const void *_l, const void *_r)
9 {
10         const struct bch_disk_group *l = _l;
11         const struct bch_disk_group *r = _r;
12
13         return ((BCH_GROUP_DELETED(l) > BCH_GROUP_DELETED(r)) -
14                 (BCH_GROUP_DELETED(l) < BCH_GROUP_DELETED(r))) ?:
15                 ((BCH_GROUP_PARENT(l) > BCH_GROUP_PARENT(r)) -
16                  (BCH_GROUP_PARENT(l) < BCH_GROUP_PARENT(r))) ?:
17                 strncmp(l->label, r->label, sizeof(l->label));
18 }
19
20 static int bch2_sb_disk_groups_validate(struct bch_sb *sb,
21                                         struct bch_sb_field *f,
22                                         struct printbuf *err)
23 {
24         struct bch_sb_field_disk_groups *groups =
25                 field_to_type(f, disk_groups);
26         struct bch_disk_group *g, *sorted = NULL;
27         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
28         unsigned nr_groups = disk_groups_nr(groups);
29         unsigned i, len;
30         int ret = 0;
31
32         for (i = 0; i < sb->nr_devices; i++) {
33                 struct bch_member *m = mi->members + i;
34                 unsigned g;
35
36                 if (!BCH_MEMBER_GROUP(m))
37                         continue;
38
39                 g = BCH_MEMBER_GROUP(m) - 1;
40
41                 if (g >= nr_groups) {
42                         prt_printf(err, "disk %u has invalid label %u (have %u)",
43                                i, g, nr_groups);
44                         return -BCH_ERR_invalid_sb_disk_groups;
45                 }
46
47                 if (BCH_GROUP_DELETED(&groups->entries[g])) {
48                         prt_printf(err, "disk %u has deleted label %u", i, g);
49                         return -BCH_ERR_invalid_sb_disk_groups;
50                 }
51         }
52
53         if (!nr_groups)
54                 return 0;
55
56         for (i = 0; i < nr_groups; i++) {
57                 g = groups->entries + i;
58
59                 if (BCH_GROUP_DELETED(g))
60                         continue;
61
62                 len = strnlen(g->label, sizeof(g->label));
63                 if (!len) {
64                         prt_printf(err, "label %u empty", i);
65                         return -BCH_ERR_invalid_sb_disk_groups;
66                 }
67         }
68
69         sorted = kmalloc_array(nr_groups, sizeof(*sorted), GFP_KERNEL);
70         if (!sorted)
71                 return -BCH_ERR_ENOMEM_disk_groups_validate;
72
73         memcpy(sorted, groups->entries, nr_groups * sizeof(*sorted));
74         sort(sorted, nr_groups, sizeof(*sorted), group_cmp, NULL);
75
76         for (g = sorted; g + 1 < sorted + nr_groups; g++)
77                 if (!BCH_GROUP_DELETED(g) &&
78                     !group_cmp(&g[0], &g[1])) {
79                         prt_printf(err, "duplicate label %llu.%.*s",
80                                BCH_GROUP_PARENT(g),
81                                (int) sizeof(g->label), g->label);
82                         ret = -BCH_ERR_invalid_sb_disk_groups;
83                         goto err;
84                 }
85 err:
86         kfree(sorted);
87         return ret;
88 }
89
90 void bch2_disk_groups_to_text(struct printbuf *out, struct bch_fs *c)
91 {
92         struct bch_disk_groups_cpu *g;
93         struct bch_dev *ca;
94         int i;
95         unsigned iter;
96
97         out->atomic++;
98         rcu_read_lock();
99
100         g = rcu_dereference(c->disk_groups);
101         if (!g)
102                 goto out;
103
104         for (i = 0; i < g->nr; i++) {
105                 if (i)
106                         prt_printf(out, " ");
107
108                 if (g->entries[i].deleted) {
109                         prt_printf(out, "[deleted]");
110                         continue;
111                 }
112
113                 prt_printf(out, "[parent %d devs", g->entries[i].parent);
114                 for_each_member_device_rcu(ca, c, iter, &g->entries[i].devs)
115                         prt_printf(out, " %s", ca->name);
116                 prt_printf(out, "]");
117         }
118
119 out:
120         rcu_read_unlock();
121         out->atomic--;
122 }
123
124 static void bch2_sb_disk_groups_to_text(struct printbuf *out,
125                                         struct bch_sb *sb,
126                                         struct bch_sb_field *f)
127 {
128         struct bch_sb_field_disk_groups *groups =
129                 field_to_type(f, disk_groups);
130         struct bch_disk_group *g;
131         unsigned nr_groups = disk_groups_nr(groups);
132
133         for (g = groups->entries;
134              g < groups->entries + nr_groups;
135              g++) {
136                 if (g != groups->entries)
137                         prt_printf(out, " ");
138
139                 if (BCH_GROUP_DELETED(g))
140                         prt_printf(out, "[deleted]");
141                 else
142                         prt_printf(out, "[parent %llu name %s]",
143                                BCH_GROUP_PARENT(g), g->label);
144         }
145 }
146
147 const struct bch_sb_field_ops bch_sb_field_ops_disk_groups = {
148         .validate       = bch2_sb_disk_groups_validate,
149         .to_text        = bch2_sb_disk_groups_to_text
150 };
151
152 int bch2_sb_disk_groups_to_cpu(struct bch_fs *c)
153 {
154         struct bch_sb_field_members *mi;
155         struct bch_sb_field_disk_groups *groups;
156         struct bch_disk_groups_cpu *cpu_g, *old_g;
157         unsigned i, g, nr_groups;
158
159         lockdep_assert_held(&c->sb_lock);
160
161         mi              = bch2_sb_get_members(c->disk_sb.sb);
162         groups          = bch2_sb_get_disk_groups(c->disk_sb.sb);
163         nr_groups       = disk_groups_nr(groups);
164
165         if (!groups)
166                 return 0;
167
168         cpu_g = kzalloc(sizeof(*cpu_g) +
169                         sizeof(cpu_g->entries[0]) * nr_groups, GFP_KERNEL);
170         if (!cpu_g)
171                 return -BCH_ERR_ENOMEM_disk_groups_to_cpu;
172
173         cpu_g->nr = nr_groups;
174
175         for (i = 0; i < nr_groups; i++) {
176                 struct bch_disk_group *src      = &groups->entries[i];
177                 struct bch_disk_group_cpu *dst  = &cpu_g->entries[i];
178
179                 dst->deleted    = BCH_GROUP_DELETED(src);
180                 dst->parent     = BCH_GROUP_PARENT(src);
181         }
182
183         for (i = 0; i < c->disk_sb.sb->nr_devices; i++) {
184                 struct bch_member *m = mi->members + i;
185                 struct bch_disk_group_cpu *dst =
186                         &cpu_g->entries[BCH_MEMBER_GROUP(m)];
187
188                 if (!bch2_member_exists(m))
189                         continue;
190
191                 g = BCH_MEMBER_GROUP(m);
192                 while (g) {
193                         dst = &cpu_g->entries[g - 1];
194                         __set_bit(i, dst->devs.d);
195                         g = dst->parent;
196                 }
197         }
198
199         old_g = rcu_dereference_protected(c->disk_groups,
200                                 lockdep_is_held(&c->sb_lock));
201         rcu_assign_pointer(c->disk_groups, cpu_g);
202         if (old_g)
203                 kfree_rcu(old_g, rcu);
204
205         return 0;
206 }
207
208 const struct bch_devs_mask *bch2_target_to_mask(struct bch_fs *c, unsigned target)
209 {
210         struct target t = target_decode(target);
211         struct bch_devs_mask *devs;
212
213         rcu_read_lock();
214
215         switch (t.type) {
216         case TARGET_NULL:
217                 devs = NULL;
218                 break;
219         case TARGET_DEV: {
220                 struct bch_dev *ca = t.dev < c->sb.nr_devices
221                         ? rcu_dereference(c->devs[t.dev])
222                         : NULL;
223                 devs = ca ? &ca->self : NULL;
224                 break;
225         }
226         case TARGET_GROUP: {
227                 struct bch_disk_groups_cpu *g = rcu_dereference(c->disk_groups);
228
229                 devs = g && t.group < g->nr && !g->entries[t.group].deleted
230                         ? &g->entries[t.group].devs
231                         : NULL;
232                 break;
233         }
234         default:
235                 BUG();
236         }
237
238         rcu_read_unlock();
239
240         return devs;
241 }
242
243 bool bch2_dev_in_target(struct bch_fs *c, unsigned dev, unsigned target)
244 {
245         struct target t = target_decode(target);
246
247         switch (t.type) {
248         case TARGET_NULL:
249                 return false;
250         case TARGET_DEV:
251                 return dev == t.dev;
252         case TARGET_GROUP: {
253                 struct bch_disk_groups_cpu *g;
254                 const struct bch_devs_mask *m;
255                 bool ret;
256
257                 rcu_read_lock();
258                 g = rcu_dereference(c->disk_groups);
259                 m = g && t.group < g->nr && !g->entries[t.group].deleted
260                         ? &g->entries[t.group].devs
261                         : NULL;
262
263                 ret = m ? test_bit(dev, m->d) : false;
264                 rcu_read_unlock();
265
266                 return ret;
267         }
268         default:
269                 BUG();
270         }
271 }
272
273 static int __bch2_disk_group_find(struct bch_sb_field_disk_groups *groups,
274                                   unsigned parent,
275                                   const char *name, unsigned namelen)
276 {
277         unsigned i, nr_groups = disk_groups_nr(groups);
278
279         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
280                 return -EINVAL;
281
282         for (i = 0; i < nr_groups; i++) {
283                 struct bch_disk_group *g = groups->entries + i;
284
285                 if (BCH_GROUP_DELETED(g))
286                         continue;
287
288                 if (!BCH_GROUP_DELETED(g) &&
289                     BCH_GROUP_PARENT(g) == parent &&
290                     strnlen(g->label, sizeof(g->label)) == namelen &&
291                     !memcmp(name, g->label, namelen))
292                         return i;
293         }
294
295         return -1;
296 }
297
298 static int __bch2_disk_group_add(struct bch_sb_handle *sb, unsigned parent,
299                                  const char *name, unsigned namelen)
300 {
301         struct bch_sb_field_disk_groups *groups =
302                 bch2_sb_get_disk_groups(sb->sb);
303         unsigned i, nr_groups = disk_groups_nr(groups);
304         struct bch_disk_group *g;
305
306         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
307                 return -EINVAL;
308
309         for (i = 0;
310              i < nr_groups && !BCH_GROUP_DELETED(&groups->entries[i]);
311              i++)
312                 ;
313
314         if (i == nr_groups) {
315                 unsigned u64s =
316                         (sizeof(struct bch_sb_field_disk_groups) +
317                          sizeof(struct bch_disk_group) * (nr_groups + 1)) /
318                         sizeof(u64);
319
320                 groups = bch2_sb_resize_disk_groups(sb, u64s);
321                 if (!groups)
322                         return -BCH_ERR_ENOSPC_disk_label_add;
323
324                 nr_groups = disk_groups_nr(groups);
325         }
326
327         BUG_ON(i >= nr_groups);
328
329         g = &groups->entries[i];
330
331         memcpy(g->label, name, namelen);
332         if (namelen < sizeof(g->label))
333                 g->label[namelen] = '\0';
334         SET_BCH_GROUP_DELETED(g, 0);
335         SET_BCH_GROUP_PARENT(g, parent);
336         SET_BCH_GROUP_DATA_ALLOWED(g, ~0);
337
338         return i;
339 }
340
341 int bch2_disk_path_find(struct bch_sb_handle *sb, const char *name)
342 {
343         struct bch_sb_field_disk_groups *groups =
344                 bch2_sb_get_disk_groups(sb->sb);
345         int v = -1;
346
347         do {
348                 const char *next = strchrnul(name, '.');
349                 unsigned len = next - name;
350
351                 if (*next == '.')
352                         next++;
353
354                 v = __bch2_disk_group_find(groups, v + 1, name, len);
355                 name = next;
356         } while (*name && v >= 0);
357
358         return v;
359 }
360
361 int bch2_disk_path_find_or_create(struct bch_sb_handle *sb, const char *name)
362 {
363         struct bch_sb_field_disk_groups *groups;
364         unsigned parent = 0;
365         int v = -1;
366
367         do {
368                 const char *next = strchrnul(name, '.');
369                 unsigned len = next - name;
370
371                 if (*next == '.')
372                         next++;
373
374                 groups = bch2_sb_get_disk_groups(sb->sb);
375
376                 v = __bch2_disk_group_find(groups, parent, name, len);
377                 if (v < 0)
378                         v = __bch2_disk_group_add(sb, parent, name, len);
379                 if (v < 0)
380                         return v;
381
382                 parent = v + 1;
383                 name = next;
384         } while (*name && v >= 0);
385
386         return v;
387 }
388
389 void bch2_disk_path_to_text(struct printbuf *out, struct bch_sb *sb, unsigned v)
390 {
391         struct bch_sb_field_disk_groups *groups =
392                 bch2_sb_get_disk_groups(sb);
393         struct bch_disk_group *g;
394         unsigned nr = 0;
395         u16 path[32];
396
397         while (1) {
398                 if (nr == ARRAY_SIZE(path))
399                         goto inval;
400
401                 if (v >= disk_groups_nr(groups))
402                         goto inval;
403
404                 g = groups->entries + v;
405
406                 if (BCH_GROUP_DELETED(g))
407                         goto inval;
408
409                 path[nr++] = v;
410
411                 if (!BCH_GROUP_PARENT(g))
412                         break;
413
414                 v = BCH_GROUP_PARENT(g) - 1;
415         }
416
417         while (nr) {
418                 v = path[--nr];
419                 g = groups->entries + v;
420
421                 prt_printf(out, "%.*s", (int) sizeof(g->label), g->label);
422                 if (nr)
423                         prt_printf(out, ".");
424         }
425         return;
426 inval:
427         prt_printf(out, "invalid label %u", v);
428 }
429
430 int __bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
431 {
432         struct bch_member *mi;
433         int ret, v = -1;
434
435         if (!strlen(name) || !strcmp(name, "none"))
436                 return 0;
437
438         v = bch2_disk_path_find_or_create(&c->disk_sb, name);
439         if (v < 0)
440                 return v;
441
442         ret = bch2_sb_disk_groups_to_cpu(c);
443         if (ret)
444                 return ret;
445
446         mi = &bch2_sb_get_members(c->disk_sb.sb)->members[ca->dev_idx];
447         SET_BCH_MEMBER_GROUP(mi, v + 1);
448         return 0;
449 }
450
451 int bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
452 {
453         int ret;
454
455         mutex_lock(&c->sb_lock);
456         ret = __bch2_dev_group_set(c, ca, name) ?:
457                 bch2_write_super(c);
458         mutex_unlock(&c->sb_lock);
459
460         return ret;
461 }
462
463 int bch2_opt_target_parse(struct bch_fs *c, const char *buf, u64 *v)
464 {
465         struct bch_dev *ca;
466         int g;
467
468         if (!strlen(buf) || !strcmp(buf, "none")) {
469                 *v = 0;
470                 return 0;
471         }
472
473         /* Is it a device? */
474         ca = bch2_dev_lookup(c, buf);
475         if (!IS_ERR(ca)) {
476                 *v = dev_to_target(ca->dev_idx);
477                 percpu_ref_put(&ca->ref);
478                 return 0;
479         }
480
481         mutex_lock(&c->sb_lock);
482         g = bch2_disk_path_find(&c->disk_sb, buf);
483         mutex_unlock(&c->sb_lock);
484
485         if (g >= 0) {
486                 *v = group_to_target(g);
487                 return 0;
488         }
489
490         return -EINVAL;
491 }
492
493 void bch2_opt_target_to_text(struct printbuf *out,
494                              struct bch_fs *c,
495                              struct bch_sb *sb,
496                              u64 v)
497 {
498         struct target t = target_decode(v);
499
500         switch (t.type) {
501         case TARGET_NULL:
502                 prt_printf(out, "none");
503                 break;
504         case TARGET_DEV:
505                 if (c) {
506                         struct bch_dev *ca;
507
508                         rcu_read_lock();
509                         ca = t.dev < c->sb.nr_devices
510                                 ? rcu_dereference(c->devs[t.dev])
511                                 : NULL;
512
513                         if (ca && percpu_ref_tryget(&ca->io_ref)) {
514                                 prt_printf(out, "/dev/%pg", ca->disk_sb.bdev);
515                                 percpu_ref_put(&ca->io_ref);
516                         } else if (ca) {
517                                 prt_printf(out, "offline device %u", t.dev);
518                         } else {
519                                 prt_printf(out, "invalid device %u", t.dev);
520                         }
521
522                         rcu_read_unlock();
523                 } else {
524                         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
525                         struct bch_member *m = mi->members + t.dev;
526
527                         if (bch2_dev_exists(sb, mi, t.dev)) {
528                                 prt_printf(out, "Device ");
529                                 pr_uuid(out, m->uuid.b);
530                                 prt_printf(out, " (%u)", t.dev);
531                         } else {
532                                 prt_printf(out, "Bad device %u", t.dev);
533                         }
534                 }
535                 break;
536         case TARGET_GROUP:
537                 if (c) {
538                         mutex_lock(&c->sb_lock);
539                         bch2_disk_path_to_text(out, c->disk_sb.sb, t.group);
540                         mutex_unlock(&c->sb_lock);
541                 } else {
542                         bch2_disk_path_to_text(out, sb, t.group);
543                 }
544                 break;
545         default:
546                 BUG();
547         }
548 }