]> git.sesse.net Git - bcachefs-tools-debian/blob - libbcachefs/disk_groups.c
Update bcachefs sources to 259ff91605 bcachefs: Don't keep around btree_paths unneces...
[bcachefs-tools-debian] / libbcachefs / disk_groups.c
1 // SPDX-License-Identifier: GPL-2.0
2 #include "bcachefs.h"
3 #include "disk_groups.h"
4 #include "super-io.h"
5
6 #include <linux/sort.h>
7
8 static int group_cmp(const void *_l, const void *_r)
9 {
10         const struct bch_disk_group *l = _l;
11         const struct bch_disk_group *r = _r;
12
13         return ((BCH_GROUP_DELETED(l) > BCH_GROUP_DELETED(r)) -
14                 (BCH_GROUP_DELETED(l) < BCH_GROUP_DELETED(r))) ?:
15                 ((BCH_GROUP_PARENT(l) > BCH_GROUP_PARENT(r)) -
16                  (BCH_GROUP_PARENT(l) < BCH_GROUP_PARENT(r))) ?:
17                 strncmp(l->label, r->label, sizeof(l->label));
18 }
19
20 static int bch2_sb_disk_groups_validate(struct bch_sb *sb,
21                                         struct bch_sb_field *f,
22                                         struct printbuf *err)
23 {
24         struct bch_sb_field_disk_groups *groups =
25                 field_to_type(f, disk_groups);
26         struct bch_disk_group *g, *sorted = NULL;
27         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
28         unsigned nr_groups = disk_groups_nr(groups);
29         unsigned i, len;
30         int ret = -EINVAL;
31
32         for (i = 0; i < sb->nr_devices; i++) {
33                 struct bch_member *m = mi->members + i;
34                 unsigned g;
35
36                 if (!BCH_MEMBER_GROUP(m))
37                         continue;
38
39                 g = BCH_MEMBER_GROUP(m) - 1;
40
41                 if (g >= nr_groups) {
42                         pr_buf(err, "disk %u has invalid label %u (have %u)",
43                                i, g, nr_groups);
44                         return -EINVAL;
45                 }
46
47                 if (BCH_GROUP_DELETED(&groups->entries[g])) {
48                         pr_buf(err, "disk %u has deleted label %u", i, g);
49                         return -EINVAL;
50                 }
51         }
52
53         if (!nr_groups)
54                 return 0;
55
56         for (i = 0; i < nr_groups; i++) {
57                 g = groups->entries + i;
58
59                 if (BCH_GROUP_DELETED(g))
60                         continue;
61
62                 len = strnlen(g->label, sizeof(g->label));
63                 if (!len) {
64                         pr_buf(err, "label %u empty", i);
65                         return -EINVAL;
66                 }
67         }
68
69         sorted = kmalloc_array(nr_groups, sizeof(*sorted), GFP_KERNEL);
70         if (!sorted)
71                 return -ENOMEM;
72
73         memcpy(sorted, groups->entries, nr_groups * sizeof(*sorted));
74         sort(sorted, nr_groups, sizeof(*sorted), group_cmp, NULL);
75
76         for (g = sorted; g + 1 < sorted + nr_groups; g++)
77                 if (!BCH_GROUP_DELETED(g) &&
78                     !group_cmp(&g[0], &g[1])) {
79                         pr_buf(err, "duplicate label %llu.%.*s",
80                                BCH_GROUP_PARENT(g),
81                                (int) sizeof(g->label), g->label);
82                         goto err;
83                 }
84
85         ret = 0;
86 err:
87         kfree(sorted);
88         return 0;
89 }
90
91 static void bch2_sb_disk_groups_to_text(struct printbuf *out,
92                                         struct bch_sb *sb,
93                                         struct bch_sb_field *f)
94 {
95         struct bch_sb_field_disk_groups *groups =
96                 field_to_type(f, disk_groups);
97         struct bch_disk_group *g;
98         unsigned nr_groups = disk_groups_nr(groups);
99
100         for (g = groups->entries;
101              g < groups->entries + nr_groups;
102              g++) {
103                 if (g != groups->entries)
104                         pr_buf(out, " ");
105
106                 if (BCH_GROUP_DELETED(g))
107                         pr_buf(out, "[deleted]");
108                 else
109                         pr_buf(out, "[parent %llu name %s]",
110                                BCH_GROUP_PARENT(g), g->label);
111         }
112 }
113
114 const struct bch_sb_field_ops bch_sb_field_ops_disk_groups = {
115         .validate       = bch2_sb_disk_groups_validate,
116         .to_text        = bch2_sb_disk_groups_to_text
117 };
118
119 int bch2_sb_disk_groups_to_cpu(struct bch_fs *c)
120 {
121         struct bch_sb_field_members *mi;
122         struct bch_sb_field_disk_groups *groups;
123         struct bch_disk_groups_cpu *cpu_g, *old_g;
124         unsigned i, g, nr_groups;
125
126         lockdep_assert_held(&c->sb_lock);
127
128         mi              = bch2_sb_get_members(c->disk_sb.sb);
129         groups          = bch2_sb_get_disk_groups(c->disk_sb.sb);
130         nr_groups       = disk_groups_nr(groups);
131
132         if (!groups)
133                 return 0;
134
135         cpu_g = kzalloc(sizeof(*cpu_g) +
136                         sizeof(cpu_g->entries[0]) * nr_groups, GFP_KERNEL);
137         if (!cpu_g)
138                 return -ENOMEM;
139
140         cpu_g->nr = nr_groups;
141
142         for (i = 0; i < nr_groups; i++) {
143                 struct bch_disk_group *src      = &groups->entries[i];
144                 struct bch_disk_group_cpu *dst  = &cpu_g->entries[i];
145
146                 dst->deleted    = BCH_GROUP_DELETED(src);
147                 dst->parent     = BCH_GROUP_PARENT(src);
148         }
149
150         for (i = 0; i < c->disk_sb.sb->nr_devices; i++) {
151                 struct bch_member *m = mi->members + i;
152                 struct bch_disk_group_cpu *dst =
153                         &cpu_g->entries[BCH_MEMBER_GROUP(m)];
154
155                 if (!bch2_member_exists(m))
156                         continue;
157
158                 g = BCH_MEMBER_GROUP(m);
159                 while (g) {
160                         dst = &cpu_g->entries[g - 1];
161                         __set_bit(i, dst->devs.d);
162                         g = dst->parent;
163                 }
164         }
165
166         old_g = rcu_dereference_protected(c->disk_groups,
167                                 lockdep_is_held(&c->sb_lock));
168         rcu_assign_pointer(c->disk_groups, cpu_g);
169         if (old_g)
170                 kfree_rcu(old_g, rcu);
171
172         return 0;
173 }
174
175 const struct bch_devs_mask *bch2_target_to_mask(struct bch_fs *c, unsigned target)
176 {
177         struct target t = target_decode(target);
178
179         switch (t.type) {
180         case TARGET_NULL:
181                 return NULL;
182         case TARGET_DEV: {
183                 struct bch_dev *ca = t.dev < c->sb.nr_devices
184                         ? rcu_dereference(c->devs[t.dev])
185                         : NULL;
186                 return ca ? &ca->self : NULL;
187         }
188         case TARGET_GROUP: {
189                 struct bch_disk_groups_cpu *g = rcu_dereference(c->disk_groups);
190
191                 return g && t.group < g->nr && !g->entries[t.group].deleted
192                         ? &g->entries[t.group].devs
193                         : NULL;
194         }
195         default:
196                 BUG();
197         }
198 }
199
200 bool bch2_dev_in_target(struct bch_fs *c, unsigned dev, unsigned target)
201 {
202         struct target t = target_decode(target);
203
204         switch (t.type) {
205         case TARGET_NULL:
206                 return false;
207         case TARGET_DEV:
208                 return dev == t.dev;
209         case TARGET_GROUP: {
210                 struct bch_disk_groups_cpu *g;
211                 const struct bch_devs_mask *m;
212                 bool ret;
213
214                 rcu_read_lock();
215                 g = rcu_dereference(c->disk_groups);
216                 m = g && t.group < g->nr && !g->entries[t.group].deleted
217                         ? &g->entries[t.group].devs
218                         : NULL;
219
220                 ret = m ? test_bit(dev, m->d) : false;
221                 rcu_read_unlock();
222
223                 return ret;
224         }
225         default:
226                 BUG();
227         }
228 }
229
230 static int __bch2_disk_group_find(struct bch_sb_field_disk_groups *groups,
231                                   unsigned parent,
232                                   const char *name, unsigned namelen)
233 {
234         unsigned i, nr_groups = disk_groups_nr(groups);
235
236         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
237                 return -EINVAL;
238
239         for (i = 0; i < nr_groups; i++) {
240                 struct bch_disk_group *g = groups->entries + i;
241
242                 if (BCH_GROUP_DELETED(g))
243                         continue;
244
245                 if (!BCH_GROUP_DELETED(g) &&
246                     BCH_GROUP_PARENT(g) == parent &&
247                     strnlen(g->label, sizeof(g->label)) == namelen &&
248                     !memcmp(name, g->label, namelen))
249                         return i;
250         }
251
252         return -1;
253 }
254
255 static int __bch2_disk_group_add(struct bch_sb_handle *sb, unsigned parent,
256                                  const char *name, unsigned namelen)
257 {
258         struct bch_sb_field_disk_groups *groups =
259                 bch2_sb_get_disk_groups(sb->sb);
260         unsigned i, nr_groups = disk_groups_nr(groups);
261         struct bch_disk_group *g;
262
263         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
264                 return -EINVAL;
265
266         for (i = 0;
267              i < nr_groups && !BCH_GROUP_DELETED(&groups->entries[i]);
268              i++)
269                 ;
270
271         if (i == nr_groups) {
272                 unsigned u64s =
273                         (sizeof(struct bch_sb_field_disk_groups) +
274                          sizeof(struct bch_disk_group) * (nr_groups + 1)) /
275                         sizeof(u64);
276
277                 groups = bch2_sb_resize_disk_groups(sb, u64s);
278                 if (!groups)
279                         return -ENOSPC;
280
281                 nr_groups = disk_groups_nr(groups);
282         }
283
284         BUG_ON(i >= nr_groups);
285
286         g = &groups->entries[i];
287
288         memcpy(g->label, name, namelen);
289         if (namelen < sizeof(g->label))
290                 g->label[namelen] = '\0';
291         SET_BCH_GROUP_DELETED(g, 0);
292         SET_BCH_GROUP_PARENT(g, parent);
293         SET_BCH_GROUP_DATA_ALLOWED(g, ~0);
294
295         return i;
296 }
297
298 int bch2_disk_path_find(struct bch_sb_handle *sb, const char *name)
299 {
300         struct bch_sb_field_disk_groups *groups =
301                 bch2_sb_get_disk_groups(sb->sb);
302         int v = -1;
303
304         do {
305                 const char *next = strchrnul(name, '.');
306                 unsigned len = next - name;
307
308                 if (*next == '.')
309                         next++;
310
311                 v = __bch2_disk_group_find(groups, v + 1, name, len);
312                 name = next;
313         } while (*name && v >= 0);
314
315         return v;
316 }
317
318 int bch2_disk_path_find_or_create(struct bch_sb_handle *sb, const char *name)
319 {
320         struct bch_sb_field_disk_groups *groups;
321         unsigned parent = 0;
322         int v = -1;
323
324         do {
325                 const char *next = strchrnul(name, '.');
326                 unsigned len = next - name;
327
328                 if (*next == '.')
329                         next++;
330
331                 groups = bch2_sb_get_disk_groups(sb->sb);
332
333                 v = __bch2_disk_group_find(groups, parent, name, len);
334                 if (v < 0)
335                         v = __bch2_disk_group_add(sb, parent, name, len);
336                 if (v < 0)
337                         return v;
338
339                 parent = v + 1;
340                 name = next;
341         } while (*name && v >= 0);
342
343         return v;
344 }
345
346 void bch2_disk_path_to_text(struct printbuf *out, struct bch_sb *sb, unsigned v)
347 {
348         struct bch_sb_field_disk_groups *groups =
349                 bch2_sb_get_disk_groups(sb);
350         struct bch_disk_group *g;
351         unsigned nr = 0;
352         u16 path[32];
353
354         while (1) {
355                 if (nr == ARRAY_SIZE(path))
356                         goto inval;
357
358                 if (v >= disk_groups_nr(groups))
359                         goto inval;
360
361                 g = groups->entries + v;
362
363                 if (BCH_GROUP_DELETED(g))
364                         goto inval;
365
366                 path[nr++] = v;
367
368                 if (!BCH_GROUP_PARENT(g))
369                         break;
370
371                 v = BCH_GROUP_PARENT(g) - 1;
372         }
373
374         while (nr) {
375                 v = path[--nr];
376                 g = groups->entries + v;
377
378                 pr_buf(out, "%.*s", (int) sizeof(g->label), g->label);
379                 if (nr)
380                         pr_buf(out, ".");
381         }
382         return;
383 inval:
384         pr_buf(out, "invalid label %u", v);
385 }
386
387 int bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
388 {
389         struct bch_member *mi;
390         int v = -1;
391         int ret = 0;
392
393         mutex_lock(&c->sb_lock);
394
395         if (!strlen(name) || !strcmp(name, "none"))
396                 goto write_sb;
397
398         v = bch2_disk_path_find_or_create(&c->disk_sb, name);
399         if (v < 0) {
400                 mutex_unlock(&c->sb_lock);
401                 return v;
402         }
403
404         ret = bch2_sb_disk_groups_to_cpu(c);
405         if (ret)
406                 goto unlock;
407 write_sb:
408         mi = &bch2_sb_get_members(c->disk_sb.sb)->members[ca->dev_idx];
409         SET_BCH_MEMBER_GROUP(mi, v + 1);
410
411         bch2_write_super(c);
412 unlock:
413         mutex_unlock(&c->sb_lock);
414
415         return ret;
416 }
417
418 int bch2_opt_target_parse(struct bch_fs *c, const char *buf, u64 *v)
419 {
420         struct bch_dev *ca;
421         int g;
422
423         if (!strlen(buf) || !strcmp(buf, "none")) {
424                 *v = 0;
425                 return 0;
426         }
427
428         /* Is it a device? */
429         ca = bch2_dev_lookup(c, buf);
430         if (!IS_ERR(ca)) {
431                 *v = dev_to_target(ca->dev_idx);
432                 percpu_ref_put(&ca->ref);
433                 return 0;
434         }
435
436         mutex_lock(&c->sb_lock);
437         g = bch2_disk_path_find(&c->disk_sb, buf);
438         mutex_unlock(&c->sb_lock);
439
440         if (g >= 0) {
441                 *v = group_to_target(g);
442                 return 0;
443         }
444
445         return -EINVAL;
446 }
447
448 void bch2_opt_target_to_text(struct printbuf *out,
449                              struct bch_fs *c,
450                              struct bch_sb *sb,
451                              u64 v)
452 {
453         struct target t = target_decode(v);
454
455         switch (t.type) {
456         case TARGET_NULL:
457                 pr_buf(out, "none");
458                 break;
459         case TARGET_DEV:
460                 if (c) {
461                         struct bch_dev *ca;
462
463                         rcu_read_lock();
464                         ca = t.dev < c->sb.nr_devices
465                                 ? rcu_dereference(c->devs[t.dev])
466                                 : NULL;
467
468                         if (ca && percpu_ref_tryget(&ca->io_ref)) {
469                                 char b[BDEVNAME_SIZE];
470
471                                 pr_buf(out, "/dev/%s",
472                                        bdevname(ca->disk_sb.bdev, b));
473                                 percpu_ref_put(&ca->io_ref);
474                         } else if (ca) {
475                                 pr_buf(out, "offline device %u", t.dev);
476                         } else {
477                                 pr_buf(out, "invalid device %u", t.dev);
478                         }
479
480                         rcu_read_unlock();
481                 } else {
482                         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
483                         struct bch_member *m = mi->members + t.dev;
484
485                         if (bch2_dev_exists(sb, mi, t.dev)) {
486                                 pr_buf(out, "Device ");
487                                 pr_uuid(out, m->uuid.b);
488                                 pr_buf(out, " (%u)", t.dev);
489                         } else {
490                                 pr_buf(out, "Bad device %u", t.dev);
491                         }
492                 }
493                 break;
494         case TARGET_GROUP:
495                 if (c) {
496                         mutex_lock(&c->sb_lock);
497                         bch2_disk_path_to_text(out, c->disk_sb.sb, t.group);
498                         mutex_unlock(&c->sb_lock);
499                 } else {
500                         bch2_disk_path_to_text(out, sb, t.group);
501                 }
502                 break;
503         default:
504                 BUG();
505         }
506 }