]> git.sesse.net Git - bcachefs-tools-debian/blob - libbcachefs/disk_groups.c
Update bcachefs sources to 717b356d1d bcachefs: Convert journal validation to bkey_in...
[bcachefs-tools-debian] / libbcachefs / disk_groups.c
1 // SPDX-License-Identifier: GPL-2.0
2 #include "bcachefs.h"
3 #include "disk_groups.h"
4 #include "sb-members.h"
5 #include "super-io.h"
6
7 #include <linux/sort.h>
8
9 static int group_cmp(const void *_l, const void *_r)
10 {
11         const struct bch_disk_group *l = _l;
12         const struct bch_disk_group *r = _r;
13
14         return ((BCH_GROUP_DELETED(l) > BCH_GROUP_DELETED(r)) -
15                 (BCH_GROUP_DELETED(l) < BCH_GROUP_DELETED(r))) ?:
16                 ((BCH_GROUP_PARENT(l) > BCH_GROUP_PARENT(r)) -
17                  (BCH_GROUP_PARENT(l) < BCH_GROUP_PARENT(r))) ?:
18                 strncmp(l->label, r->label, sizeof(l->label));
19 }
20
21 static int bch2_sb_disk_groups_validate(struct bch_sb *sb,
22                                         struct bch_sb_field *f,
23                                         struct printbuf *err)
24 {
25         struct bch_sb_field_disk_groups *groups =
26                 field_to_type(f, disk_groups);
27         struct bch_disk_group *g, *sorted = NULL;
28         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
29         unsigned nr_groups = disk_groups_nr(groups);
30         unsigned i, len;
31         int ret = 0;
32
33         for (i = 0; i < sb->nr_devices; i++) {
34                 struct bch_member *m = mi->members + i;
35                 unsigned g;
36
37                 if (!BCH_MEMBER_GROUP(m))
38                         continue;
39
40                 g = BCH_MEMBER_GROUP(m) - 1;
41
42                 if (g >= nr_groups) {
43                         prt_printf(err, "disk %u has invalid label %u (have %u)",
44                                i, g, nr_groups);
45                         return -BCH_ERR_invalid_sb_disk_groups;
46                 }
47
48                 if (BCH_GROUP_DELETED(&groups->entries[g])) {
49                         prt_printf(err, "disk %u has deleted label %u", i, g);
50                         return -BCH_ERR_invalid_sb_disk_groups;
51                 }
52         }
53
54         if (!nr_groups)
55                 return 0;
56
57         for (i = 0; i < nr_groups; i++) {
58                 g = groups->entries + i;
59
60                 if (BCH_GROUP_DELETED(g))
61                         continue;
62
63                 len = strnlen(g->label, sizeof(g->label));
64                 if (!len) {
65                         prt_printf(err, "label %u empty", i);
66                         return -BCH_ERR_invalid_sb_disk_groups;
67                 }
68         }
69
70         sorted = kmalloc_array(nr_groups, sizeof(*sorted), GFP_KERNEL);
71         if (!sorted)
72                 return -BCH_ERR_ENOMEM_disk_groups_validate;
73
74         memcpy(sorted, groups->entries, nr_groups * sizeof(*sorted));
75         sort(sorted, nr_groups, sizeof(*sorted), group_cmp, NULL);
76
77         for (g = sorted; g + 1 < sorted + nr_groups; g++)
78                 if (!BCH_GROUP_DELETED(g) &&
79                     !group_cmp(&g[0], &g[1])) {
80                         prt_printf(err, "duplicate label %llu.%.*s",
81                                BCH_GROUP_PARENT(g),
82                                (int) sizeof(g->label), g->label);
83                         ret = -BCH_ERR_invalid_sb_disk_groups;
84                         goto err;
85                 }
86 err:
87         kfree(sorted);
88         return ret;
89 }
90
91 void bch2_disk_groups_to_text(struct printbuf *out, struct bch_fs *c)
92 {
93         struct bch_disk_groups_cpu *g;
94         struct bch_dev *ca;
95         int i;
96         unsigned iter;
97
98         out->atomic++;
99         rcu_read_lock();
100
101         g = rcu_dereference(c->disk_groups);
102         if (!g)
103                 goto out;
104
105         for (i = 0; i < g->nr; i++) {
106                 if (i)
107                         prt_printf(out, " ");
108
109                 if (g->entries[i].deleted) {
110                         prt_printf(out, "[deleted]");
111                         continue;
112                 }
113
114                 prt_printf(out, "[parent %d devs", g->entries[i].parent);
115                 for_each_member_device_rcu(ca, c, iter, &g->entries[i].devs)
116                         prt_printf(out, " %s", ca->name);
117                 prt_printf(out, "]");
118         }
119
120 out:
121         rcu_read_unlock();
122         out->atomic--;
123 }
124
125 static void bch2_sb_disk_groups_to_text(struct printbuf *out,
126                                         struct bch_sb *sb,
127                                         struct bch_sb_field *f)
128 {
129         struct bch_sb_field_disk_groups *groups =
130                 field_to_type(f, disk_groups);
131         struct bch_disk_group *g;
132         unsigned nr_groups = disk_groups_nr(groups);
133
134         for (g = groups->entries;
135              g < groups->entries + nr_groups;
136              g++) {
137                 if (g != groups->entries)
138                         prt_printf(out, " ");
139
140                 if (BCH_GROUP_DELETED(g))
141                         prt_printf(out, "[deleted]");
142                 else
143                         prt_printf(out, "[parent %llu name %s]",
144                                BCH_GROUP_PARENT(g), g->label);
145         }
146 }
147
148 const struct bch_sb_field_ops bch_sb_field_ops_disk_groups = {
149         .validate       = bch2_sb_disk_groups_validate,
150         .to_text        = bch2_sb_disk_groups_to_text
151 };
152
153 int bch2_sb_disk_groups_to_cpu(struct bch_fs *c)
154 {
155         struct bch_sb_field_members *mi;
156         struct bch_sb_field_disk_groups *groups;
157         struct bch_disk_groups_cpu *cpu_g, *old_g;
158         unsigned i, g, nr_groups;
159
160         lockdep_assert_held(&c->sb_lock);
161
162         mi              = bch2_sb_get_members(c->disk_sb.sb);
163         groups          = bch2_sb_get_disk_groups(c->disk_sb.sb);
164         nr_groups       = disk_groups_nr(groups);
165
166         if (!groups)
167                 return 0;
168
169         cpu_g = kzalloc(sizeof(*cpu_g) +
170                         sizeof(cpu_g->entries[0]) * nr_groups, GFP_KERNEL);
171         if (!cpu_g)
172                 return -BCH_ERR_ENOMEM_disk_groups_to_cpu;
173
174         cpu_g->nr = nr_groups;
175
176         for (i = 0; i < nr_groups; i++) {
177                 struct bch_disk_group *src      = &groups->entries[i];
178                 struct bch_disk_group_cpu *dst  = &cpu_g->entries[i];
179
180                 dst->deleted    = BCH_GROUP_DELETED(src);
181                 dst->parent     = BCH_GROUP_PARENT(src);
182         }
183
184         for (i = 0; i < c->disk_sb.sb->nr_devices; i++) {
185                 struct bch_member *m = mi->members + i;
186                 struct bch_disk_group_cpu *dst =
187                         &cpu_g->entries[BCH_MEMBER_GROUP(m)];
188
189                 if (!bch2_member_exists(m))
190                         continue;
191
192                 g = BCH_MEMBER_GROUP(m);
193                 while (g) {
194                         dst = &cpu_g->entries[g - 1];
195                         __set_bit(i, dst->devs.d);
196                         g = dst->parent;
197                 }
198         }
199
200         old_g = rcu_dereference_protected(c->disk_groups,
201                                 lockdep_is_held(&c->sb_lock));
202         rcu_assign_pointer(c->disk_groups, cpu_g);
203         if (old_g)
204                 kfree_rcu(old_g, rcu);
205
206         return 0;
207 }
208
209 const struct bch_devs_mask *bch2_target_to_mask(struct bch_fs *c, unsigned target)
210 {
211         struct target t = target_decode(target);
212         struct bch_devs_mask *devs;
213
214         rcu_read_lock();
215
216         switch (t.type) {
217         case TARGET_NULL:
218                 devs = NULL;
219                 break;
220         case TARGET_DEV: {
221                 struct bch_dev *ca = t.dev < c->sb.nr_devices
222                         ? rcu_dereference(c->devs[t.dev])
223                         : NULL;
224                 devs = ca ? &ca->self : NULL;
225                 break;
226         }
227         case TARGET_GROUP: {
228                 struct bch_disk_groups_cpu *g = rcu_dereference(c->disk_groups);
229
230                 devs = g && t.group < g->nr && !g->entries[t.group].deleted
231                         ? &g->entries[t.group].devs
232                         : NULL;
233                 break;
234         }
235         default:
236                 BUG();
237         }
238
239         rcu_read_unlock();
240
241         return devs;
242 }
243
244 bool bch2_dev_in_target(struct bch_fs *c, unsigned dev, unsigned target)
245 {
246         struct target t = target_decode(target);
247
248         switch (t.type) {
249         case TARGET_NULL:
250                 return false;
251         case TARGET_DEV:
252                 return dev == t.dev;
253         case TARGET_GROUP: {
254                 struct bch_disk_groups_cpu *g;
255                 const struct bch_devs_mask *m;
256                 bool ret;
257
258                 rcu_read_lock();
259                 g = rcu_dereference(c->disk_groups);
260                 m = g && t.group < g->nr && !g->entries[t.group].deleted
261                         ? &g->entries[t.group].devs
262                         : NULL;
263
264                 ret = m ? test_bit(dev, m->d) : false;
265                 rcu_read_unlock();
266
267                 return ret;
268         }
269         default:
270                 BUG();
271         }
272 }
273
274 static int __bch2_disk_group_find(struct bch_sb_field_disk_groups *groups,
275                                   unsigned parent,
276                                   const char *name, unsigned namelen)
277 {
278         unsigned i, nr_groups = disk_groups_nr(groups);
279
280         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
281                 return -EINVAL;
282
283         for (i = 0; i < nr_groups; i++) {
284                 struct bch_disk_group *g = groups->entries + i;
285
286                 if (BCH_GROUP_DELETED(g))
287                         continue;
288
289                 if (!BCH_GROUP_DELETED(g) &&
290                     BCH_GROUP_PARENT(g) == parent &&
291                     strnlen(g->label, sizeof(g->label)) == namelen &&
292                     !memcmp(name, g->label, namelen))
293                         return i;
294         }
295
296         return -1;
297 }
298
299 static int __bch2_disk_group_add(struct bch_sb_handle *sb, unsigned parent,
300                                  const char *name, unsigned namelen)
301 {
302         struct bch_sb_field_disk_groups *groups =
303                 bch2_sb_get_disk_groups(sb->sb);
304         unsigned i, nr_groups = disk_groups_nr(groups);
305         struct bch_disk_group *g;
306
307         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
308                 return -EINVAL;
309
310         for (i = 0;
311              i < nr_groups && !BCH_GROUP_DELETED(&groups->entries[i]);
312              i++)
313                 ;
314
315         if (i == nr_groups) {
316                 unsigned u64s =
317                         (sizeof(struct bch_sb_field_disk_groups) +
318                          sizeof(struct bch_disk_group) * (nr_groups + 1)) /
319                         sizeof(u64);
320
321                 groups = bch2_sb_resize_disk_groups(sb, u64s);
322                 if (!groups)
323                         return -BCH_ERR_ENOSPC_disk_label_add;
324
325                 nr_groups = disk_groups_nr(groups);
326         }
327
328         BUG_ON(i >= nr_groups);
329
330         g = &groups->entries[i];
331
332         memcpy(g->label, name, namelen);
333         if (namelen < sizeof(g->label))
334                 g->label[namelen] = '\0';
335         SET_BCH_GROUP_DELETED(g, 0);
336         SET_BCH_GROUP_PARENT(g, parent);
337         SET_BCH_GROUP_DATA_ALLOWED(g, ~0);
338
339         return i;
340 }
341
342 int bch2_disk_path_find(struct bch_sb_handle *sb, const char *name)
343 {
344         struct bch_sb_field_disk_groups *groups =
345                 bch2_sb_get_disk_groups(sb->sb);
346         int v = -1;
347
348         do {
349                 const char *next = strchrnul(name, '.');
350                 unsigned len = next - name;
351
352                 if (*next == '.')
353                         next++;
354
355                 v = __bch2_disk_group_find(groups, v + 1, name, len);
356                 name = next;
357         } while (*name && v >= 0);
358
359         return v;
360 }
361
362 int bch2_disk_path_find_or_create(struct bch_sb_handle *sb, const char *name)
363 {
364         struct bch_sb_field_disk_groups *groups;
365         unsigned parent = 0;
366         int v = -1;
367
368         do {
369                 const char *next = strchrnul(name, '.');
370                 unsigned len = next - name;
371
372                 if (*next == '.')
373                         next++;
374
375                 groups = bch2_sb_get_disk_groups(sb->sb);
376
377                 v = __bch2_disk_group_find(groups, parent, name, len);
378                 if (v < 0)
379                         v = __bch2_disk_group_add(sb, parent, name, len);
380                 if (v < 0)
381                         return v;
382
383                 parent = v + 1;
384                 name = next;
385         } while (*name && v >= 0);
386
387         return v;
388 }
389
390 void bch2_disk_path_to_text(struct printbuf *out, struct bch_sb *sb, unsigned v)
391 {
392         struct bch_sb_field_disk_groups *groups =
393                 bch2_sb_get_disk_groups(sb);
394         struct bch_disk_group *g;
395         unsigned nr = 0;
396         u16 path[32];
397
398         while (1) {
399                 if (nr == ARRAY_SIZE(path))
400                         goto inval;
401
402                 if (v >= disk_groups_nr(groups))
403                         goto inval;
404
405                 g = groups->entries + v;
406
407                 if (BCH_GROUP_DELETED(g))
408                         goto inval;
409
410                 path[nr++] = v;
411
412                 if (!BCH_GROUP_PARENT(g))
413                         break;
414
415                 v = BCH_GROUP_PARENT(g) - 1;
416         }
417
418         while (nr) {
419                 v = path[--nr];
420                 g = groups->entries + v;
421
422                 prt_printf(out, "%.*s", (int) sizeof(g->label), g->label);
423                 if (nr)
424                         prt_printf(out, ".");
425         }
426         return;
427 inval:
428         prt_printf(out, "invalid label %u", v);
429 }
430
431 int __bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
432 {
433         struct bch_member *mi;
434         int ret, v = -1;
435
436         if (!strlen(name) || !strcmp(name, "none"))
437                 return 0;
438
439         v = bch2_disk_path_find_or_create(&c->disk_sb, name);
440         if (v < 0)
441                 return v;
442
443         ret = bch2_sb_disk_groups_to_cpu(c);
444         if (ret)
445                 return ret;
446
447         mi = &bch2_sb_get_members(c->disk_sb.sb)->members[ca->dev_idx];
448         SET_BCH_MEMBER_GROUP(mi, v + 1);
449         return 0;
450 }
451
452 int bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
453 {
454         int ret;
455
456         mutex_lock(&c->sb_lock);
457         ret = __bch2_dev_group_set(c, ca, name) ?:
458                 bch2_write_super(c);
459         mutex_unlock(&c->sb_lock);
460
461         return ret;
462 }
463
464 int bch2_opt_target_parse(struct bch_fs *c, const char *val, u64 *res,
465                           struct printbuf *err)
466 {
467         struct bch_dev *ca;
468         int g;
469
470         if (!val)
471                 return -EINVAL;
472
473         if (!c)
474                 return 0;
475
476         if (!strlen(val) || !strcmp(val, "none")) {
477                 *res = 0;
478                 return 0;
479         }
480
481         /* Is it a device? */
482         ca = bch2_dev_lookup(c, val);
483         if (!IS_ERR(ca)) {
484                 *res = dev_to_target(ca->dev_idx);
485                 percpu_ref_put(&ca->ref);
486                 return 0;
487         }
488
489         mutex_lock(&c->sb_lock);
490         g = bch2_disk_path_find(&c->disk_sb, val);
491         mutex_unlock(&c->sb_lock);
492
493         if (g >= 0) {
494                 *res = group_to_target(g);
495                 return 0;
496         }
497
498         return -EINVAL;
499 }
500
501 void bch2_opt_target_to_text(struct printbuf *out,
502                              struct bch_fs *c,
503                              struct bch_sb *sb,
504                              u64 v)
505 {
506         struct target t = target_decode(v);
507
508         switch (t.type) {
509         case TARGET_NULL:
510                 prt_printf(out, "none");
511                 break;
512         case TARGET_DEV:
513                 if (c) {
514                         struct bch_dev *ca;
515
516                         rcu_read_lock();
517                         ca = t.dev < c->sb.nr_devices
518                                 ? rcu_dereference(c->devs[t.dev])
519                                 : NULL;
520
521                         if (ca && percpu_ref_tryget(&ca->io_ref)) {
522                                 prt_printf(out, "/dev/%pg", ca->disk_sb.bdev);
523                                 percpu_ref_put(&ca->io_ref);
524                         } else if (ca) {
525                                 prt_printf(out, "offline device %u", t.dev);
526                         } else {
527                                 prt_printf(out, "invalid device %u", t.dev);
528                         }
529
530                         rcu_read_unlock();
531                 } else {
532                         struct bch_sb_field_members *mi = bch2_sb_get_members(sb);
533                         struct bch_member *m = mi->members + t.dev;
534
535                         if (bch2_dev_exists(sb, mi, t.dev)) {
536                                 prt_printf(out, "Device ");
537                                 pr_uuid(out, m->uuid.b);
538                                 prt_printf(out, " (%u)", t.dev);
539                         } else {
540                                 prt_printf(out, "Bad device %u", t.dev);
541                         }
542                 }
543                 break;
544         case TARGET_GROUP:
545                 if (c) {
546                         mutex_lock(&c->sb_lock);
547                         bch2_disk_path_to_text(out, c->disk_sb.sb, t.group);
548                         mutex_unlock(&c->sb_lock);
549                 } else {
550                         bch2_disk_path_to_text(out, sb, t.group);
551                 }
552                 break;
553         default:
554                 BUG();
555         }
556 }