]> git.sesse.net Git - bcachefs-tools-debian/blob - libbcachefs/disk_groups.c
87f3940e1df5087d3111c518505a154ad10a8acd
[bcachefs-tools-debian] / libbcachefs / disk_groups.c
1 #include "bcachefs.h"
2 #include "disk_groups.h"
3 #include "super-io.h"
4
5 #include <linux/sort.h>
6
7 static int group_cmp(const void *_l, const void *_r)
8 {
9         const struct bch_disk_group *l = _l;
10         const struct bch_disk_group *r = _r;
11
12         return ((BCH_GROUP_DELETED(l) > BCH_GROUP_DELETED(r)) -
13                 (BCH_GROUP_DELETED(l) < BCH_GROUP_DELETED(r))) ?:
14                 ((BCH_GROUP_PARENT(l) > BCH_GROUP_PARENT(r)) -
15                  (BCH_GROUP_PARENT(l) < BCH_GROUP_PARENT(r))) ?:
16                 strncmp(l->label, r->label, sizeof(l->label));
17 }
18
19 static const char *bch2_sb_disk_groups_validate(struct bch_sb *sb,
20                                                 struct bch_sb_field *f)
21 {
22         struct bch_sb_field_disk_groups *groups =
23                 field_to_type(f, disk_groups);
24         struct bch_disk_group *g, *sorted = NULL;
25         struct bch_sb_field_members *mi;
26         struct bch_member *m;
27         unsigned i, nr_groups, len;
28         const char *err = NULL;
29
30         mi              = bch2_sb_get_members(sb);
31         groups          = bch2_sb_get_disk_groups(sb);
32         nr_groups       = disk_groups_nr(groups);
33
34         for (m = mi->members;
35              m < mi->members + sb->nr_devices;
36              m++) {
37                 unsigned g;
38
39                 if (!BCH_MEMBER_GROUP(m))
40                         continue;
41
42                 g = BCH_MEMBER_GROUP(m) - 1;
43
44                 if (g >= nr_groups ||
45                     BCH_GROUP_DELETED(&groups->entries[g]))
46                         return "disk has invalid group";
47         }
48
49         if (!nr_groups)
50                 return NULL;
51
52         for (g = groups->entries;
53              g < groups->entries + nr_groups;
54              g++) {
55                 if (BCH_GROUP_DELETED(g))
56                         continue;
57
58                 len = strnlen(g->label, sizeof(g->label));
59                 if (!len) {
60                         err = "group with empty label";
61                         goto err;
62                 }
63         }
64
65         sorted = kmalloc_array(nr_groups, sizeof(*sorted), GFP_KERNEL);
66         if (!sorted)
67                 return "cannot allocate memory";
68
69         memcpy(sorted, groups->entries, nr_groups * sizeof(*sorted));
70         sort(sorted, nr_groups, sizeof(*sorted), group_cmp, NULL);
71
72         for (i = 0; i + 1 < nr_groups; i++)
73                 if (!BCH_GROUP_DELETED(sorted + i) &&
74                     !group_cmp(sorted + i, sorted + i + 1)) {
75                         err = "duplicate groups";
76                         goto err;
77                 }
78
79         err = NULL;
80 err:
81         kfree(sorted);
82         return err;
83 }
84
85 static size_t bch2_sb_disk_groups_to_text(char *buf, size_t size,
86                                         struct bch_sb *sb,
87                                         struct bch_sb_field *f)
88 {
89         char *out = buf, *end = buf + size;
90         struct bch_sb_field_disk_groups *groups =
91                 field_to_type(f, disk_groups);
92         struct bch_disk_group *g;
93         unsigned nr_groups = disk_groups_nr(groups);
94
95         for (g = groups->entries;
96              g < groups->entries + nr_groups;
97              g++) {
98                 if (g != groups->entries)
99                         out += scnprintf(out, end - out, " ");
100
101                 if (BCH_GROUP_DELETED(g))
102                         out += scnprintf(out, end - out, "[deleted]");
103                 else
104                         out += scnprintf(out, end - out,
105                                          "[parent %llu name %s]",
106                                          BCH_GROUP_PARENT(g),
107                                          g->label);
108         }
109
110         return out - buf;
111 }
112
113 const struct bch_sb_field_ops bch_sb_field_ops_disk_groups = {
114         .validate       = bch2_sb_disk_groups_validate,
115         .to_text        = bch2_sb_disk_groups_to_text
116 };
117
118 int bch2_sb_disk_groups_to_cpu(struct bch_fs *c)
119 {
120         struct bch_sb_field_members *mi;
121         struct bch_sb_field_disk_groups *groups;
122         struct bch_disk_groups_cpu *cpu_g, *old_g;
123         unsigned i, g, nr_groups;
124
125         lockdep_assert_held(&c->sb_lock);
126
127         mi              = bch2_sb_get_members(c->disk_sb.sb);
128         groups          = bch2_sb_get_disk_groups(c->disk_sb.sb);
129         nr_groups       = disk_groups_nr(groups);
130
131         if (!groups)
132                 return 0;
133
134         cpu_g = kzalloc(sizeof(*cpu_g) +
135                         sizeof(cpu_g->entries[0]) * nr_groups, GFP_KERNEL);
136         if (!cpu_g)
137                 return -ENOMEM;
138
139         cpu_g->nr = nr_groups;
140
141         for (i = 0; i < nr_groups; i++) {
142                 struct bch_disk_group *src      = &groups->entries[i];
143                 struct bch_disk_group_cpu *dst  = &cpu_g->entries[i];
144
145                 dst->deleted    = BCH_GROUP_DELETED(src);
146                 dst->parent     = BCH_GROUP_PARENT(src);
147         }
148
149         for (i = 0; i < c->disk_sb.sb->nr_devices; i++) {
150                 struct bch_member *m = mi->members + i;
151                 struct bch_disk_group_cpu *dst =
152                         &cpu_g->entries[BCH_MEMBER_GROUP(m)];
153
154                 if (!bch2_member_exists(m))
155                         continue;
156
157                 g = BCH_MEMBER_GROUP(m);
158                 while (g) {
159                         dst = &cpu_g->entries[g - 1];
160                         __set_bit(i, dst->devs.d);
161                         g = dst->parent;
162                 }
163         }
164
165         old_g = rcu_dereference_protected(c->disk_groups,
166                                 lockdep_is_held(&c->sb_lock));
167         rcu_assign_pointer(c->disk_groups, cpu_g);
168         if (old_g)
169                 kfree_rcu(old_g, rcu);
170
171         return 0;
172 }
173
174 const struct bch_devs_mask *bch2_target_to_mask(struct bch_fs *c, unsigned target)
175 {
176         struct target t = target_decode(target);
177
178         switch (t.type) {
179         case TARGET_NULL:
180                 return NULL;
181         case TARGET_DEV: {
182                 struct bch_dev *ca = t.dev < c->sb.nr_devices
183                         ? rcu_dereference(c->devs[t.dev])
184                         : NULL;
185                 return ca ? &ca->self : NULL;
186         }
187         case TARGET_GROUP: {
188                 struct bch_disk_groups_cpu *g = rcu_dereference(c->disk_groups);
189
190                 return t.group < g->nr && !g->entries[t.group].deleted
191                         ? &g->entries[t.group].devs
192                         : NULL;
193         }
194         default:
195                 BUG();
196         }
197 }
198
199 bool bch2_dev_in_target(struct bch_fs *c, unsigned dev, unsigned target)
200 {
201         struct target t = target_decode(target);
202
203         switch (t.type) {
204         case TARGET_NULL:
205                 return false;
206         case TARGET_DEV:
207                 return dev == t.dev;
208         case TARGET_GROUP: {
209                 struct bch_disk_groups_cpu *g;
210                 const struct bch_devs_mask *m;
211                 bool ret;
212
213                 rcu_read_lock();
214                 g = rcu_dereference(c->disk_groups);
215                 m = t.group < g->nr && !g->entries[t.group].deleted
216                         ? &g->entries[t.group].devs
217                         : NULL;
218
219                 ret = m ? test_bit(dev, m->d) : false;
220                 rcu_read_unlock();
221
222                 return ret;
223         }
224         default:
225                 BUG();
226         }
227 }
228
229 static int __bch2_disk_group_find(struct bch_sb_field_disk_groups *groups,
230                                   unsigned parent,
231                                   const char *name, unsigned namelen)
232 {
233         unsigned i, nr_groups = disk_groups_nr(groups);
234
235         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
236                 return -EINVAL;
237
238         for (i = 0; i < nr_groups; i++) {
239                 struct bch_disk_group *g = groups->entries + i;
240
241                 if (BCH_GROUP_DELETED(g))
242                         continue;
243
244                 if (!BCH_GROUP_DELETED(g) &&
245                     BCH_GROUP_PARENT(g) == parent &&
246                     strnlen(g->label, sizeof(g->label)) == namelen &&
247                     !memcmp(name, g->label, namelen))
248                         return i;
249         }
250
251         return -1;
252 }
253
254 static int __bch2_disk_group_add(struct bch_sb_handle *sb, unsigned parent,
255                                  const char *name, unsigned namelen)
256 {
257         struct bch_sb_field_disk_groups *groups =
258                 bch2_sb_get_disk_groups(sb->sb);
259         unsigned i, nr_groups = disk_groups_nr(groups);
260         struct bch_disk_group *g;
261
262         if (!namelen || namelen > BCH_SB_LABEL_SIZE)
263                 return -EINVAL;
264
265         for (i = 0;
266              i < nr_groups && !BCH_GROUP_DELETED(&groups->entries[i]);
267              i++)
268                 ;
269
270         if (i == nr_groups) {
271                 unsigned u64s =
272                         (sizeof(struct bch_sb_field_disk_groups) +
273                          sizeof(struct bch_disk_group) * (nr_groups + 1)) /
274                         sizeof(u64);
275
276                 groups = bch2_sb_resize_disk_groups(sb, u64s);
277                 if (!groups)
278                         return -ENOSPC;
279
280                 nr_groups = disk_groups_nr(groups);
281         }
282
283         BUG_ON(i >= nr_groups);
284
285         g = &groups->entries[i];
286
287         memcpy(g->label, name, namelen);
288         if (namelen < sizeof(g->label))
289                 g->label[namelen] = '\0';
290         SET_BCH_GROUP_DELETED(g, 0);
291         SET_BCH_GROUP_PARENT(g, parent);
292         SET_BCH_GROUP_DATA_ALLOWED(g, ~0);
293
294         return i;
295 }
296
297 int bch2_disk_path_find(struct bch_sb_handle *sb, const char *name)
298 {
299         struct bch_sb_field_disk_groups *groups =
300                 bch2_sb_get_disk_groups(sb->sb);
301         int v = -1;
302
303         do {
304                 const char *next = strchrnul(name, '.');
305                 unsigned len = next - name;
306
307                 if (*next == '.')
308                         next++;
309
310                 v = __bch2_disk_group_find(groups, v + 1, name, len);
311                 name = next;
312         } while (*name && v >= 0);
313
314         return v;
315 }
316
317 int bch2_disk_path_find_or_create(struct bch_sb_handle *sb, const char *name)
318 {
319         struct bch_sb_field_disk_groups *groups;
320         unsigned parent = 0;
321         int v = -1;
322
323         do {
324                 const char *next = strchrnul(name, '.');
325                 unsigned len = next - name;
326
327                 if (*next == '.')
328                         next++;
329
330                 groups = bch2_sb_get_disk_groups(sb->sb);
331
332                 v = __bch2_disk_group_find(groups, parent, name, len);
333                 if (v < 0)
334                         v = __bch2_disk_group_add(sb, parent, name, len);
335                 if (v < 0)
336                         return v;
337
338                 parent = v + 1;
339                 name = next;
340         } while (*name && v >= 0);
341
342         return v;
343 }
344
345 int bch2_disk_path_print(struct bch_sb_handle *sb,
346                          char *buf, size_t len, unsigned v)
347 {
348         char *out = buf, *end = out + len;
349         struct bch_sb_field_disk_groups *groups =
350                 bch2_sb_get_disk_groups(sb->sb);
351         struct bch_disk_group *g;
352         unsigned nr = 0;
353         u16 path[32];
354
355         while (1) {
356                 if (nr == ARRAY_SIZE(path))
357                         goto inval;
358
359                 if (v >= disk_groups_nr(groups))
360                         goto inval;
361
362                 g = groups->entries + v;
363
364                 if (BCH_GROUP_DELETED(g))
365                         goto inval;
366
367                 path[nr++] = v;
368
369                 if (!BCH_GROUP_PARENT(g))
370                         break;
371
372                 v = BCH_GROUP_PARENT(g) - 1;
373         }
374
375         while (nr) {
376                 unsigned b = 0;
377
378                 v = path[--nr];
379                 g = groups->entries + v;
380
381                 if (end != out)
382                         b = min_t(size_t, end - out,
383                                   strnlen(g->label, sizeof(g->label)));
384                 memcpy(out, g->label, b);
385                 if (b < end - out)
386                         out[b] = '\0';
387                 out += b;
388
389                 if (nr)
390                         out += scnprintf(out, end - out, ".");
391         }
392
393         return out - buf;
394 inval:
395         return scnprintf(buf, len, "invalid group %u", v);
396 }
397
398 int bch2_dev_group_set(struct bch_fs *c, struct bch_dev *ca, const char *name)
399 {
400         struct bch_member *mi;
401         int v = -1;
402
403         mutex_lock(&c->sb_lock);
404
405         if (!strlen(name) || !strcmp(name, "none"))
406                 goto write_sb;
407
408         v = bch2_disk_path_find_or_create(&c->disk_sb, name);
409         if (v < 0) {
410                 mutex_unlock(&c->sb_lock);
411                 return v;
412         }
413
414 write_sb:
415         mi = &bch2_sb_get_members(c->disk_sb.sb)->members[ca->dev_idx];
416         SET_BCH_MEMBER_GROUP(mi, v + 1);
417
418         bch2_write_super(c);
419         mutex_unlock(&c->sb_lock);
420
421         return 0;
422 }
423
424 int bch2_opt_target_parse(struct bch_fs *c, const char *buf, u64 *v)
425 {
426         struct bch_dev *ca;
427         int g;
428
429         if (!strlen(buf) || !strcmp(buf, "none")) {
430                 *v = 0;
431                 return 0;
432         }
433
434         /* Is it a device? */
435         ca = bch2_dev_lookup(c, buf);
436         if (!IS_ERR(ca)) {
437                 *v = dev_to_target(ca->dev_idx);
438                 percpu_ref_put(&ca->ref);
439                 return 0;
440         }
441
442         mutex_lock(&c->sb_lock);
443         g = bch2_disk_path_find(&c->disk_sb, buf);
444         mutex_unlock(&c->sb_lock);
445
446         if (g >= 0) {
447                 *v = group_to_target(g);
448                 return 0;
449         }
450
451         return -EINVAL;
452 }
453
454 int bch2_opt_target_print(struct bch_fs *c, char *buf, size_t len, u64 v)
455 {
456         struct target t = target_decode(v);
457         int ret;
458
459         switch (t.type) {
460         case TARGET_NULL:
461                 return scnprintf(buf, len, "none");
462         case TARGET_DEV: {
463                 struct bch_dev *ca;
464
465                 rcu_read_lock();
466                 ca = t.dev < c->sb.nr_devices
467                         ? rcu_dereference(c->devs[t.dev])
468                         : NULL;
469
470                 if (ca && percpu_ref_tryget(&ca->io_ref)) {
471                         char b[BDEVNAME_SIZE];
472
473                         ret = scnprintf(buf, len, "/dev/%s",
474                                         bdevname(ca->disk_sb.bdev, b));
475                         percpu_ref_put(&ca->io_ref);
476                 } else if (ca) {
477                         ret = scnprintf(buf, len, "offline device %u", t.dev);
478                 } else {
479                         ret = scnprintf(buf, len, "invalid device %u", t.dev);
480                 }
481
482                 rcu_read_unlock();
483                 break;
484         }
485         case TARGET_GROUP:
486                 mutex_lock(&c->sb_lock);
487                 ret = bch2_disk_path_print(&c->disk_sb, buf, len, t.group);
488                 mutex_unlock(&c->sb_lock);
489                 break;
490         default:
491                 BUG();
492         }
493
494         return ret;
495 }