]> git.sesse.net Git - bcachefs-tools-debian/blobdiff - libbcachefs/sysfs.c
check if fs is mounted before running fsck
[bcachefs-tools-debian] / libbcachefs / sysfs.c
index 4987ee76a08cbdeb4153b04990941643bda39e0d..a6d70ce524e91042ca3d426ca99c97f1f50dc1c2 100644 (file)
@@ -8,8 +8,7 @@
 #ifndef NO_BCACHEFS_SYSFS
 
 #include "bcachefs.h"
-#include "alloc.h"
-#include "compress.h"
+#include "alloc_background.h"
 #include "sysfs.h"
 #include "btree_cache.h"
 #include "btree_io.h"
@@ -19,6 +18,7 @@
 #include "btree_gc.h"
 #include "buckets.h"
 #include "disk_groups.h"
+#include "ec.h"
 #include "inode.h"
 #include "journal.h"
 #include "keylist.h"
@@ -72,9 +72,10 @@ do {                                                                 \
 #define sysfs_hprint(file, val)                                                \
 do {                                                                   \
        if (attr == &sysfs_ ## file) {                                  \
-               ssize_t ret = bch2_hprint(buf, val);                    \
-               strcat(buf, "\n");                                      \
-               return ret + 1;                                         \
+               struct printbuf out = _PBUF(buf, PAGE_SIZE);            \
+               bch2_hprint(&out, val);                                 \
+               pr_buf(&out, "\n");                                     \
+               return out.pos - buf;                                   \
        }                                                               \
 } while (0)
 
@@ -131,6 +132,7 @@ do {                                                                        \
 write_attribute(trigger_journal_flush);
 write_attribute(trigger_btree_coalesce);
 write_attribute(trigger_gc);
+write_attribute(trigger_alloc_write);
 write_attribute(prune_cache);
 rw_attribute(btree_gc_periodic);
 
@@ -188,6 +190,8 @@ sysfs_pd_controller_attribute(rebalance);
 read_attribute(rebalance_work);
 rw_attribute(promote_whole_extents);
 
+read_attribute(new_stripes);
+
 rw_attribute(pd_controllers_update_seconds);
 
 read_attribute(meta_replicas_have);
@@ -229,41 +233,50 @@ static size_t bch2_btree_cache_size(struct bch_fs *c)
 
 static ssize_t show_fs_alloc_debug(struct bch_fs *c, char *buf)
 {
-       struct bch_fs_usage stats = bch2_fs_usage_read(c);
+       struct printbuf out = _PBUF(buf, PAGE_SIZE);
+       struct bch_fs_usage *fs_usage = bch2_fs_usage_read(c);
+       unsigned i;
 
-       return scnprintf(buf, PAGE_SIZE,
-                        "capacity:\t\t%llu\n"
-                        "1 replicas:\n"
-                        "\tmeta:\t\t%llu\n"
-                        "\tdirty:\t\t%llu\n"
-                        "\treserved:\t%llu\n"
-                        "2 replicas:\n"
-                        "\tmeta:\t\t%llu\n"
-                        "\tdirty:\t\t%llu\n"
-                        "\treserved:\t%llu\n"
-                        "3 replicas:\n"
-                        "\tmeta:\t\t%llu\n"
-                        "\tdirty:\t\t%llu\n"
-                        "\treserved:\t%llu\n"
-                        "4 replicas:\n"
-                        "\tmeta:\t\t%llu\n"
-                        "\tdirty:\t\t%llu\n"
-                        "\treserved:\t%llu\n"
-                        "online reserved:\t%llu\n",
-                        c->capacity,
-                        stats.s[0].data[S_META],
-                        stats.s[0].data[S_DIRTY],
-                        stats.s[0].persistent_reserved,
-                        stats.s[1].data[S_META],
-                        stats.s[1].data[S_DIRTY],
-                        stats.s[1].persistent_reserved,
-                        stats.s[2].data[S_META],
-                        stats.s[2].data[S_DIRTY],
-                        stats.s[2].persistent_reserved,
-                        stats.s[3].data[S_META],
-                        stats.s[3].data[S_DIRTY],
-                        stats.s[3].persistent_reserved,
-                        stats.online_reserved);
+       if (!fs_usage)
+               return -ENOMEM;
+
+       pr_buf(&out, "capacity:\t\t\t%llu\n", c->capacity);
+
+       pr_buf(&out, "hidden:\t\t\t\t%llu\n",
+              fs_usage->hidden);
+       pr_buf(&out, "data:\t\t\t\t%llu\n",
+              fs_usage->data);
+       pr_buf(&out, "cached:\t\t\t\t%llu\n",
+              fs_usage->cached);
+       pr_buf(&out, "reserved:\t\t\t%llu\n",
+              fs_usage->reserved);
+       pr_buf(&out, "nr_inodes:\t\t\t%llu\n",
+              fs_usage->nr_inodes);
+       pr_buf(&out, "online reserved:\t\t%llu\n",
+              fs_usage->online_reserved);
+
+       for (i = 0;
+            i < ARRAY_SIZE(fs_usage->persistent_reserved);
+            i++) {
+               pr_buf(&out, "%u replicas:\n", i + 1);
+               pr_buf(&out, "\treserved:\t\t%llu\n",
+                      fs_usage->persistent_reserved[i]);
+       }
+
+       for (i = 0; i < c->replicas.nr; i++) {
+               struct bch_replicas_entry *e =
+                       cpu_replicas_entry(&c->replicas, i);
+
+               pr_buf(&out, "\t");
+               bch2_replicas_entry_to_text(&out, e);
+               pr_buf(&out, ":\t%llu\n", fs_usage->replicas[i]);
+       }
+
+       percpu_up_read_preempt_enable(&c->mark_lock);
+
+       kfree(fs_usage);
+
+       return out.pos - buf;
 }
 
 static ssize_t bch2_compression_stats(struct bch_fs *c, char *buf)
@@ -275,25 +288,25 @@ static ssize_t bch2_compression_stats(struct bch_fs *c, char *buf)
            compressed_sectors_compressed = 0,
            compressed_sectors_uncompressed = 0;
 
-       if (!bch2_fs_running(c))
+       if (!test_bit(BCH_FS_STARTED, &c->flags))
                return -EPERM;
 
        for_each_btree_key(&iter, c, BTREE_ID_EXTENTS, POS_MIN, 0, k)
-               if (k.k->type == BCH_EXTENT) {
+               if (k.k->type == KEY_TYPE_extent) {
                        struct bkey_s_c_extent e = bkey_s_c_to_extent(k);
-                       const struct bch_extent_ptr *ptr;
-                       struct bch_extent_crc_unpacked crc;
+                       const union bch_extent_entry *entry;
+                       struct extent_ptr_decoded p;
 
-                       extent_for_each_ptr_crc(e, ptr, crc) {
-                               if (crc.compression_type == BCH_COMPRESSION_NONE) {
+                       extent_for_each_ptr_decode(e, p, entry) {
+                               if (p.crc.compression_type == BCH_COMPRESSION_NONE) {
                                        nr_uncompressed_extents++;
                                        uncompressed_sectors += e.k->size;
                                } else {
                                        nr_compressed_extents++;
                                        compressed_sectors_compressed +=
-                                               crc.compressed_size;
+                                               p.crc.compressed_size;
                                        compressed_sectors_uncompressed +=
-                                               crc.uncompressed_size;
+                                               p.crc.uncompressed_size;
                                }
 
                                /* only looking at the first ptr */
@@ -317,6 +330,41 @@ static ssize_t bch2_compression_stats(struct bch_fs *c, char *buf)
                        compressed_sectors_uncompressed << 9);
 }
 
+static ssize_t bch2_new_stripes(struct bch_fs *c, char *buf)
+{
+       char *out = buf, *end = buf + PAGE_SIZE;
+       struct ec_stripe_head *h;
+       struct ec_stripe_new *s;
+
+       mutex_lock(&c->ec_new_stripe_lock);
+       list_for_each_entry(h, &c->ec_new_stripe_list, list) {
+               out += scnprintf(out, end - out,
+                                "target %u algo %u redundancy %u:\n",
+                                h->target, h->algo, h->redundancy);
+
+               if (h->s)
+                       out += scnprintf(out, end - out,
+                                        "\tpending: blocks %u allocated %u\n",
+                                        h->s->blocks.nr,
+                                        bitmap_weight(h->s->blocks_allocated,
+                                                      h->s->blocks.nr));
+
+               mutex_lock(&h->lock);
+               list_for_each_entry(s, &h->stripes, list)
+                       out += scnprintf(out, end - out,
+                                        "\tin flight: blocks %u allocated %u pin %u\n",
+                                        s->blocks.nr,
+                                        bitmap_weight(s->blocks_allocated,
+                                                      s->blocks.nr),
+                                        atomic_read(&s->pin));
+               mutex_unlock(&h->lock);
+
+       }
+       mutex_unlock(&c->ec_new_stripe_lock);
+
+       return out - buf;
+}
+
 SHOW(bch2_fs)
 {
        struct bch_fs *c = container_of(kobj, struct bch_fs, kobj);
@@ -353,8 +401,8 @@ SHOW(bch2_fs)
 
        sysfs_print(promote_whole_extents,      c->promote_whole_extents);
 
-       sysfs_printf(meta_replicas_have, "%u",  bch2_replicas_online(c, true));
-       sysfs_printf(data_replicas_have, "%u",  bch2_replicas_online(c, false));
+       sysfs_printf(meta_replicas_have, "%i",  bch2_replicas_online(c, true));
+       sysfs_printf(data_replicas_have, "%i",  bch2_replicas_online(c, false));
 
        /* Debugging: */
 
@@ -376,6 +424,9 @@ SHOW(bch2_fs)
        if (attr == &sysfs_compression_stats)
                return bch2_compression_stats(c, buf);
 
+       if (attr == &sysfs_new_stripes)
+               return bch2_new_stripes(c, buf);
+
 #define BCH_DEBUG_PARAM(name, description) sysfs_print(name, c->name);
        BCH_DEBUG_PARAMS()
 #undef BCH_DEBUG_PARAM
@@ -430,7 +481,7 @@ STORE(__bch2_fs)
        BCH_DEBUG_PARAMS()
 #undef BCH_DEBUG_PARAM
 
-       if (!bch2_fs_running(c))
+       if (!test_bit(BCH_FS_STARTED, &c->flags))
                return -EPERM;
 
        /* Debugging: */
@@ -442,7 +493,13 @@ STORE(__bch2_fs)
                bch2_coalesce(c);
 
        if (attr == &sysfs_trigger_gc)
-               bch2_gc(c);
+               bch2_gc(c, NULL, false);
+
+       if (attr == &sysfs_trigger_alloc_write) {
+               bool wrote;
+
+               bch2_alloc_write(c, false, &wrote);
+       }
 
        if (attr == &sysfs_prune_cache) {
                struct shrink_control sc;
@@ -536,6 +593,7 @@ struct attribute *bch2_fs_internal_files[] = {
        &sysfs_trigger_journal_flush,
        &sysfs_trigger_btree_coalesce,
        &sysfs_trigger_gc,
+       &sysfs_trigger_alloc_write,
        &sysfs_prune_cache,
 
        &sysfs_copy_gc_enabled,
@@ -544,6 +602,8 @@ struct attribute *bch2_fs_internal_files[] = {
        &sysfs_rebalance_work,
        sysfs_pd_controller_files(rebalance),
 
+       &sysfs_new_stripes,
+
        &sysfs_internal_uuid,
 
 #define BCH_DEBUG_PARAM(name, description) &sysfs_##name,
@@ -557,16 +617,16 @@ struct attribute *bch2_fs_internal_files[] = {
 
 SHOW(bch2_fs_opts_dir)
 {
-       char *out = buf, *end = buf + PAGE_SIZE;
+       struct printbuf out = _PBUF(buf, PAGE_SIZE);
        struct bch_fs *c = container_of(kobj, struct bch_fs, opts_dir);
        const struct bch_option *opt = container_of(attr, struct bch_option, attr);
        int id = opt - bch2_opt_table;
        u64 v = bch2_opt_get_by_id(&c->opts, id);
 
-       out += bch2_opt_to_text(c, out, end - out, opt, v, OPT_SHOW_FULL_LIST);
-       out += scnprintf(out, end - out, "\n");
+       bch2_opt_to_text(&out, c, opt, v, OPT_SHOW_FULL_LIST);
+       pr_buf(&out, "\n");
 
-       return out - buf;
+       return out.pos - buf;
 }
 
 STORE(bch2_fs_opts_dir)
@@ -587,14 +647,9 @@ STORE(bch2_fs_opts_dir)
        if (ret < 0)
                return ret;
 
-       if (id == Opt_compression ||
-           id == Opt_background_compression) {
-               int ret = bch2_check_set_has_compressed_data(c, v);
-               if (ret) {
-                       mutex_unlock(&c->sb_lock);
-                       return ret;
-               }
-       }
+       ret = bch2_opt_check_may_set(c, id, v);
+       if (ret < 0)
+               return ret;
 
        if (opt->set_sb != SET_NO_SB_OPT) {
                mutex_lock(&c->sb_lock);
@@ -625,7 +680,7 @@ int bch2_opts_create_sysfs_files(struct kobject *kobj)
        for (i = bch2_opt_table;
             i < bch2_opt_table + bch2_opts_nr;
             i++) {
-               if (i->mode == OPT_INTERNAL)
+               if (!(i->mode & (OPT_FORMAT|OPT_MOUNT|OPT_RUNTIME)))
                        continue;
 
                ret = sysfs_create_file(kobj, &i->attr);
@@ -740,31 +795,35 @@ static ssize_t show_quantiles(struct bch_fs *c, struct bch_dev *ca,
 
 static ssize_t show_reserve_stats(struct bch_dev *ca, char *buf)
 {
+       struct printbuf out = _PBUF(buf, PAGE_SIZE);
        enum alloc_reserve i;
-       ssize_t ret;
 
        spin_lock(&ca->freelist_lock);
 
-       ret = scnprintf(buf, PAGE_SIZE,
-                       "free_inc:\t%zu\t%zu\n",
-                       fifo_used(&ca->free_inc),
-                       ca->free_inc.size);
+       pr_buf(&out, "free_inc:\t%zu\t%zu\n",
+              fifo_used(&ca->free_inc),
+              ca->free_inc.size);
 
        for (i = 0; i < RESERVE_NR; i++)
-               ret += scnprintf(buf + ret, PAGE_SIZE - ret,
-                                "free[%u]:\t%zu\t%zu\n", i,
-                                fifo_used(&ca->free[i]),
-                                ca->free[i].size);
+               pr_buf(&out, "free[%u]:\t%zu\t%zu\n", i,
+                      fifo_used(&ca->free[i]),
+                      ca->free[i].size);
 
        spin_unlock(&ca->freelist_lock);
 
-       return ret;
+       return out.pos - buf;
 }
 
 static ssize_t show_dev_alloc_debug(struct bch_dev *ca, char *buf)
 {
        struct bch_fs *c = ca->fs;
        struct bch_dev_usage stats = bch2_dev_usage_read(c, ca);
+       unsigned i, nr[BCH_DATA_NR];
+
+       memset(nr, 0, sizeof(nr));
+
+       for (i = 0; i < ARRAY_SIZE(c->open_buckets); i++)
+               nr[c->open_buckets[i].type]++;
 
        return scnprintf(buf, PAGE_SIZE,
                "free_inc:               %zu/%zu\n"
@@ -779,16 +838,22 @@ static ssize_t show_dev_alloc_debug(struct bch_dev *ca, char *buf)
                "    meta:               %llu\n"
                "    user:               %llu\n"
                "    cached:             %llu\n"
-               "    available:          %llu\n"
+               "    erasure coded:      %llu\n"
+               "    available:          %lli\n"
                "sectors:\n"
                "    sb:                 %llu\n"
                "    journal:            %llu\n"
                "    meta:               %llu\n"
                "    user:               %llu\n"
                "    cached:             %llu\n"
+               "    fragmented:         %llu\n"
+               "    copygc threshold:   %llu\n"
                "freelist_wait:          %s\n"
                "open buckets:           %u/%u (reserved %u)\n"
-               "open_buckets_wait:      %s\n",
+               "open_buckets_wait:      %s\n"
+               "open_buckets_btree:     %u\n"
+               "open_buckets_user:      %u\n"
+               "btree reserve cache:    %u\n",
                fifo_used(&ca->free_inc),               ca->free_inc.size,
                fifo_used(&ca->free[RESERVE_BTREE]),    ca->free[RESERVE_BTREE].size,
                fifo_used(&ca->free[RESERVE_MOVINGGC]), ca->free[RESERVE_MOVINGGC].size,
@@ -800,15 +865,22 @@ static ssize_t show_dev_alloc_debug(struct bch_dev *ca, char *buf)
                stats.buckets[BCH_DATA_BTREE],
                stats.buckets[BCH_DATA_USER],
                stats.buckets[BCH_DATA_CACHED],
-               __dev_buckets_available(ca, stats),
+               stats.buckets_ec,
+               ca->mi.nbuckets - ca->mi.first_bucket - stats.buckets_unavailable,
                stats.sectors[BCH_DATA_SB],
                stats.sectors[BCH_DATA_JOURNAL],
                stats.sectors[BCH_DATA_BTREE],
                stats.sectors[BCH_DATA_USER],
                stats.sectors[BCH_DATA_CACHED],
+               stats.sectors_fragmented,
+               ca->copygc_threshold,
                c->freelist_wait.list.first             ? "waiting" : "empty",
-               c->open_buckets_nr_free, OPEN_BUCKETS_COUNT, BTREE_NODE_RESERVE,
-               c->open_buckets_wait.list.first         ? "waiting" : "empty");
+               c->open_buckets_nr_free, OPEN_BUCKETS_COUNT,
+               BTREE_NODE_OPEN_BUCKET_RESERVE,
+               c->open_buckets_wait.list.first         ? "waiting" : "empty",
+               nr[BCH_DATA_BTREE],
+               nr[BCH_DATA_USER],
+               c->btree_reserve_cache_nr);
 }
 
 static const char * const bch2_rw[] = {
@@ -819,31 +891,26 @@ static const char * const bch2_rw[] = {
 
 static ssize_t show_dev_iodone(struct bch_dev *ca, char *buf)
 {
-       char *out = buf, *end = buf + PAGE_SIZE;
-       int rw, i, cpu;
+       struct printbuf out = _PBUF(buf, PAGE_SIZE);
+       int rw, i;
 
        for (rw = 0; rw < 2; rw++) {
-               out += scnprintf(out, end - out, "%s:\n", bch2_rw[rw]);
+               pr_buf(&out, "%s:\n", bch2_rw[rw]);
 
-               for (i = 1; i < BCH_DATA_NR; i++) {
-                       u64 n = 0;
-
-                       for_each_possible_cpu(cpu)
-                               n += per_cpu_ptr(ca->io_done, cpu)->sectors[rw][i];
-
-                       out += scnprintf(out, end - out, "%-12s:%12llu\n",
-                                        bch2_data_types[i], n << 9);
-               }
+               for (i = 1; i < BCH_DATA_NR; i++)
+                       pr_buf(&out, "%-12s:%12llu\n",
+                              bch2_data_types[i],
+                              percpu_u64_get(&ca->io_done->sectors[rw][i]) << 9);
        }
 
-       return out - buf;
+       return out.pos - buf;
 }
 
 SHOW(bch2_dev)
 {
        struct bch_dev *ca = container_of(kobj, struct bch_dev, kobj);
        struct bch_fs *c = ca->fs;
-       char *out = buf, *end = buf + PAGE_SIZE;
+       struct printbuf out = _PBUF(buf, PAGE_SIZE);
 
        sysfs_printf(uuid,              "%pU\n", ca->uuid.b);
 
@@ -857,41 +924,39 @@ SHOW(bch2_dev)
        if (attr == &sysfs_label) {
                if (ca->mi.group) {
                        mutex_lock(&c->sb_lock);
-                       out += bch2_disk_path_print(&c->disk_sb, out, end - out,
-                                                   ca->mi.group - 1);
+                       bch2_disk_path_to_text(&out, &c->disk_sb,
+                                              ca->mi.group - 1);
                        mutex_unlock(&c->sb_lock);
                } else {
-                       out += scnprintf(out, end - out, "none");
+                       pr_buf(&out, "none");
                }
 
-               out += scnprintf(out, end - out, "\n");
-               return out - buf;
+               pr_buf(&out, "\n");
+               return out.pos - buf;
        }
 
        if (attr == &sysfs_has_data) {
-               out += bch2_scnprint_flag_list(out, end - out,
-                                              bch2_data_types,
-                                              bch2_dev_has_data(c, ca));
-               out += scnprintf(out, end - out, "\n");
-               return out - buf;
+               bch2_flags_to_text(&out, bch2_data_types,
+                                  bch2_dev_has_data(c, ca));
+               pr_buf(&out, "\n");
+               return out.pos - buf;
        }
 
        sysfs_pd_controller_show(copy_gc, &ca->copygc_pd);
 
        if (attr == &sysfs_cache_replacement_policy) {
-               out += bch2_scnprint_string_list(out, end - out,
-                                                bch2_cache_replacement_policies,
-                                                ca->mi.replacement);
-               out += scnprintf(out, end - out, "\n");
-               return out - buf;
+               bch2_string_opt_to_text(&out,
+                                       bch2_cache_replacement_policies,
+                                       ca->mi.replacement);
+               pr_buf(&out, "\n");
+               return out.pos - buf;
        }
 
        if (attr == &sysfs_state_rw) {
-               out += bch2_scnprint_string_list(out, end - out,
-                                                bch2_dev_state,
-                                                ca->mi.state);
-               out += scnprintf(out, end - out, "\n");
-               return out - buf;
+               bch2_string_opt_to_text(&out, bch2_dev_state,
+                                       ca->mi.state);
+               pr_buf(&out, "\n");
+               return out.pos - buf;
        }
 
        if (attr == &sysfs_iodone)