r5c_state have 4 states: * no-cache; * write-through (write journal only); * write-back (w/ write cache); * cache-broken (journal missing or Faulty) When there is functional write cache, r5c_state is a knob to switch between write-back and write-through. When the journal device is broken, the raid array is forced in readonly mode. In this case, r5c_state can be used to remove "journal feature", and thus make the array read-write without journal. By writing into r5c_cache_mode, the array can transit from cache-broken to no-cache, which removes journal feature for the array. Signed-off-by: Song Liu <songliubraving@xxxxxx> Signed-off-by: Shaohua Li <shli@xxxxxx> --- drivers/md/raid5-cache.c | 57 ++++++++++++++++++++++++++++++++++++++++++++++++ drivers/md/raid5.c | 1 + drivers/md/raid5.h | 2 ++ 3 files changed, 60 insertions(+) diff --git a/drivers/md/raid5-cache.c b/drivers/md/raid5-cache.c index cc7b80d..78eeb6df 100644 --- a/drivers/md/raid5-cache.c +++ b/drivers/md/raid5-cache.c @@ -47,6 +47,9 @@ enum r5c_state { R5C_STATE_CACHE_BROKEN = 3, }; +static char *r5c_state_str[] = {"no-cache", "write-through", + "write-back", "cache-broken"}; + struct r5l_log { struct md_rdev *rdev; @@ -1219,6 +1222,60 @@ int r5c_flush_cache(struct r5conf *conf) return count; } +ssize_t r5c_state_show(struct mddev *mddev, char *page) +{ + struct r5conf *conf = mddev->private; + int val = 0; + int ret = 0; + + if (conf->log) + val = conf->log->r5c_state; + else if (test_bit(MD_HAS_JOURNAL, &mddev->flags)) + val = R5C_STATE_CACHE_BROKEN; + ret += snprintf(page, PAGE_SIZE - ret, "%d: %s\n", + val, r5c_state_str[val]); + return ret; +} + +ssize_t r5c_state_store(struct mddev *mddev, const char *page, size_t len) +{ + struct r5conf *conf = mddev->private; + struct r5l_log *log = conf->log; + int val; + + if (kstrtoint(page, 10, &val)) + return -EINVAL; + if (!log && val != R5C_STATE_NO_CACHE) + return -EINVAL; + + if (val < R5C_STATE_NO_CACHE || val > R5C_STATE_WRITE_BACK) + return -EINVAL; + if (val == R5C_STATE_NO_CACHE) { + if (conf->log && + !test_bit(Faulty, &log->rdev->flags)) { + pr_err("md/raid:%s: journal device is in use, cannot remove it\n", + mdname(mddev)); + return -EINVAL; + } + } + + spin_lock_irq(&conf->device_lock); + if (log) + conf->log->r5c_state = val; + if (val == R5C_STATE_NO_CACHE) { + clear_bit(MD_HAS_JOURNAL, &mddev->flags); + set_bit(MD_UPDATE_SB_FLAGS, &mddev->flags); + } + spin_unlock_irq(&conf->device_lock); + pr_info("md/raid:%s: setting r5c cache mode to %d: %s\n", + mdname(mddev), val, r5c_state_str[val]); + return len; +} + +struct md_sysfs_entry +r5c_state = __ATTR(r5c_state, S_IRUGO | S_IWUSR, + r5c_state_show, r5c_state_store); + int r5c_handle_stripe_dirtying(struct r5conf *conf, struct stripe_head *sh, struct stripe_head_state *s, diff --git a/drivers/md/raid5.c b/drivers/md/raid5.c index ed6efd0..7956d13 100644 --- a/drivers/md/raid5.c +++ b/drivers/md/raid5.c @@ -6355,6 +6355,7 @@ static struct attribute *raid5_attrs[] = { &raid5_group_thread_cnt.attr, &raid5_skip_copy.attr, &raid5_rmw_level.attr, + &r5c_state.attr, NULL, }; static struct attribute_group raid5_attrs_group = { diff --git a/drivers/md/raid5.h b/drivers/md/raid5.h index e301d0e..dbc128e 100644 --- a/drivers/md/raid5.h +++ b/drivers/md/raid5.h @@ -658,4 +658,6 @@ r5c_handle_stripe_written(struct r5conf *conf, struct stripe_head *sh); extern void r5c_freeze_stripe_for_reclaim(struct stripe_head *sh); extern void r5c_do_reclaim(struct r5conf *conf); extern int r5c_flush_cache(struct r5conf *conf); +extern struct md_sysfs_entry r5c_state; + #endif -- 2.8.0.rc2 -- To unsubscribe from this list: send the line "unsubscribe linux-raid" in the body of a message to majordomo@xxxxxxxxxxxxxxx More majordomo info at http://vger.kernel.org/majordomo-info.html