X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Fofd%2Flproc_ofd.c;h=abc67a8b973ea26f82f86a52cd65e57198095923;hp=6b31949d7165503c95df35619896b1d598d15a9a;hb=2b905746ee3b5d9dbafcdb1af5930aea18120a7b;hpb=6794d7654b4c459519a9e6d85ed439c8c594c2e7 diff --git a/lustre/ofd/lproc_ofd.c b/lustre/ofd/lproc_ofd.c index 6b31949..abc67a8 100644 --- a/lustre/ofd/lproc_ofd.c +++ b/lustre/ofd/lproc_ofd.c @@ -15,11 +15,7 @@ * * You should have received a copy of the GNU General Public License * version 2 along with this program; If not, see - * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf - * - * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara, - * CA 95054 USA or visit www.sun.com if you need additional information or - * have any questions. + * http://www.gnu.org/licenses/gpl-2.0.html * * GPL HEADER END */ @@ -27,13 +23,20 @@ * Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved. * Use is subject to license terms. * - * Copyright (c) 2012, Intel Corporation. + * Copyright (c) 2012, 2017, Intel Corporation. */ /* * This file is part of Lustre, http://www.lustre.org/ * Lustre is a trademark of Sun Microsystems, Inc. * * lustre/ofd/lproc_ofd.c + * + * This file provides functions of procfs interface for OBD Filter Device (OFD). + * + * Author: Andreas Dilger + * Author: Mikhail Pershin + * Author: Johann Lombardi + * Author: Fan Yong */ #define DEBUG_SUBSYSTEM S_CLASS @@ -41,499 +44,897 @@ #include #include #include +#include #include "ofd_internal.h" -#ifdef LPROCFS +#ifdef CONFIG_PROC_FS -static int lprocfs_ofd_rd_seqs(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show number of FID allocation sequences. 
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t seqs_allocated_show(struct kobject *kobj, struct attribute *attr, + char *buf) { - struct obd_device *obd = (struct obd_device *)data; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - *eof = 1; - return snprintf(page, count, "%u\n", ofd->ofd_seq_count); + return sprintf(buf, "%u\n", ofd->ofd_seq_count); } +LUSTRE_RO_ATTR(seqs_allocated); -static int lprocfs_ofd_rd_tot_dirty(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show total number of grants for precreate. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t grant_precreate_show(struct kobject *kobj, + struct attribute *attr, + char *buf) { - struct obd_device *obd = (struct obd_device *)data; - struct ofd_device *ofd; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); - LASSERT(obd != NULL); - ofd = ofd_dev(obd->obd_lu_dev); - *eof = 1; - return snprintf(page, count, LPU64"\n", ofd->ofd_tot_dirty); + return sprintf(buf, "%ld\n", + obd->obd_self_export->exp_target_data.ted_grant); } +LUSTRE_RO_ATTR(grant_precreate); -static int lprocfs_ofd_rd_tot_granted(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show number of precreates allowed in a single transaction.
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t precreate_batch_show(struct kobject *kobj, + struct attribute *attr, + char *buf) { - struct obd_device *obd = (struct obd_device *)data; - struct ofd_device *ofd; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - LASSERT(obd != NULL); - ofd = ofd_dev(obd->obd_lu_dev); - *eof = 1; - return snprintf(page, count, LPU64"\n", ofd->ofd_tot_granted); + return sprintf(buf, "%d\n", ofd->ofd_precreate_batch); } -static int lprocfs_ofd_rd_tot_pending(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Change number of precreates allowed in a single transaction. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[in] buffer string which represents maximum number (1 to 65536) + * \param[in] count \a buffer length + * + * \retval \a count on success + * \retval -EINVAL if the value is outside 1..65536 + * \retval negative number on error + */ +static ssize_t precreate_batch_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = (struct obd_device *)data; - struct ofd_device *ofd; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + unsigned int val; + int rc; - LASSERT(obd != NULL); - ofd = ofd_dev(obd->obd_lu_dev); - *eof = 1; - return snprintf(page, count, LPU64"\n", ofd->ofd_tot_pending); + rc = kstrtouint(buffer, 0, &val); + if (rc) + return rc; + + if (val < 1 || val > 65536) + return -EINVAL; + + spin_lock(&ofd->ofd_batch_lock); + ofd->ofd_precreate_batch = val; + spin_unlock(&ofd->ofd_batch_lock); + return count; } +LUSTRE_RW_ATTR(precreate_batch); -static int lprocfs_ofd_rd_grant_precreate(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show
the last used ID for each FID sequence used by OFD. + * + * \param[in] m seq_file handle + * \param[in] data unused for single entry + * + * \retval 0 on success + * \retval negative value on error + */ +static int ofd_last_id_seq_show(struct seq_file *m, void *data) { - struct obd_device *obd = (struct obd_device *)data; + struct obd_device *obd = m->private; + struct ofd_device *ofd; + struct ofd_seq *oseq = NULL; + + if (obd == NULL) + return 0; + + ofd = ofd_dev(obd->obd_lu_dev); - LASSERT(obd != NULL); - *eof = 1; - return snprintf(page, count, "%ld\n", - obd->obd_self_export->exp_filter_data.fed_grant); + read_lock(&ofd->ofd_seq_list_lock); + list_for_each_entry(oseq, &ofd->ofd_seq_list, os_list) { + __u64 seq; + + seq = ostid_seq(&oseq->os_oi) == 0 ? + fid_idif_seq(ostid_id(&oseq->os_oi), + ofd->ofd_lut.lut_lsd.lsd_osd_index) : + ostid_seq(&oseq->os_oi); + seq_printf(m, DOSTID"\n", seq, ostid_id(&oseq->os_oi)); + } + read_unlock(&ofd->ofd_seq_list_lock); + return 0; } -static int lprocfs_ofd_rd_grant_ratio(char *page, char **start, off_t off, - int count, int *eof, void *data) +LPROC_SEQ_FOPS_RO(ofd_last_id); + +/** + * Show if the OFD is in degraded mode. + * + * Degraded means OFD has a failed drive or is undergoing RAID rebuild. + * The MDS will try to avoid using this OST for new object allocations + * to reduce the impact to global IO performance when clients writing to + * this OST are slowed down. It also reduces the contention on the OST + * RAID device, allowing it to rebuild more quickly. 
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t degraded_show(struct kobject *kobj, struct attribute *attr, + char *buf) { - struct obd_device *obd = (struct obd_device *)data; - struct ofd_device *ofd; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - LASSERT(obd != NULL); - ofd = ofd_dev(obd->obd_lu_dev); - *eof = 1; - return snprintf(page, count, "%d%%\n", - (int) ofd_grant_reserved(ofd, 100)); + return sprintf(buf, "%u\n", ofd->ofd_raid_degraded); } -static int lprocfs_ofd_wr_grant_ratio(struct file *file, const char *buffer, - unsigned long count, void *data) +/** + * Set OFD to degraded mode. + * + * This is used to interface to userspace administrative tools for + * the underlying RAID storage, so that they can mark an OST + * as having degraded performance. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[in] buffer string which represents mode + * 1: set degraded mode + * 0: unset degraded mode + * \param[in] count \a buffer length + * + * \retval \a count on success + * \retval negative number on error + */ +static ssize_t degraded_store(struct kobject *kobj, struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = (struct obd_device *)data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val; - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + bool val; + int rc; - rc = lprocfs_write_helper(buffer, count, &val); + rc = kstrtobool(buffer, &val); if (rc) return rc; - if (val > 100 || val < 0) - return -EINVAL; + spin_lock(&ofd->ofd_flags_lock); + ofd->ofd_raid_degraded = val; + spin_unlock(&ofd->ofd_flags_lock); + return count; +} +LUSTRE_RW_ATTR(degraded); - if (val == 0) -
CWARN("%s: disabling grant error margin\n", obd->obd_name); - if (val > 50) - CWARN("%s: setting grant error margin >50%%, be warned that " - "a huge part of the free space is now reserved for " - "grants\n", obd->obd_name); +/** + * Show OFD filesystem type. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the OSD device type name + * + * \retval number of bytes written to \a buf + */ +static ssize_t fstype_show(struct kobject *kobj, struct attribute *attr, + char *buf) +{ + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + struct lu_device *d; - spin_lock(&ofd->ofd_grant_lock); - ofd->ofd_grant_ratio = ofd_grant_ratio_conv(val); - spin_unlock(&ofd->ofd_grant_lock); - return count; + LASSERT(ofd->ofd_osd); + d = &ofd->ofd_osd->dd_lu_dev; + LASSERT(d->ld_type); + return sprintf(buf, "%s\n", d->ld_type->ldt_name); } +LUSTRE_RO_ATTR(fstype); -static int lprocfs_ofd_rd_precreate_batch(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show journal handling mode: synchronous or asynchronous. + * + * When running in asynchronous mode the journal transactions are not + * committed to disk before the RPC is replied back to the client. + * This will typically improve client performance when only a small number + * of clients are writing, since the client(s) can have more write RPCs + * in flight. However, it also means that the client has to handle recovery + * on bulk RPCs, and will have to keep more dirty pages in cache before they + * are committed on the OST.
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t sync_journal_show(struct kobject *kobj, struct attribute *attr, + char *buf) { - struct obd_device *obd = (struct obd_device *)data; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - LASSERT(obd != NULL); - *eof = 1; - return snprintf(page, count, "%d\n", ofd->ofd_precreate_batch); + return sprintf(buf, "%u\n", ofd->ofd_sync_journal); } -static int lprocfs_ofd_wr_precreate_batch(struct file *file, const char *buffer, - unsigned long count, void *data) +/** + * Set journal mode to synchronous or asynchronous. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[in] buffer string which represents mode + * 1: synchronous mode + * 0: asynchronous mode + * \param[in] count \a buffer length + * + * \retval \a count on success + * \retval negative number on error + */ +static ssize_t sync_journal_store(struct kobject *kobj, struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = (struct obd_device *)data; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val; + bool val; int rc; - rc = lprocfs_write_helper(buffer, count, &val); + rc = kstrtobool(buffer, &val); if (rc) return rc; - if (val < 1) - return -EINVAL; + spin_lock(&ofd->ofd_flags_lock); + ofd->ofd_sync_journal = val; + ofd_slc_set(ofd); + spin_unlock(&ofd->ofd_flags_lock); - spin_lock(&ofd->ofd_batch_lock); - ofd->ofd_precreate_batch = val; - spin_unlock(&ofd->ofd_batch_lock); return count; } +LUSTRE_RW_ATTR(sync_journal); -static int lprocfs_ofd_rd_last_id(char *page, char **start, off_t off, - int count, int *eof, void *data) -{ - struct obd_device *obd = data; - struct ofd_device *ofd; - struct ofd_seq
*oseq = NULL; - int retval = 0, rc; - - if (obd == NULL) - return 0; - - ofd = ofd_dev(obd->obd_lu_dev); - - read_lock(&ofd->ofd_seq_list_lock); - cfs_list_for_each_entry(oseq, &ofd->ofd_seq_list, os_list) { - rc = snprintf(page, count, DOSTID"\n", POSTID(&oseq->os_oi)); - if (rc < 0) { - retval = rc; - break; - } - page += rc; - count -= rc; - retval += rc; - } - read_unlock(&ofd->ofd_seq_list_lock); - return retval; -} - -int lprocfs_ofd_rd_fmd_max_num(char *page, char **start, off_t off, - int count, int *eof, void *data) +static int ofd_brw_size_seq_show(struct seq_file *m, void *data) { - struct obd_device *obd = data; + struct obd_device *obd = m->private; struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int rc; - rc = snprintf(page, count, "%u\n", ofd->ofd_fmd_max_num); - return rc; + seq_printf(m, "%u\n", ofd->ofd_brw_size / ONE_MB_BRW_SIZE); + return 0; } -int lprocfs_ofd_wr_fmd_max_num(struct file *file, const char *buffer, - unsigned long count, void *data) +static ssize_t +ofd_brw_size_seq_write(struct file *file, const char __user *buffer, + size_t count, loff_t *off) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val; - int rc; + struct seq_file *m = file->private_data; + struct obd_device *obd = m->private; + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + __s64 val; + int rc; - rc = lprocfs_write_helper(buffer, count, &val); + rc = lprocfs_str_with_units_to_s64(buffer, count, &val, 'M'); if (rc) return rc; - if (val > 65536 || val < 1) + if (val <= 0) return -EINVAL; - ofd->ofd_fmd_max_num = val; + if (val > DT_MAX_BRW_SIZE || + val < (1 << ofd->ofd_lut.lut_tgd.tgd_blockbits)) + return -ERANGE; + + spin_lock(&ofd->ofd_flags_lock); + ofd->ofd_brw_size = val; + spin_unlock(&ofd->ofd_flags_lock); + return count; } -int lprocfs_ofd_rd_fmd_max_age(char *page, char **start, off_t off, - int count, int *eof, void *data) +LPROC_SEQ_FOPS(ofd_brw_size); + +/** + * Show the limit of soft sync RPCs. 
+ * + * This value defines how many IO RPCs with OBD_BRW_SOFT_SYNC flag + * are allowed before sync update will be triggered. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t soft_sync_limit_show(struct kobject *kobj, + struct attribute *attr, char *buf) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - rc = snprintf(page, count, "%ld\n", ofd->ofd_fmd_max_age / CFS_HZ); - return rc; + return sprintf(buf, "%u\n", ofd->ofd_soft_sync_limit); } -int lprocfs_ofd_wr_fmd_max_age(struct file *file, const char *buffer, - unsigned long count, void *data) +/** + * Change the limit of soft sync RPCs. + * + * Define how many IO RPCs with OBD_BRW_SOFT_SYNC flag + * allowed before sync update will be done. + * + * This limit is global across all exports.
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[in] buffer string which represents limit + * \param[in] count \a buffer length + * + * \retval \a count on success + * \retval negative number on error + */ +static ssize_t soft_sync_limit_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val; - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + unsigned int val; + int rc; - rc = lprocfs_write_helper(buffer, count, &val); - if (rc) + rc = kstrtouint(buffer, 0, &val); + if (rc < 0) return rc; - if (val > 65536 || val < 1) - return -EINVAL; - - ofd->ofd_fmd_max_age = val * CFS_HZ; - return count; + ofd->ofd_soft_sync_limit = val; + /* A sysfs store must report how many bytes it consumed; returning + * 0 would make the writer retry the same data forever. + */ + return count; } +LUSTRE_RW_ATTR(soft_sync_limit); -static int lprocfs_ofd_rd_capa(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show the LFSCK speed limit. + * + * The maximum number of items scanned per second. + * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer handed to lfsck_get_speed() + * + * \retval value returned by lfsck_get_speed() + */ +static ssize_t lfsck_speed_limit_show(struct kobject *kobj, + struct attribute *attr, char *buf) { - struct obd_device *obd = data; - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - rc = snprintf(page, count, "capability on: %s\n", - obd->u.filter.fo_fl_oss_capa ? "oss" : ""); - return rc; + return lfsck_get_speed(buf, ofd->ofd_osd); } -static int lprocfs_ofd_wr_capa(struct file *file, const char *buffer, - unsigned long count, void *data) +/** + * Change the LFSCK speed limit. + * + * Limit number of items that may be scanned per second.
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[in] buffer string which represents limit + * \param[in] count \a buffer length + * + * \retval \a count on success + * \retval negative number on error + */ +static ssize_t lfsck_speed_limit_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = data; - int val, rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + unsigned int val; + int rc; - rc = lprocfs_write_helper(buffer, count, &val); - if (rc) + rc = kstrtouint(buffer, 0, &val); + if (rc != 0) return rc; - if (val & ~0x1) { - CERROR("invalid capability mode, only 0/1 are accepted.\n" - " 1: enable oss fid capability\n" - " 0: disable oss fid capability\n"); - return -EINVAL; - } + rc = lfsck_set_speed(ofd->ofd_osd, val); - obd->u.filter.fo_fl_oss_capa = val; - LCONSOLE_INFO("OSS %s %s fid capability.\n", obd->obd_name, - val ? "enabled" : "disabled"); - return count; + return rc != 0 ? rc : count; } +LUSTRE_RW_ATTR(lfsck_speed_limit); -static int lprocfs_ofd_rd_capa_count(char *page, char **start, off_t off, - int count, int *eof, void *data) +/** + * Show LFSCK layout verification stats from the most recent LFSCK run.
+ * + * \param[in] m seq_file handle + * \param[in] data unused for single entry + * + * \retval 0 on success + * \retval negative value on error + */ +static int ofd_lfsck_layout_seq_show(struct seq_file *m, void *data) { - return snprintf(page, count, "%d %d\n", - capa_count[CAPA_SITE_CLIENT], - capa_count[CAPA_SITE_SERVER]); + struct obd_device *obd = m->private; + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + + return lfsck_dump(m, ofd->ofd_osd, LFSCK_TYPE_LAYOUT); } -int lprocfs_ofd_rd_degraded(char *page, char **start, off_t off, - int count, int *eof, void *data) +LPROC_SEQ_FOPS_RO(ofd_lfsck_layout); + +/** + * Show if LFSCK performed parent FID verification. + * + * \param[in] m seq_file handle + * \param[in] data unused for single entry + * + * \retval 0 on success + * \retval negative value on error + */ +static int ofd_lfsck_verify_pfid_seq_show(struct seq_file *m, void *data) { - struct obd_device *obd = data; + struct obd_device *obd = m->private; struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - return snprintf(page, count, "%u\n", ofd->ofd_raid_degraded); + seq_printf(m, "switch: %s\ndetected: %llu\nrepaired: %llu\n", + ofd->ofd_lfsck_verify_pfid ? "on" : "off", + ofd->ofd_inconsistency_self_detected, + ofd->ofd_inconsistency_self_repaired); + return 0; } -int lprocfs_ofd_wr_degraded(struct file *file, const char *buffer, - unsigned long count, void *data) +/** + * Set the LFSCK behavior to verify parent FID correctness. + * + * If flag ofd_lfsck_verify_pfid is set then LFSCK does parent FID + * verification during read/write operations. 
+ * + * \param[in] file proc file + * \param[in] buffer string which represents behavior + * 1: verify parent FID + * 0: don't verify parent FID + * \param[in] count \a buffer length + * \param[in] off unused for single entry + * + * \retval \a count on success + * \retval negative number on error + */ +static ssize_t +ofd_lfsck_verify_pfid_seq_write(struct file *file, const char __user *buffer, + size_t count, loff_t *off) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val, rc; + struct seq_file *m = file->private_data; + struct obd_device *obd = m->private; + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + bool val; + int rc; - rc = lprocfs_write_helper(buffer, count, &val); + rc = kstrtobool_from_user(buffer, count, &val); if (rc) return rc; - spin_lock(&ofd->ofd_flags_lock); - ofd->ofd_raid_degraded = !!val; - spin_unlock(&ofd->ofd_flags_lock); + ofd->ofd_lfsck_verify_pfid = val; + if (!ofd->ofd_lfsck_verify_pfid) { + ofd->ofd_inconsistency_self_detected = 0; + ofd->ofd_inconsistency_self_repaired = 0; + } return count; } -int lprocfs_ofd_rd_fstype(char *page, char **start, off_t off, int count, - int *eof, void *data) +LPROC_SEQ_FOPS(ofd_lfsck_verify_pfid); + +static int ofd_site_stats_seq_show(struct seq_file *m, void *data) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - struct lu_device *d; + struct obd_device *obd = m->private; - LASSERT(ofd->ofd_osd); - d = &ofd->ofd_osd->dd_lu_dev; - LASSERT(d->ld_type); - return snprintf(page, count, "%s\n", d->ld_type->ldt_name); + return lu_site_stats_seq_print(obd->obd_lu_dev->ld_site, m); } -int lprocfs_ofd_rd_syncjournal(char *page, char **start, off_t off, - int count, int *eof, void *data) +LPROC_SEQ_FOPS_RO(ofd_site_stats); + +/** + * Show if the OFD enforces T10PI checksum. 
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[out] buf buffer that receives the formatted value + * + * \retval number of bytes written to \a buf + */ +static ssize_t checksum_t10pi_enforce_show(struct kobject *kobj, + struct attribute *attr, + char *buf) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - rc = snprintf(page, count, "%u\n", ofd->ofd_syncjournal); - return rc; + return sprintf(buf, "%u\n", ofd->ofd_checksum_t10pi_enforce); } -int lprocfs_ofd_wr_syncjournal(struct file *file, const char *buffer, - unsigned long count, void *data) +/** + * Force specific T10PI checksum modes to be enabled + * + * If T10PI *is* supported in hardware, allow only the supported T10PI type + * to be used. If T10PI is *not* supported by the OSD, setting the enforce + * parameter forces all T10PI types to be enabled (even if slower) for + * testing. + * + * The final determination of which algorithm to be used depends whether + * the client supports T10PI or not, and is handled at client connect time.
+ * + * \param[in] kobj kobject embedded in the OBD device (obd_kset.kobj) + * \param[in] attr unused + * \param[in] buffer string which represents mode + * 1: set T10PI checksums enforced + * 0: unset T10PI checksums enforced + * \param[in] count \a buffer length + * + * \retval \a count on success + * \retval negative number on error + */ +static ssize_t checksum_t10pi_enforce_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val; - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + bool enforce; + int rc; - rc = lprocfs_write_helper(buffer, count, &val); + rc = kstrtobool(buffer, &enforce); if (rc) return rc; - if (val < 0) - return -EINVAL; - spin_lock(&ofd->ofd_flags_lock); - ofd->ofd_syncjournal = !!val; - ofd_slc_set(ofd); + ofd->ofd_checksum_t10pi_enforce = enforce; spin_unlock(&ofd->ofd_flags_lock); - return count; } +LUSTRE_RW_ATTR(checksum_t10pi_enforce); -static char *sync_on_cancel_states[] = {"never", - "blocking", - "always" }; +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 14, 53, 0) +static bool max_file_warned; +static bool rd_cache_warned; +static bool wr_cache_warned; -int lprocfs_ofd_rd_sync_lock_cancel(char *page, char **start, off_t off, - int count, int *eof, void *data) +static ssize_t read_cache_enable_show(struct kobject *kobj, + struct attribute *attr, + char *buf) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - rc = snprintf(page, count, "%s\n", - sync_on_cancel_states[ofd->ofd_sync_lock_cancel]); - return rc; + if (!rd_cache_warned) { + rd_cache_warned = true; + pr_info("ofd: 'obdfilter.*.read_cache_enabled' is deprecated, use
'osd-*.read_cache_enabled' instead\n"); + } + + if (!ofd->ofd_read_cache_enable) + return -EOPNOTSUPP; + + return lustre_attr_show(&ofd->ofd_osd->dd_kobj, + ofd->ofd_read_cache_enable, buf); } -int lprocfs_ofd_wr_sync_lock_cancel(struct file *file, const char *buffer, - unsigned long count, void *data) +static ssize_t read_cache_enable_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val = -1; - int i; - - for (i = 0 ; i < NUM_SYNC_ON_CANCEL_STATES; i++) { - if (memcmp(buffer, sync_on_cancel_states[i], - strlen(sync_on_cancel_states[i])) == 0) { - val = i; - break; - } - } - if (val == -1) { - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - rc = lprocfs_write_helper(buffer, count, &val); - if (rc) - return rc; + if (!rd_cache_warned) { + rd_cache_warned = true; + pr_info("ofd: 'obdfilter.*.read_cache_enabled' is deprecated, use 'osd-*.read_cache_enabled' instead\n"); } - if (val < 0 || val > 2) - return -EINVAL; + if (!ofd->ofd_read_cache_enable) + return -EOPNOTSUPP; - spin_lock(&ofd->ofd_flags_lock); - ofd->ofd_sync_lock_cancel = val; - spin_unlock(&ofd->ofd_flags_lock); - return count; + return lustre_attr_store(&ofd->ofd_osd->dd_kobj, + ofd->ofd_read_cache_enable, buffer, count); } +LUSTRE_RW_ATTR(read_cache_enable); -int lprocfs_ofd_rd_grant_compat_disable(char *page, char **start, off_t off, - int count, int *eof, void *data) +static ssize_t readcache_max_filesize_show(struct kobject *kobj, + struct attribute *attr, + char *buf) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - rc = snprintf(page, count, "%u\n", ofd->ofd_grant_compat_disable); - 
return rc; + if (!max_file_warned) { + max_file_warned = true; + pr_info("ofd: 'obdfilter.*.readcache_max_filesize' is deprecated, use 'osd-*.readcache_max_filesize' instead\n"); + } + + if (!ofd->ofd_read_cache_max_filesize) + return -EOPNOTSUPP; + + return lustre_attr_show(&ofd->ofd_osd->dd_kobj, + ofd->ofd_read_cache_max_filesize, buf); } -int lprocfs_ofd_wr_grant_compat_disable(struct file *file, const char *buffer, - unsigned long count, void *data) +static ssize_t readcache_max_filesize_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - struct obd_device *obd = data; - struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - int val; - int rc; - - rc = lprocfs_write_helper(buffer, count, &val); - if (rc) - return rc; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); - if (val < 0) - return -EINVAL; + if (!max_file_warned) { + max_file_warned = true; + pr_info("ofd: 'obdfilter.*.readcache_max_filesize' is deprecated, use 'osd-*.readcache_max_filesize' instead\n"); + } - spin_lock(&ofd->ofd_flags_lock); - ofd->ofd_grant_compat_disable = !!val; - spin_unlock(&ofd->ofd_flags_lock); + if (!ofd->ofd_read_cache_max_filesize) + return -EOPNOTSUPP; - return count; + return lustre_attr_store(&ofd->ofd_osd->dd_kobj, + ofd->ofd_read_cache_max_filesize, + buffer, count); } +LUSTRE_RW_ATTR(readcache_max_filesize); -static struct lprocfs_vars lprocfs_ofd_obd_vars[] = { - { "uuid", lprocfs_rd_uuid, 0, 0 }, - { "blocksize", lprocfs_rd_blksize, 0, 0 }, - { "kbytestotal", lprocfs_rd_kbytestotal, 0, 0 }, - { "kbytesfree", lprocfs_rd_kbytesfree, 0, 0 }, - { "kbytesavail", lprocfs_rd_kbytesavail, 0, 0 }, - { "filestotal", lprocfs_rd_filestotal, 0, 0 }, - { "filesfree", lprocfs_rd_filesfree, 0, 0 }, - { "seqs_allocated", lprocfs_ofd_rd_seqs, 0, 0 }, - { "fstype", lprocfs_ofd_rd_fstype, 0, 0 }, - { "last_id", lprocfs_ofd_rd_last_id, 0, 0 }, - { "tot_dirty", 
lprocfs_ofd_rd_tot_dirty, 0, 0 }, - { "tot_pending", lprocfs_ofd_rd_tot_pending, 0, 0 }, - { "tot_granted", lprocfs_ofd_rd_tot_granted, 0, 0 }, - { "grant_precreate", lprocfs_ofd_rd_grant_precreate, 0, 0 }, - { "grant_ratio", lprocfs_ofd_rd_grant_ratio, - lprocfs_ofd_wr_grant_ratio, 0, 0 }, - { "precreate_batch", lprocfs_ofd_rd_precreate_batch, - lprocfs_ofd_wr_precreate_batch, 0 }, - { "recovery_status", lprocfs_obd_rd_recovery_status, 0, 0 }, - { "recovery_time_soft", lprocfs_obd_rd_recovery_time_soft, - lprocfs_obd_wr_recovery_time_soft, 0}, - { "recovery_time_hard", lprocfs_obd_rd_recovery_time_hard, - lprocfs_obd_wr_recovery_time_hard, 0}, - { "evict_client", 0, lprocfs_wr_evict_client, 0, - &lprocfs_evict_client_fops}, - { "num_exports", lprocfs_rd_num_exports, 0, 0 }, - { "degraded", lprocfs_ofd_rd_degraded, - lprocfs_ofd_wr_degraded, 0}, - { "sync_journal", lprocfs_ofd_rd_syncjournal, - lprocfs_ofd_wr_syncjournal, 0 }, - { "sync_on_lock_cancel", lprocfs_ofd_rd_sync_lock_cancel, - lprocfs_ofd_wr_sync_lock_cancel, 0 }, - { "instance", lprocfs_target_rd_instance, 0 }, - { "ir_factor", lprocfs_obd_rd_ir_factor, - lprocfs_obd_wr_ir_factor, 0}, - { "grant_compat_disable", lprocfs_ofd_rd_grant_compat_disable, - lprocfs_ofd_wr_grant_compat_disable, 0 }, - { "client_cache_count", lprocfs_ofd_rd_fmd_max_num, - lprocfs_ofd_wr_fmd_max_num, 0 }, - { "client_cache_seconds", lprocfs_ofd_rd_fmd_max_age, - lprocfs_ofd_wr_fmd_max_age, 0 }, - { "capa", lprocfs_ofd_rd_capa, - lprocfs_ofd_wr_capa, 0 }, - { "capa_count", lprocfs_ofd_rd_capa_count, 0, 0 }, - { "job_cleanup_interval", lprocfs_rd_job_interval, - lprocfs_wr_job_interval, 0}, - { 0 } -}; +static ssize_t writethrough_cache_enable_show(struct kobject *kobj, + struct attribute *attr, + char *buf) +{ + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); -static struct lprocfs_vars lprocfs_ofd_module_vars[] = { - { "num_refs", 
lprocfs_rd_numrefs, 0, 0 }, - { 0 } -}; + if (!wr_cache_warned) { + wr_cache_warned = true; + pr_info("ofd: 'obdfilter.*.writethrough_cache_enabled' is deprecated, use 'osd-*.writethrough_cache_enabled' instead\n"); + } -void lprocfs_ofd_init_vars(struct lprocfs_static_vars *lvars) + if (!ofd->ofd_write_cache_enable) + return -EOPNOTSUPP; + + return lustre_attr_show(&ofd->ofd_osd->dd_kobj, + ofd->ofd_write_cache_enable, buf); +} + +static ssize_t writethrough_cache_enable_store(struct kobject *kobj, + struct attribute *attr, + const char *buffer, size_t count) { - lvars->module_vars = lprocfs_ofd_module_vars; - lvars->obd_vars = lprocfs_ofd_obd_vars; + struct obd_device *obd = container_of(kobj, struct obd_device, + obd_kset.kobj); + struct ofd_device *ofd = ofd_dev(obd->obd_lu_dev); + + /* Warn once on write as well, matching the show handler and the other deprecated cache tunables. */ + if (!wr_cache_warned) { + wr_cache_warned = true; + pr_info("ofd: 'obdfilter.*.writethrough_cache_enabled' is deprecated, use 'osd-*.writethrough_cache_enabled' instead\n"); + } + + if (!ofd->ofd_write_cache_enable) + return -EOPNOTSUPP; + + return lustre_attr_store(&ofd->ofd_osd->dd_kobj, + ofd->ofd_write_cache_enable, + buffer, count); } +LUSTRE_RW_ATTR(writethrough_cache_enable); +#endif + +LPROC_SEQ_FOPS_RO_TYPE(ofd, recovery_status); +LUSTRE_RW_ATTR(recovery_time_hard); +LUSTRE_RW_ATTR(recovery_time_soft); +LUSTRE_RW_ATTR(ir_factor); + +LPROC_SEQ_FOPS_WR_ONLY(ofd, evict_client); +LPROC_SEQ_FOPS_RW_TYPE(ofd, checksum_dump); +LUSTRE_RW_ATTR(job_cleanup_interval); + +LUSTRE_RO_ATTR(tot_dirty); +LUSTRE_RO_ATTR(tot_granted); +LUSTRE_RO_ATTR(tot_pending); +LUSTRE_RW_ATTR(grant_compat_disable); +LUSTRE_RO_ATTR(instance); + +LUSTRE_RO_ATTR(num_exports); + +struct lprocfs_vars lprocfs_ofd_obd_vars[] = { + { .name = "last_id", + .fops = &ofd_last_id_fops }, + { .name = "recovery_status", + .fops = &ofd_recovery_status_fops }, + { .name = "evict_client", + .fops = &ofd_evict_client_fops }, + { .name = "brw_size", + .fops = &ofd_brw_size_fops }, + { .name = "checksum_dump", + .fops = &ofd_checksum_dump_fops }, + { .name = "lfsck_layout", + .fops = &ofd_lfsck_layout_fops }, + { .name = "lfsck_verify_pfid", + .fops = &ofd_lfsck_verify_pfid_fops }, + { .name =
"site_stats", + .fops = &ofd_site_stats_fops }, + { NULL } +}; +/** + * Initialize OFD statistics counters + * + * \param[in] stats statistics counters; must be non-NULL and hold at + * least LPROC_OFD_STATS_LAST entries (asserted) + */ void ofd_stats_counter_init(struct lprocfs_stats *stats) { - LASSERT(stats && stats->ls_num == LPROC_OFD_STATS_LAST); + LASSERT(stats && stats->ls_num >= LPROC_OFD_STATS_LAST); + lprocfs_counter_init(stats, LPROC_OFD_STATS_READ, - LPROCFS_CNTR_AVGMINMAX, "read", "bytes"); + LPROCFS_CNTR_AVGMINMAX, "read_bytes", "bytes"); lprocfs_counter_init(stats, LPROC_OFD_STATS_WRITE, - LPROCFS_CNTR_AVGMINMAX, "write", "bytes"); + LPROCFS_CNTR_AVGMINMAX, "write_bytes", "bytes"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_GETATTR, + 0, "getattr", "reqs"); lprocfs_counter_init(stats, LPROC_OFD_STATS_SETATTR, 0, "setattr", "reqs"); lprocfs_counter_init(stats, LPROC_OFD_STATS_PUNCH, 0, "punch", "reqs"); lprocfs_counter_init(stats, LPROC_OFD_STATS_SYNC, 0, "sync", "reqs"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_DESTROY, + 0, "destroy", "reqs"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_CREATE, + 0, "create", "reqs"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_STATFS, + 0, "statfs", "reqs"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_GET_INFO, + 0, "get_info", "reqs"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_SET_INFO, + 0, "set_info", "reqs"); + lprocfs_counter_init(stats, LPROC_OFD_STATS_QUOTACTL, + 0, "quotactl", "reqs"); +} + +LPROC_SEQ_FOPS(lprocfs_nid_stats_clear); + +static struct attribute *ofd_attrs[] = { + &lustre_attr_tot_dirty.attr, + &lustre_attr_tot_granted.attr, + &lustre_attr_tot_pending.attr, + &lustre_attr_grant_compat_disable.attr, + &lustre_attr_instance.attr, + &lustre_attr_recovery_time_hard.attr, + &lustre_attr_recovery_time_soft.attr, + &lustre_attr_ir_factor.attr, + &lustre_attr_num_exports.attr, + &lustre_attr_seqs_allocated.attr, + &lustre_attr_grant_precreate.attr, + &lustre_attr_precreate_batch.attr, + &lustre_attr_degraded.attr, + &lustre_attr_fstype.attr, +
&lustre_attr_sync_journal.attr, + &lustre_attr_soft_sync_limit.attr, + &lustre_attr_lfsck_speed_limit.attr, + &lustre_attr_job_cleanup_interval.attr, + &lustre_attr_checksum_t10pi_enforce.attr, +#if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(2, 14, 53, 0) + &lustre_attr_read_cache_enable.attr, + &lustre_attr_readcache_max_filesize.attr, + &lustre_attr_writethrough_cache_enable.attr, +#endif + NULL, +}; + +/** + * Initialize all needed procfs entries for OFD device. + * + * \param[in] ofd OFD device + * + * \retval 0 if successful + * \retval negative value on error + */ +int ofd_tunables_init(struct ofd_device *ofd) +{ + struct obd_device *obd = ofd_obd(ofd); + struct proc_dir_entry *entry; + int rc = 0; + + ENTRY; + /* lprocfs must be setup before the ofd so state can be safely added + * to /proc incrementally as the ofd is setup + */ + obd->obd_ktype.default_attrs = ofd_attrs; + obd->obd_vars = lprocfs_ofd_obd_vars; + rc = lprocfs_obd_setup(obd, false); + if (rc) { + CERROR("%s: lprocfs_obd_setup failed: %d.\n", + obd->obd_name, rc); + RETURN(rc); + } + + rc = tgt_tunables_init(&ofd->ofd_lut); + if (rc) { + CERROR("%s: tgt_tunables_init failed: rc = %d\n", + obd->obd_name, rc); + GOTO(obd_cleanup, rc); + } + + rc = lprocfs_alloc_obd_stats(obd, LPROC_OFD_STATS_LAST); + if (rc) { + CERROR("%s: lprocfs_alloc_obd_stats failed: %d.\n", + obd->obd_name, rc); + GOTO(tgt_cleanup, rc); + } + + entry = lprocfs_register("exports", obd->obd_proc_entry, NULL, NULL); + if (IS_ERR(entry)) { + rc = PTR_ERR(entry); + CERROR("%s: error %d setting up lprocfs for %s\n", + obd->obd_name, rc, "exports"); + GOTO(obd_free_stats, rc); + } + obd->obd_proc_exports_entry = entry; + + entry = lprocfs_add_simple(obd->obd_proc_exports_entry, "clear", + obd, &lprocfs_nid_stats_clear_fops); + if (IS_ERR(entry)) { + rc = PTR_ERR(entry); + CERROR("%s: add proc entry 'clear' failed: %d.\n", + obd->obd_name, rc); + GOTO(obd_free_stats, rc); + } + + ofd_stats_counter_init(obd->obd_stats); + + rc = 
lprocfs_job_stats_init(obd, LPROC_OFD_STATS_LAST, + ofd_stats_counter_init); + if (rc) + GOTO(obd_free_stats, rc); + + RETURN(0); + +obd_free_stats: + lprocfs_free_obd_stats(obd); +tgt_cleanup: + tgt_tunables_fini(&ofd->ofd_lut); +obd_cleanup: + lprocfs_obd_cleanup(obd); + + return rc; } -#endif /* LPROCFS */ +#endif /* CONFIG_PROC_FS */