4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.gnu.org/licenses/gpl-2.0.html
23 * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2011, 2017, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
30 * Lustre is a trademark of Sun Microsystems, Inc.
32 * lustre/obdclass/lprocfs_status.c
34 * Author: Hariharan Thantry <thantry@users.sourceforge.net>
37 #define DEBUG_SUBSYSTEM S_CLASS
39 #include <obd_class.h>
40 #include <lprocfs_status.h>
44 static int lprocfs_no_percpu_stats = 0;
45 module_param(lprocfs_no_percpu_stats, int, 0644);
46 MODULE_PARM_DESC(lprocfs_no_percpu_stats, "Do not alloc percpu data for lprocfs stats");
48 #define MAX_STRING_SIZE 128
50 int lprocfs_single_release(struct inode *inode, struct file *file)
52 return single_release(inode, file);
54 EXPORT_SYMBOL(lprocfs_single_release);
56 int lprocfs_seq_release(struct inode *inode, struct file *file)
58 return seq_release(inode, file);
60 EXPORT_SYMBOL(lprocfs_seq_release);
62 struct dentry *ldebugfs_add_simple(struct dentry *root,
63 char *name, void *data,
64 const struct file_operations *fops)
69 if (!root || !name || !fops)
70 return ERR_PTR(-EINVAL);
76 entry = debugfs_create_file(name, mode, root, data, fops);
77 if (IS_ERR_OR_NULL(entry)) {
78 CERROR("LprocFS: No memory to create <debugfs> entry %s", name);
79 return entry ?: ERR_PTR(-ENOMEM);
83 EXPORT_SYMBOL(ldebugfs_add_simple);
85 struct proc_dir_entry *
86 lprocfs_add_simple(struct proc_dir_entry *root, char *name,
87 void *data, const struct file_operations *fops)
89 struct proc_dir_entry *proc;
92 if (!root || !name || !fops)
93 return ERR_PTR(-EINVAL);
99 proc = proc_create_data(name, mode, root, fops, data);
101 CERROR("LprocFS: No memory to create /proc entry %s\n",
103 return ERR_PTR(-ENOMEM);
107 EXPORT_SYMBOL(lprocfs_add_simple);
109 struct proc_dir_entry *lprocfs_add_symlink(const char *name,
110 struct proc_dir_entry *parent,
111 const char *format, ...)
113 struct proc_dir_entry *entry;
117 if (!parent || !format)
120 OBD_ALLOC_WAIT(dest, MAX_STRING_SIZE + 1);
124 va_start(ap, format);
125 vsnprintf(dest, MAX_STRING_SIZE, format, ap);
128 entry = proc_symlink(name, parent, dest);
130 CERROR("LprocFS: Could not create symbolic link from "
131 "%s to %s\n", name, dest);
133 OBD_FREE(dest, MAX_STRING_SIZE + 1);
136 EXPORT_SYMBOL(lprocfs_add_symlink);
138 static const struct file_operations lprocfs_generic_fops = { };
140 int ldebugfs_add_vars(struct dentry *parent, struct lprocfs_vars *list,
143 if (IS_ERR_OR_NULL(parent) || IS_ERR_OR_NULL(list))
147 struct dentry *entry;
150 if (list->proc_mode != 0000) {
151 mode = list->proc_mode;
152 } else if (list->fops) {
153 if (list->fops->read)
155 if (list->fops->write)
158 entry = debugfs_create_file(list->name, mode, parent,
160 list->fops ? : &lprocfs_generic_fops);
161 if (IS_ERR_OR_NULL(entry))
162 return entry ? PTR_ERR(entry) : -ENOMEM;
167 EXPORT_SYMBOL_GPL(ldebugfs_add_vars);
172 * \param root [in] The parent proc entry on which new entry will be added.
173 * \param list [in] Array of proc entries to be added.
174 * \param data [in] The argument to be passed when entries read/write routines
175 * are called through /proc file.
177 * \retval 0 on success
181 lprocfs_add_vars(struct proc_dir_entry *root, struct lprocfs_vars *list,
188 struct proc_dir_entry *proc;
191 if (list->proc_mode != 0000) {
192 mode = list->proc_mode;
193 } else if (list->fops) {
194 if (list->fops->read)
196 if (list->fops->write)
199 proc = proc_create_data(list->name, mode, root,
200 list->fops ?: &lprocfs_generic_fops,
208 EXPORT_SYMBOL(lprocfs_add_vars);
210 void ldebugfs_remove(struct dentry **entryp)
212 debugfs_remove_recursive(*entryp);
215 EXPORT_SYMBOL_GPL(ldebugfs_remove);
217 #ifndef HAVE_REMOVE_PROC_SUBTREE
218 /* for b=10866, global variable */
219 DECLARE_RWSEM(_lprocfs_lock);
220 EXPORT_SYMBOL(_lprocfs_lock);
222 static void lprocfs_remove_nolock(struct proc_dir_entry **proot)
224 struct proc_dir_entry *root = *proot;
225 struct proc_dir_entry *temp = root;
226 struct proc_dir_entry *rm_entry;
227 struct proc_dir_entry *parent;
230 if (!root || IS_ERR(root))
233 parent = root->parent;
234 LASSERT(parent != NULL);
244 * Memory corruption once caused this to fail, and
245 * without this LASSERT we would loop here forever.
247 LASSERTF(strlen(rm_entry->name) == rm_entry->namelen,
248 "0x%p %s/%s len %d\n", rm_entry, temp->name,
249 rm_entry->name, (int)strlen(rm_entry->name));
251 remove_proc_entry(rm_entry->name, temp);
257 int remove_proc_subtree(const char *name, struct proc_dir_entry *parent)
259 struct proc_dir_entry *t = NULL;
260 struct proc_dir_entry **p;
263 LASSERT(parent != NULL);
266 down_write(&_lprocfs_lock);
267 /* lookup target name */
268 for (p = &parent->subdir; *p; p = &(*p)->next) {
269 if ((*p)->namelen != len)
271 if (memcmp(name, (*p)->name, len))
278 /* verify it's empty: do not count "num_refs" */
279 for (p = &t->subdir; *p; p = &(*p)->next) {
280 if ((*p)->namelen != strlen("num_refs")) {
284 if (memcmp("num_refs", (*p)->name,
285 strlen("num_refs"))) {
293 lprocfs_remove_nolock(&t);
295 up_write(&_lprocfs_lock);
298 #endif /* !HAVE_REMOVE_PROC_SUBTREE */
300 #ifndef HAVE_PROC_REMOVE
301 void proc_remove(struct proc_dir_entry *de)
303 #ifndef HAVE_REMOVE_PROC_SUBTREE
304 down_write(&_lprocfs_lock); /* search vs remove race */
305 lprocfs_remove_nolock(&de);
306 up_write(&_lprocfs_lock);
309 remove_proc_subtree(de->name, de->parent);
314 void lprocfs_remove(struct proc_dir_entry **rooth)
319 EXPORT_SYMBOL(lprocfs_remove);
321 void lprocfs_remove_proc_entry(const char *name, struct proc_dir_entry *parent)
323 LASSERT(parent != NULL);
324 remove_proc_entry(name, parent);
326 EXPORT_SYMBOL(lprocfs_remove_proc_entry);
328 struct dentry *ldebugfs_register(const char *name, struct dentry *parent,
329 struct lprocfs_vars *list, void *data)
331 struct dentry *entry;
333 entry = debugfs_create_dir(name, parent);
334 if (IS_ERR_OR_NULL(entry)) {
335 entry = entry ?: ERR_PTR(-ENOMEM);
339 if (!IS_ERR_OR_NULL(list)) {
342 rc = ldebugfs_add_vars(entry, list, data);
344 debugfs_remove(entry);
351 EXPORT_SYMBOL_GPL(ldebugfs_register);
353 struct proc_dir_entry *
354 lprocfs_register(const char *name, struct proc_dir_entry *parent,
355 struct lprocfs_vars *list, void *data)
357 struct proc_dir_entry *newchild;
359 newchild = proc_mkdir(name, parent);
361 return ERR_PTR(-ENOMEM);
364 int rc = lprocfs_add_vars(newchild, list, data);
366 lprocfs_remove(&newchild);
372 EXPORT_SYMBOL(lprocfs_register);
374 /* Generic callbacks */
375 int lprocfs_uuid_seq_show(struct seq_file *m, void *data)
377 struct obd_device *obd = data;
379 LASSERT(obd != NULL);
380 seq_printf(m, "%s\n", obd->obd_uuid.uuid);
383 EXPORT_SYMBOL(lprocfs_uuid_seq_show);
385 static ssize_t uuid_show(struct kobject *kobj, struct attribute *attr,
388 struct obd_device *obd = container_of(kobj, struct obd_device,
391 return sprintf(buf, "%s\n", obd->obd_uuid.uuid);
393 LUSTRE_RO_ATTR(uuid);
395 static ssize_t blocksize_show(struct kobject *kobj, struct attribute *attr,
398 struct obd_device *obd = container_of(kobj, struct obd_device,
400 struct obd_statfs osfs;
403 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
404 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
407 return sprintf(buf, "%u\n", osfs.os_bsize);
411 LUSTRE_RO_ATTR(blocksize);
413 static ssize_t kbytestotal_show(struct kobject *kobj, struct attribute *attr,
416 struct obd_device *obd = container_of(kobj, struct obd_device,
418 struct obd_statfs osfs;
421 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
422 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
425 u32 blk_size = osfs.os_bsize >> 10;
426 u64 result = osfs.os_blocks;
428 while (blk_size >>= 1)
431 return sprintf(buf, "%llu\n", result);
436 LUSTRE_RO_ATTR(kbytestotal);
438 static ssize_t kbytesfree_show(struct kobject *kobj, struct attribute *attr,
441 struct obd_device *obd = container_of(kobj, struct obd_device,
443 struct obd_statfs osfs;
446 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
447 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
450 u32 blk_size = osfs.os_bsize >> 10;
451 u64 result = osfs.os_bfree;
453 while (blk_size >>= 1)
456 return sprintf(buf, "%llu\n", result);
461 LUSTRE_RO_ATTR(kbytesfree);
463 static ssize_t kbytesavail_show(struct kobject *kobj, struct attribute *attr,
466 struct obd_device *obd = container_of(kobj, struct obd_device,
468 struct obd_statfs osfs;
471 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
472 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
475 u32 blk_size = osfs.os_bsize >> 10;
476 u64 result = osfs.os_bavail;
478 while (blk_size >>= 1)
481 return sprintf(buf, "%llu\n", result);
486 LUSTRE_RO_ATTR(kbytesavail);
488 static ssize_t filestotal_show(struct kobject *kobj, struct attribute *attr,
491 struct obd_device *obd = container_of(kobj, struct obd_device,
493 struct obd_statfs osfs;
496 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
497 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
500 return sprintf(buf, "%llu\n", osfs.os_files);
504 LUSTRE_RO_ATTR(filestotal);
506 static ssize_t filesfree_show(struct kobject *kobj, struct attribute *attr,
509 struct obd_device *obd = container_of(kobj, struct obd_device,
511 struct obd_statfs osfs;
514 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
515 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
518 return sprintf(buf, "%llu\n", osfs.os_ffree);
522 LUSTRE_RO_ATTR(filesfree);
524 ssize_t conn_uuid_show(struct kobject *kobj, struct attribute *attr, char *buf)
526 struct obd_device *obd = container_of(kobj, struct obd_device,
528 struct ptlrpc_connection *conn;
531 LPROCFS_CLIMP_CHECK(obd);
532 conn = obd->u.cli.cl_import->imp_connection;
533 if (conn && obd->u.cli.cl_import)
534 count = sprintf(buf, "%s\n", conn->c_remote_uuid.uuid);
536 count = sprintf(buf, "%s\n", "<none>");
538 LPROCFS_CLIMP_EXIT(obd);
541 EXPORT_SYMBOL(conn_uuid_show);
543 int lprocfs_server_uuid_seq_show(struct seq_file *m, void *data)
545 struct obd_device *obd = data;
546 struct obd_import *imp;
547 char *imp_state_name = NULL;
550 LASSERT(obd != NULL);
551 LPROCFS_CLIMP_CHECK(obd);
552 imp = obd->u.cli.cl_import;
553 imp_state_name = ptlrpc_import_state_name(imp->imp_state);
554 seq_printf(m, "%s\t%s%s\n", obd2cli_tgt(obd), imp_state_name,
555 imp->imp_deactive ? "\tDEACTIVATED" : "");
557 LPROCFS_CLIMP_EXIT(obd);
560 EXPORT_SYMBOL(lprocfs_server_uuid_seq_show);
562 /** add up per-cpu counters */
565 * Lock statistics structure for access, possibly only on this CPU.
567 * The statistics struct may be allocated with per-CPU structures for
568 * efficient concurrent update (usually only on server-wide stats), or
569 * as a single global struct (e.g. for per-client or per-job statistics),
570 * so the required locking depends on the type of structure allocated.
572 * For per-CPU statistics, pin the thread to the current cpuid so that
573 * will only access the statistics for that CPU. If the stats structure
574 * for the current CPU has not been allocated (or previously freed),
575 * allocate it now. The per-CPU statistics do not need locking since
576 * the thread is pinned to the CPU during update.
578 * For global statistics, lock the stats structure to prevent concurrent update.
580 * \param[in] stats statistics structure to lock
581 * \param[in] opc type of operation:
582 * LPROCFS_GET_SMP_ID: "lock" and return current CPU index
583 * for incrementing statistics for that CPU
584 * LPROCFS_GET_NUM_CPU: "lock" and return number of used
585 * CPU indices to iterate over all indices
586 * \param[out] flags CPU interrupt saved state for IRQ-safe locking
588 * \retval cpuid of current thread or number of allocated structs
589 * \retval negative on error (only for opc LPROCFS_GET_SMP_ID + per-CPU stats)
591 int lprocfs_stats_lock(struct lprocfs_stats *stats,
592 enum lprocfs_stats_lock_ops opc,
593 unsigned long *flags)
595 if (stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU) {
596 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
597 spin_lock_irqsave(&stats->ls_lock, *flags);
599 spin_lock(&stats->ls_lock);
600 return opc == LPROCFS_GET_NUM_CPU ? 1 : 0;
604 case LPROCFS_GET_SMP_ID: {
605 unsigned int cpuid = get_cpu();
607 if (unlikely(!stats->ls_percpu[cpuid])) {
608 int rc = lprocfs_stats_alloc_one(stats, cpuid);
617 case LPROCFS_GET_NUM_CPU:
618 return stats->ls_biggest_alloc_num;
625 * Unlock statistics structure after access.
627 * Unlock the lock acquired via lprocfs_stats_lock() for global statistics,
628 * or unpin this thread from the current cpuid for per-CPU statistics.
630 * This function must be called using the same arguments as used when calling
631 * lprocfs_stats_lock() so that the correct operation can be performed.
633 * \param[in] stats statistics structure to unlock
634 * \param[in] opc type of operation (current cpuid or number of structs)
635 * \param[in] flags CPU interrupt saved state for IRQ-safe locking
637 void lprocfs_stats_unlock(struct lprocfs_stats *stats,
638 enum lprocfs_stats_lock_ops opc,
639 unsigned long *flags)
641 if (stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU) {
642 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
643 spin_unlock_irqrestore(&stats->ls_lock, *flags);
645 spin_unlock(&stats->ls_lock);
646 } else if (opc == LPROCFS_GET_SMP_ID) {
651 /** add up per-cpu counters */
652 void lprocfs_stats_collect(struct lprocfs_stats *stats, int idx,
653 struct lprocfs_counter *cnt)
655 unsigned int num_entry;
656 struct lprocfs_counter *percpu_cntr;
658 unsigned long flags = 0;
660 memset(cnt, 0, sizeof(*cnt));
663 /* set count to 1 to avoid divide-by-zero errs in callers */
668 cnt->lc_min = LC_MIN_INIT;
670 num_entry = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
672 for (i = 0; i < num_entry; i++) {
673 if (!stats->ls_percpu[i])
675 percpu_cntr = lprocfs_stats_counter_get(stats, i, idx);
677 cnt->lc_count += percpu_cntr->lc_count;
678 cnt->lc_sum += percpu_cntr->lc_sum;
679 if (percpu_cntr->lc_min < cnt->lc_min)
680 cnt->lc_min = percpu_cntr->lc_min;
681 if (percpu_cntr->lc_max > cnt->lc_max)
682 cnt->lc_max = percpu_cntr->lc_max;
683 cnt->lc_sumsquare += percpu_cntr->lc_sumsquare;
686 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
689 static void obd_import_flags2str(struct obd_import *imp, struct seq_file *m)
693 if (imp->imp_obd->obd_no_recov) {
694 seq_printf(m, "no_recov");
698 flag2str(imp, invalid);
699 flag2str(imp, deactive);
700 flag2str(imp, replayable);
701 flag2str(imp, delayed_recovery);
702 flag2str(imp, vbr_failed);
703 flag2str(imp, pingable);
704 flag2str(imp, resend_replay);
705 flag2str(imp, no_pinger_recover);
706 flag2str(imp, connect_tried);
709 static const char *obd_connect_names[] = {
728 "remote_client_by_force",
737 "mds_mds_connection",
740 "alt_checksum_algorithm",
776 "file_secctx", /* 0x01 */
777 "lockaheadv2", /* 0x02 */
778 "dir_migrate", /* 0x04 */
779 "sum_statfs", /* 0x08 */
780 "overstriping", /* 0x10 */
783 "lock_convert", /* 0x80 */
784 "archive_id_array", /* 0x100 */
785 "unknown", /* 0x200 */
786 "selinux_policy", /* 0x400 */
789 "plain_layout", /* 0x2000 */
790 "async_discard", /* 0x4000 */
794 void obd_connect_seq_flags2str(struct seq_file *m, __u64 flags, __u64 flags2,
801 for (i = 0, mask = 1; i < 64; i++, mask <<= 1) {
803 seq_printf(m, "%s%s",
804 first ? "" : sep, obd_connect_names[i]);
809 if (flags & ~(mask - 1)) {
810 seq_printf(m, "%sunknown_%#llx",
811 first ? "" : sep, flags & ~(mask - 1));
815 if (!(flags & OBD_CONNECT_FLAGS2) || flags2 == 0)
818 for (i = 64, mask = 1; obd_connect_names[i] != NULL; i++, mask <<= 1) {
820 seq_printf(m, "%s%s",
821 first ? "" : sep, obd_connect_names[i]);
826 if (flags2 & ~(mask - 1)) {
827 seq_printf(m, "%sunknown2_%#llx",
828 first ? "" : sep, flags2 & ~(mask - 1));
832 EXPORT_SYMBOL(obd_connect_seq_flags2str);
834 int obd_connect_flags2str(char *page, int count, __u64 flags, __u64 flags2,
840 for (i = 0, mask = 1; i < 64; i++, mask <<= 1) {
842 ret += snprintf(page + ret, count - ret, "%s%s",
843 ret ? sep : "", obd_connect_names[i]);
846 if (flags & ~(mask - 1))
847 ret += snprintf(page + ret, count - ret,
849 ret ? sep : "", flags & ~(mask - 1));
851 if (!(flags & OBD_CONNECT_FLAGS2) || flags2 == 0)
854 for (i = 64, mask = 1; obd_connect_names[i] != NULL; i++, mask <<= 1) {
856 ret += snprintf(page + ret, count - ret, "%s%s",
857 ret ? sep : "", obd_connect_names[i]);
860 if (flags2 & ~(mask - 1))
861 ret += snprintf(page + ret, count - ret,
863 ret ? sep : "", flags2 & ~(mask - 1));
867 EXPORT_SYMBOL(obd_connect_flags2str);
870 obd_connect_data_seqprint(struct seq_file *m, struct obd_connect_data *ocd)
874 LASSERT(ocd != NULL);
875 flags = ocd->ocd_connect_flags;
877 seq_printf(m, " connect_data:\n"
880 ocd->ocd_connect_flags,
882 if (flags & OBD_CONNECT_VERSION)
883 seq_printf(m, " target_version: %u.%u.%u.%u\n",
884 OBD_OCD_VERSION_MAJOR(ocd->ocd_version),
885 OBD_OCD_VERSION_MINOR(ocd->ocd_version),
886 OBD_OCD_VERSION_PATCH(ocd->ocd_version),
887 OBD_OCD_VERSION_FIX(ocd->ocd_version));
888 if (flags & OBD_CONNECT_MDS)
889 seq_printf(m, " mdt_index: %d\n", ocd->ocd_group);
890 if (flags & OBD_CONNECT_GRANT)
891 seq_printf(m, " initial_grant: %d\n", ocd->ocd_grant);
892 if (flags & OBD_CONNECT_INDEX)
893 seq_printf(m, " target_index: %u\n", ocd->ocd_index);
894 if (flags & OBD_CONNECT_BRW_SIZE)
895 seq_printf(m, " max_brw_size: %d\n", ocd->ocd_brw_size);
896 if (flags & OBD_CONNECT_IBITS)
897 seq_printf(m, " ibits_known: %#llx\n",
898 ocd->ocd_ibits_known);
899 if (flags & OBD_CONNECT_GRANT_PARAM)
900 seq_printf(m, " grant_block_size: %d\n"
901 " grant_inode_size: %d\n"
902 " grant_max_extent_size: %d\n"
903 " grant_extent_tax: %d\n",
904 1 << ocd->ocd_grant_blkbits,
905 1 << ocd->ocd_grant_inobits,
906 ocd->ocd_grant_max_blks << ocd->ocd_grant_blkbits,
907 ocd->ocd_grant_tax_kb << 10);
908 if (flags & OBD_CONNECT_TRANSNO)
909 seq_printf(m, " first_transno: %#llx\n",
911 if (flags & OBD_CONNECT_CKSUM)
912 seq_printf(m, " cksum_types: %#x\n",
913 ocd->ocd_cksum_types);
914 if (flags & OBD_CONNECT_MAX_EASIZE)
915 seq_printf(m, " max_easize: %d\n", ocd->ocd_max_easize);
916 if (flags & OBD_CONNECT_MAXBYTES)
917 seq_printf(m, " max_object_bytes: %llu\n",
919 if (flags & OBD_CONNECT_MULTIMODRPCS)
920 seq_printf(m, " max_mod_rpcs: %hu\n",
921 ocd->ocd_maxmodrpcs);
924 int lprocfs_import_seq_show(struct seq_file *m, void *data)
926 char nidstr[LNET_NIDSTR_SIZE];
927 struct lprocfs_counter ret;
928 struct lprocfs_counter_header *header;
929 struct obd_device *obd = (struct obd_device *)data;
930 struct obd_import *imp;
931 struct obd_import_conn *conn;
932 struct obd_connect_data *ocd;
937 LASSERT(obd != NULL);
938 LPROCFS_CLIMP_CHECK(obd);
939 imp = obd->u.cli.cl_import;
940 ocd = &imp->imp_connect_data;
942 seq_printf(m, "import:\n"
946 " connect_flags: [ ",
949 ptlrpc_import_state_name(imp->imp_state));
950 obd_connect_seq_flags2str(m, imp->imp_connect_data.ocd_connect_flags,
951 imp->imp_connect_data.ocd_connect_flags2,
953 seq_printf(m, " ]\n");
954 obd_connect_data_seqprint(m, ocd);
955 seq_printf(m, " import_flags: [ ");
956 obd_import_flags2str(imp, m);
960 " failover_nids: [ ");
961 spin_lock(&imp->imp_lock);
963 list_for_each_entry(conn, &imp->imp_conn_list, oic_item) {
964 libcfs_nid2str_r(conn->oic_conn->c_peer.nid,
965 nidstr, sizeof(nidstr));
966 seq_printf(m, "%s%s", j ? ", " : "", nidstr);
969 if (imp->imp_connection)
970 libcfs_nid2str_r(imp->imp_connection->c_peer.nid,
971 nidstr, sizeof(nidstr));
973 strncpy(nidstr, "<none>", sizeof(nidstr));
975 " current_connection: %s\n"
976 " connection_attempts: %u\n"
978 " in-progress_invalidations: %u\n"
983 atomic_read(&imp->imp_inval_count),
984 ktime_get_real_seconds() - imp->imp_last_reply_time);
985 spin_unlock(&imp->imp_lock);
987 if (!obd->obd_svc_stats)
990 header = &obd->obd_svc_stats->ls_cnt_header[PTLRPC_REQWAIT_CNTR];
991 lprocfs_stats_collect(obd->obd_svc_stats, PTLRPC_REQWAIT_CNTR, &ret);
992 if (ret.lc_count != 0) {
993 /* first argument to do_div MUST be __u64 */
994 __u64 sum = ret.lc_sum;
995 do_div(sum, ret.lc_count);
999 seq_printf(m, " rpcs:\n"
1001 " unregistering: %u\n"
1003 " avg_waittime: %llu %s\n",
1004 atomic_read(&imp->imp_inflight),
1005 atomic_read(&imp->imp_unregistering),
1006 atomic_read(&imp->imp_timeouts),
1007 ret.lc_sum, header->lc_units);
1010 for(j = 0; j < IMP_AT_MAX_PORTALS; j++) {
1011 if (imp->imp_at.iat_portal[j] == 0)
1013 k = max_t(unsigned int, k,
1014 at_get(&imp->imp_at.iat_service_estimate[j]));
1016 seq_printf(m, " service_estimates:\n"
1017 " services: %u sec\n"
1018 " network: %u sec\n",
1020 at_get(&imp->imp_at.iat_net_latency));
1022 seq_printf(m, " transactions:\n"
1023 " last_replay: %llu\n"
1024 " peer_committed: %llu\n"
1025 " last_checked: %llu\n",
1026 imp->imp_last_replay_transno,
1027 imp->imp_peer_committed_transno,
1028 imp->imp_last_transno_checked);
1030 /* avg data rates */
1031 for (rw = 0; rw <= 1; rw++) {
1032 lprocfs_stats_collect(obd->obd_svc_stats,
1033 PTLRPC_LAST_CNTR + BRW_READ_BYTES + rw,
1035 if (ret.lc_sum > 0 && ret.lc_count > 0) {
1036 /* first argument to do_div MUST be __u64 */
1037 __u64 sum = ret.lc_sum;
1038 do_div(sum, ret.lc_count);
1040 seq_printf(m, " %s_data_averages:\n"
1041 " bytes_per_rpc: %llu\n",
1042 rw ? "write" : "read",
1045 k = (int)ret.lc_sum;
1046 j = opcode_offset(OST_READ + rw) + EXTRA_MAX_OPCODES;
1047 header = &obd->obd_svc_stats->ls_cnt_header[j];
1048 lprocfs_stats_collect(obd->obd_svc_stats, j, &ret);
1049 if (ret.lc_sum > 0 && ret.lc_count != 0) {
1050 /* first argument to do_div MUST be __u64 */
1051 __u64 sum = ret.lc_sum;
1052 do_div(sum, ret.lc_count);
1054 seq_printf(m, " %s_per_rpc: %llu\n",
1055 header->lc_units, ret.lc_sum);
1056 j = (int)ret.lc_sum;
1058 seq_printf(m, " MB_per_sec: %u.%.02u\n",
1059 k / j, (100 * k / j) % 100);
1064 LPROCFS_CLIMP_EXIT(obd);
1067 EXPORT_SYMBOL(lprocfs_import_seq_show);
1069 int lprocfs_state_seq_show(struct seq_file *m, void *data)
1071 struct obd_device *obd = (struct obd_device *)data;
1072 struct obd_import *imp;
1075 LASSERT(obd != NULL);
1076 LPROCFS_CLIMP_CHECK(obd);
1077 imp = obd->u.cli.cl_import;
1079 seq_printf(m, "current_state: %s\n",
1080 ptlrpc_import_state_name(imp->imp_state));
1081 seq_printf(m, "state_history:\n");
1082 k = imp->imp_state_hist_idx;
1083 for (j = 0; j < IMP_STATE_HIST_LEN; j++) {
1084 struct import_state_hist *ish =
1085 &imp->imp_state_hist[(k + j) % IMP_STATE_HIST_LEN];
1086 if (ish->ish_state == 0)
1088 seq_printf(m, " - [ %lld, %s ]\n", (s64)ish->ish_time,
1089 ptlrpc_import_state_name(ish->ish_state));
1092 LPROCFS_CLIMP_EXIT(obd);
1095 EXPORT_SYMBOL(lprocfs_state_seq_show);
1097 int lprocfs_at_hist_helper(struct seq_file *m, struct adaptive_timeout *at)
1100 for (i = 0; i < AT_BINS; i++)
1101 seq_printf(m, "%3u ", at->at_hist[i]);
1102 seq_printf(m, "\n");
1105 EXPORT_SYMBOL(lprocfs_at_hist_helper);
1107 /* See also ptlrpc_lprocfs_timeouts_show_seq */
1108 int lprocfs_timeouts_seq_show(struct seq_file *m, void *data)
1110 struct obd_device *obd = (struct obd_device *)data;
1111 struct obd_import *imp;
1112 unsigned int cur, worst;
1113 time64_t now, worstt;
1116 LASSERT(obd != NULL);
1117 LPROCFS_CLIMP_CHECK(obd);
1118 imp = obd->u.cli.cl_import;
1120 now = ktime_get_real_seconds();
1122 /* Some network health info for kicks */
1123 seq_printf(m, "%-10s : %lld, %llds ago\n",
1124 "last reply", (s64)imp->imp_last_reply_time,
1125 (s64)(now - imp->imp_last_reply_time));
1127 cur = at_get(&imp->imp_at.iat_net_latency);
1128 worst = imp->imp_at.iat_net_latency.at_worst_ever;
1129 worstt = imp->imp_at.iat_net_latency.at_worst_time;
1130 seq_printf(m, "%-10s : cur %3u worst %3u (at %lld, %llds ago) ",
1131 "network", cur, worst, (s64)worstt, (s64)(now - worstt));
1132 lprocfs_at_hist_helper(m, &imp->imp_at.iat_net_latency);
1134 for(i = 0; i < IMP_AT_MAX_PORTALS; i++) {
1135 if (imp->imp_at.iat_portal[i] == 0)
1137 cur = at_get(&imp->imp_at.iat_service_estimate[i]);
1138 worst = imp->imp_at.iat_service_estimate[i].at_worst_ever;
1139 worstt = imp->imp_at.iat_service_estimate[i].at_worst_time;
1140 seq_printf(m, "portal %-2d : cur %3u worst %3u (at %lld, %llds ago) ",
1141 imp->imp_at.iat_portal[i], cur, worst, (s64)worstt,
1142 (s64)(now - worstt));
1143 lprocfs_at_hist_helper(m, &imp->imp_at.iat_service_estimate[i]);
1146 LPROCFS_CLIMP_EXIT(obd);
1149 EXPORT_SYMBOL(lprocfs_timeouts_seq_show);
1151 int lprocfs_connect_flags_seq_show(struct seq_file *m, void *data)
1153 struct obd_device *obd = data;
1157 LPROCFS_CLIMP_CHECK(obd);
1158 flags = obd->u.cli.cl_import->imp_connect_data.ocd_connect_flags;
1159 flags2 = obd->u.cli.cl_import->imp_connect_data.ocd_connect_flags2;
1160 seq_printf(m, "flags=%#llx\n", flags);
1161 seq_printf(m, "flags2=%#llx\n", flags2);
1162 obd_connect_seq_flags2str(m, flags, flags2, "\n");
1163 seq_printf(m, "\n");
1164 LPROCFS_CLIMP_EXIT(obd);
1167 EXPORT_SYMBOL(lprocfs_connect_flags_seq_show);
1169 static const struct attribute *obd_def_uuid_attrs[] = {
1170 &lustre_attr_uuid.attr,
1174 static const struct attribute *obd_def_attrs[] = {
1175 &lustre_attr_blocksize.attr,
1176 &lustre_attr_kbytestotal.attr,
1177 &lustre_attr_kbytesfree.attr,
1178 &lustre_attr_kbytesavail.attr,
1179 &lustre_attr_filestotal.attr,
1180 &lustre_attr_filesfree.attr,
1181 &lustre_attr_uuid.attr,
1185 static void obd_sysfs_release(struct kobject *kobj)
1187 struct obd_device *obd = container_of(kobj, struct obd_device,
1190 complete(&obd->obd_kobj_unregister);
1193 int lprocfs_obd_setup(struct obd_device *obd, bool uuid_only)
1195 struct lprocfs_vars *debugfs_vars = NULL;
1198 if (!obd || obd->obd_magic != OBD_DEVICE_MAGIC)
1201 rc = kobject_set_name(&obd->obd_kset.kobj, "%s", obd->obd_name);
1205 obd->obd_ktype.sysfs_ops = &lustre_sysfs_ops;
1206 obd->obd_ktype.release = obd_sysfs_release;
1208 obd->obd_kset.kobj.parent = &obd->obd_type->typ_kobj;
1209 obd->obd_kset.kobj.ktype = &obd->obd_ktype;
1210 init_completion(&obd->obd_kobj_unregister);
1211 rc = kset_register(&obd->obd_kset);
1216 obd->obd_attrs = obd_def_uuid_attrs;
1218 obd->obd_attrs = obd_def_attrs;
1220 rc = sysfs_create_files(&obd->obd_kset.kobj, obd->obd_attrs);
1222 kset_unregister(&obd->obd_kset);
1226 if (!obd->obd_type->typ_procroot)
1227 debugfs_vars = obd->obd_vars;
1228 obd->obd_debugfs_entry = ldebugfs_register(obd->obd_name,
1229 obd->obd_type->typ_debugfs_entry,
1231 if (IS_ERR_OR_NULL(obd->obd_debugfs_entry)) {
1232 rc = obd->obd_debugfs_entry ? PTR_ERR(obd->obd_debugfs_entry)
1234 CERROR("error %d setting up debugfs for %s\n",
1236 obd->obd_debugfs_entry = NULL;
1238 sysfs_remove_files(&obd->obd_kset.kobj, obd->obd_attrs);
1239 obd->obd_attrs = NULL;
1240 kset_unregister(&obd->obd_kset);
1244 if (obd->obd_proc_entry || !obd->obd_type->typ_procroot)
1245 GOTO(already_registered, rc);
1247 obd->obd_proc_entry = lprocfs_register(obd->obd_name,
1248 obd->obd_type->typ_procroot,
1249 obd->obd_vars, obd);
1250 if (IS_ERR(obd->obd_proc_entry)) {
1251 rc = PTR_ERR(obd->obd_proc_entry);
1252 CERROR("error %d setting up lprocfs for %s\n",rc,obd->obd_name);
1253 obd->obd_proc_entry = NULL;
1255 ldebugfs_remove(&obd->obd_debugfs_entry);
1256 sysfs_remove_files(&obd->obd_kset.kobj, obd->obd_attrs);
1257 obd->obd_attrs = NULL;
1258 kset_unregister(&obd->obd_kset);
1264 EXPORT_SYMBOL(lprocfs_obd_setup);
1266 int lprocfs_obd_cleanup(struct obd_device *obd)
1271 if (obd->obd_proc_exports_entry) {
1272 /* Should be no exports left */
1273 lprocfs_remove(&obd->obd_proc_exports_entry);
1274 obd->obd_proc_exports_entry = NULL;
1277 if (obd->obd_proc_entry) {
1278 lprocfs_remove(&obd->obd_proc_entry);
1279 obd->obd_proc_entry = NULL;
1282 if (!IS_ERR_OR_NULL(obd->obd_debugfs_entry))
1283 ldebugfs_remove(&obd->obd_debugfs_entry);
1285 /* obd device never allocated a kset */
1286 if (!obd->obd_kset.kobj.state_initialized)
1289 if (obd->obd_attrs) {
1290 sysfs_remove_files(&obd->obd_kset.kobj, obd->obd_attrs);
1291 obd->obd_attrs = NULL;
1294 kset_unregister(&obd->obd_kset);
1295 wait_for_completion(&obd->obd_kobj_unregister);
1298 EXPORT_SYMBOL(lprocfs_obd_cleanup);
1300 int lprocfs_stats_alloc_one(struct lprocfs_stats *stats, unsigned int cpuid)
1302 struct lprocfs_counter *cntr;
1303 unsigned int percpusize;
1305 unsigned long flags = 0;
1308 LASSERT(stats->ls_percpu[cpuid] == NULL);
1309 LASSERT((stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU) == 0);
1311 percpusize = lprocfs_stats_counter_size(stats);
1312 LIBCFS_ALLOC_ATOMIC(stats->ls_percpu[cpuid], percpusize);
1313 if (stats->ls_percpu[cpuid]) {
1315 if (unlikely(stats->ls_biggest_alloc_num <= cpuid)) {
1316 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
1317 spin_lock_irqsave(&stats->ls_lock, flags);
1319 spin_lock(&stats->ls_lock);
1320 if (stats->ls_biggest_alloc_num <= cpuid)
1321 stats->ls_biggest_alloc_num = cpuid + 1;
1322 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE) {
1323 spin_unlock_irqrestore(&stats->ls_lock, flags);
1325 spin_unlock(&stats->ls_lock);
1328 /* initialize the ls_percpu[cpuid] non-zero counter */
1329 for (i = 0; i < stats->ls_num; ++i) {
1330 cntr = lprocfs_stats_counter_get(stats, cpuid, i);
1331 cntr->lc_min = LC_MIN_INIT;
1337 struct lprocfs_stats *lprocfs_alloc_stats(unsigned int num,
1338 enum lprocfs_stats_flags flags)
1340 struct lprocfs_stats *stats;
1341 unsigned int num_entry;
1342 unsigned int percpusize = 0;
1348 if (lprocfs_no_percpu_stats != 0)
1349 flags |= LPROCFS_STATS_FLAG_NOPERCPU;
1351 if (flags & LPROCFS_STATS_FLAG_NOPERCPU)
1354 num_entry = num_possible_cpus();
1356 /* alloc percpu pointers for all possible cpu slots */
1357 LIBCFS_ALLOC(stats, offsetof(typeof(*stats), ls_percpu[num_entry]));
1361 stats->ls_num = num;
1362 stats->ls_flags = flags;
1363 spin_lock_init(&stats->ls_lock);
1365 /* alloc num of counter headers */
1366 LIBCFS_ALLOC(stats->ls_cnt_header,
1367 stats->ls_num * sizeof(struct lprocfs_counter_header));
1368 if (!stats->ls_cnt_header)
1371 if ((flags & LPROCFS_STATS_FLAG_NOPERCPU) != 0) {
1372 /* contains only one set counters */
1373 percpusize = lprocfs_stats_counter_size(stats);
1374 LIBCFS_ALLOC_ATOMIC(stats->ls_percpu[0], percpusize);
1375 if (!stats->ls_percpu[0])
1377 stats->ls_biggest_alloc_num = 1;
1378 } else if ((flags & LPROCFS_STATS_FLAG_IRQ_SAFE) != 0) {
1379 /* alloc all percpu data, currently only obd_memory use this */
1380 for (i = 0; i < num_entry; ++i)
1381 if (lprocfs_stats_alloc_one(stats, i) < 0)
1388 lprocfs_free_stats(&stats);
1391 EXPORT_SYMBOL(lprocfs_alloc_stats);
1393 void lprocfs_free_stats(struct lprocfs_stats **statsh)
1395 struct lprocfs_stats *stats = *statsh;
1396 unsigned int num_entry;
1397 unsigned int percpusize;
1400 if (!stats || stats->ls_num == 0)
1404 if (stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU)
1407 num_entry = num_possible_cpus();
1409 percpusize = lprocfs_stats_counter_size(stats);
1410 for (i = 0; i < num_entry; i++)
1411 if (stats->ls_percpu[i])
1412 LIBCFS_FREE(stats->ls_percpu[i], percpusize);
1413 if (stats->ls_cnt_header)
1414 LIBCFS_FREE(stats->ls_cnt_header, stats->ls_num *
1415 sizeof(struct lprocfs_counter_header));
1416 LIBCFS_FREE(stats, offsetof(typeof(*stats), ls_percpu[num_entry]));
1418 EXPORT_SYMBOL(lprocfs_free_stats);
1420 u64 lprocfs_stats_collector(struct lprocfs_stats *stats, int idx,
1421 enum lprocfs_fields_flags field)
1423 unsigned long flags = 0;
1424 unsigned int num_cpu;
1430 num_cpu = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
1431 for (i = 0; i < num_cpu; i++) {
1432 struct lprocfs_counter *cntr;
1434 if (!stats->ls_percpu[i])
1437 cntr = lprocfs_stats_counter_get(stats, i, idx);
1438 ret += lprocfs_read_helper(cntr, &stats->ls_cnt_header[idx],
1439 stats->ls_flags, field);
1441 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
1444 EXPORT_SYMBOL(lprocfs_stats_collector);
1446 void lprocfs_clear_stats(struct lprocfs_stats *stats)
1448 struct lprocfs_counter *percpu_cntr;
1451 unsigned int num_entry;
1452 unsigned long flags = 0;
1454 num_entry = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
1456 for (i = 0; i < num_entry; i++) {
1457 if (!stats->ls_percpu[i])
1459 for (j = 0; j < stats->ls_num; j++) {
1460 percpu_cntr = lprocfs_stats_counter_get(stats, i, j);
1461 percpu_cntr->lc_count = 0;
1462 percpu_cntr->lc_min = LC_MIN_INIT;
1463 percpu_cntr->lc_max = 0;
1464 percpu_cntr->lc_sumsquare = 0;
1465 percpu_cntr->lc_sum = 0;
1466 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
1467 percpu_cntr->lc_sum_irq = 0;
1471 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
1473 EXPORT_SYMBOL(lprocfs_clear_stats);
1475 static ssize_t lprocfs_stats_seq_write(struct file *file,
1476 const char __user *buf,
1477 size_t len, loff_t *off)
1479 struct seq_file *seq = file->private_data;
1480 struct lprocfs_stats *stats = seq->private;
1482 lprocfs_clear_stats(stats);
1487 static void *lprocfs_stats_seq_start(struct seq_file *p, loff_t *pos)
1489 struct lprocfs_stats *stats = p->private;
1491 return (*pos < stats->ls_num) ? pos : NULL;
1494 static void lprocfs_stats_seq_stop(struct seq_file *p, void *v)
1498 static void *lprocfs_stats_seq_next(struct seq_file *p, void *v, loff_t *pos)
1502 return lprocfs_stats_seq_start(p, pos);
1505 /* seq file export of one lprocfs counter */
1506 static int lprocfs_stats_seq_show(struct seq_file *p, void *v)
1508 struct lprocfs_stats *stats = p->private;
1509 struct lprocfs_counter_header *hdr;
1510 struct lprocfs_counter ctr;
1511 int idx = *(loff_t *)v;
1514 struct timespec64 now;
1516 ktime_get_real_ts64(&now);
1517 seq_printf(p, "%-25s %llu.%09lu secs.nsecs\n",
1518 "snapshot_time", (s64)now.tv_sec, now.tv_nsec);
1521 hdr = &stats->ls_cnt_header[idx];
1522 lprocfs_stats_collect(stats, idx, &ctr);
1524 if (ctr.lc_count == 0)
1527 seq_printf(p, "%-25s %lld samples [%s]", hdr->lc_name,
1528 ctr.lc_count, hdr->lc_units);
1530 if ((hdr->lc_config & LPROCFS_CNTR_AVGMINMAX) && ctr.lc_count > 0) {
1531 seq_printf(p, " %lld %lld %lld",
1532 ctr.lc_min, ctr.lc_max, ctr.lc_sum);
1533 if (hdr->lc_config & LPROCFS_CNTR_STDDEV)
1534 seq_printf(p, " %llu", ctr.lc_sumsquare);
1540 static const struct seq_operations lprocfs_stats_seq_sops = {
1541 .start = lprocfs_stats_seq_start,
1542 .stop = lprocfs_stats_seq_stop,
1543 .next = lprocfs_stats_seq_next,
1544 .show = lprocfs_stats_seq_show,
1547 static int lprocfs_stats_seq_open(struct inode *inode, struct file *file)
1549 struct seq_file *seq;
1552 rc = LPROCFS_ENTRY_CHECK(inode);
1556 rc = seq_open(file, &lprocfs_stats_seq_sops);
1559 seq = file->private_data;
1560 seq->private = inode->i_private ? inode->i_private : PDE_DATA(inode);
1564 static const struct file_operations lprocfs_stats_seq_fops = {
1565 .owner = THIS_MODULE,
1566 .open = lprocfs_stats_seq_open,
1568 .write = lprocfs_stats_seq_write,
1569 .llseek = seq_lseek,
1570 .release = lprocfs_seq_release,
1573 int ldebugfs_register_stats(struct dentry *parent, const char *name,
1574 struct lprocfs_stats *stats)
1576 struct dentry *entry;
1578 LASSERT(!IS_ERR_OR_NULL(parent));
1580 entry = debugfs_create_file(name, 0644, parent, stats,
1581 &lprocfs_stats_seq_fops);
1582 if (IS_ERR_OR_NULL(entry))
1583 return entry ? PTR_ERR(entry) : -ENOMEM;
1587 EXPORT_SYMBOL_GPL(ldebugfs_register_stats);
1589 int lprocfs_register_stats(struct proc_dir_entry *root, const char *name,
1590 struct lprocfs_stats *stats)
1592 struct proc_dir_entry *entry;
1593 LASSERT(root != NULL);
1595 entry = proc_create_data(name, 0644, root,
1596 &lprocfs_stats_seq_fops, stats);
1601 EXPORT_SYMBOL(lprocfs_register_stats);
1603 void lprocfs_counter_init(struct lprocfs_stats *stats, int index,
1604 unsigned conf, const char *name, const char *units)
1606 struct lprocfs_counter_header *header;
1607 struct lprocfs_counter *percpu_cntr;
1608 unsigned long flags = 0;
1610 unsigned int num_cpu;
1612 LASSERT(stats != NULL);
1614 header = &stats->ls_cnt_header[index];
1615 LASSERTF(header != NULL, "Failed to allocate stats header:[%d]%s/%s\n",
1616 index, name, units);
1618 header->lc_config = conf;
1619 header->lc_name = name;
1620 header->lc_units = units;
1622 num_cpu = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
1623 for (i = 0; i < num_cpu; ++i) {
1624 if (!stats->ls_percpu[i])
1626 percpu_cntr = lprocfs_stats_counter_get(stats, i, index);
1627 percpu_cntr->lc_count = 0;
1628 percpu_cntr->lc_min = LC_MIN_INIT;
1629 percpu_cntr->lc_max = 0;
1630 percpu_cntr->lc_sumsquare = 0;
1631 percpu_cntr->lc_sum = 0;
1632 if ((stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE) != 0)
1633 percpu_cntr->lc_sum_irq = 0;
1635 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
1637 EXPORT_SYMBOL(lprocfs_counter_init);
1639 static const char * const mps_stats[] = {
1640 [LPROC_MD_CLOSE] = "close",
1641 [LPROC_MD_CREATE] = "create",
1642 [LPROC_MD_ENQUEUE] = "enqueue",
1643 [LPROC_MD_GETATTR] = "getattr",
1644 [LPROC_MD_INTENT_LOCK] = "intent_lock",
1645 [LPROC_MD_LINK] = "link",
1646 [LPROC_MD_RENAME] = "rename",
1647 [LPROC_MD_SETATTR] = "setattr",
1648 [LPROC_MD_FSYNC] = "fsync",
1649 [LPROC_MD_READ_PAGE] = "read_page",
1650 [LPROC_MD_UNLINK] = "unlink",
1651 [LPROC_MD_SETXATTR] = "setxattr",
1652 [LPROC_MD_GETXATTR] = "getxattr",
1653 [LPROC_MD_INTENT_GETATTR_ASYNC] = "intent_getattr_async",
1654 [LPROC_MD_REVALIDATE_LOCK] = "revalidate_lock",
1657 int lprocfs_alloc_md_stats(struct obd_device *obd,
1658 unsigned int num_private_stats)
1660 struct lprocfs_stats *stats;
1661 unsigned int num_stats;
1665 * TODO Ensure that this function is only used where
1666 * appropriate by adding an assertion to the effect that
1667 * obd->obd_type->typ_md_ops is not NULL. We can't do this now
1668 * because mdt_procfs_init() uses this function to allocate
1669 * the stats backing /proc/fs/lustre/mdt/.../md_stats but the
1670 * mdt layer does not use the md_ops interface. This is
1671 * confusing and a waste of memory. See LU-2484.
1673 LASSERT(obd->obd_proc_entry != NULL);
1674 LASSERT(obd->obd_md_stats == NULL);
1676 num_stats = ARRAY_SIZE(mps_stats) + num_private_stats;
1677 stats = lprocfs_alloc_stats(num_stats, 0);
1681 for (i = 0; i < ARRAY_SIZE(mps_stats); i++) {
1682 lprocfs_counter_init(stats, i, 0, mps_stats[i], "reqs");
1683 if (!stats->ls_cnt_header[i].lc_name) {
1684 CERROR("Missing md_stat initializer md_op operation at offset %d. Aborting.\n",
1690 rc = lprocfs_register_stats(obd->obd_proc_entry, "md_stats", stats);
1692 lprocfs_free_stats(&stats);
1694 obd->obd_md_stats = stats;
1699 EXPORT_SYMBOL(lprocfs_alloc_md_stats);
1701 void lprocfs_free_md_stats(struct obd_device *obd)
1703 struct lprocfs_stats *stats = obd->obd_md_stats;
1706 obd->obd_md_stats = NULL;
1707 lprocfs_free_stats(&stats);
1710 EXPORT_SYMBOL(lprocfs_free_md_stats);
1712 void lprocfs_init_ldlm_stats(struct lprocfs_stats *ldlm_stats)
1714 lprocfs_counter_init(ldlm_stats,
1715 LDLM_ENQUEUE - LDLM_FIRST_OPC,
1716 0, "ldlm_enqueue", "reqs");
1717 lprocfs_counter_init(ldlm_stats,
1718 LDLM_CONVERT - LDLM_FIRST_OPC,
1719 0, "ldlm_convert", "reqs");
1720 lprocfs_counter_init(ldlm_stats,
1721 LDLM_CANCEL - LDLM_FIRST_OPC,
1722 0, "ldlm_cancel", "reqs");
1723 lprocfs_counter_init(ldlm_stats,
1724 LDLM_BL_CALLBACK - LDLM_FIRST_OPC,
1725 0, "ldlm_bl_callback", "reqs");
1726 lprocfs_counter_init(ldlm_stats,
1727 LDLM_CP_CALLBACK - LDLM_FIRST_OPC,
1728 0, "ldlm_cp_callback", "reqs");
1729 lprocfs_counter_init(ldlm_stats,
1730 LDLM_GL_CALLBACK - LDLM_FIRST_OPC,
1731 0, "ldlm_gl_callback", "reqs");
1733 EXPORT_SYMBOL(lprocfs_init_ldlm_stats);
1735 __s64 lprocfs_read_helper(struct lprocfs_counter *lc,
1736 struct lprocfs_counter_header *header,
1737 enum lprocfs_stats_flags flags,
1738 enum lprocfs_fields_flags field)
1746 case LPROCFS_FIELDS_FLAGS_CONFIG:
1747 ret = header->lc_config;
1749 case LPROCFS_FIELDS_FLAGS_SUM:
1751 if ((flags & LPROCFS_STATS_FLAG_IRQ_SAFE) != 0)
1752 ret += lc->lc_sum_irq;
1754 case LPROCFS_FIELDS_FLAGS_MIN:
1757 case LPROCFS_FIELDS_FLAGS_MAX:
1760 case LPROCFS_FIELDS_FLAGS_AVG:
1761 ret = (lc->lc_max - lc->lc_min) / 2;
1763 case LPROCFS_FIELDS_FLAGS_SUMSQUARE:
1764 ret = lc->lc_sumsquare;
1766 case LPROCFS_FIELDS_FLAGS_COUNT:
1774 EXPORT_SYMBOL(lprocfs_read_helper);
1776 /* Obtains the conversion factor for the unit specified */
1777 static int get_mult(char unit, __u64 *mult)
1782 /* peta, tera, giga, mega, and kilo */
1799 /* some tests expect % to be accepted */
1813 * Ensures the numeric string is valid. The function provides the final
1814 * multiplier in the case a unit exists at the end of the string. It also
1815 * locates the start of the whole and fractional parts (if any). This
1816 * function modifies the string so kstrtoull can be used to parse both
1817 * the whole and fraction portions. This function also figures out
1818 * the base of the number.
1820 static int preprocess_numeric_str(char *buffer, __u64 *mult, __u64 def_mult,
1821 bool allow_units, char **whole, char **frac,
1824 bool hit_decimal = false;
1825 bool hit_unit = false;
1833 /* a hex string if it starts with "0x" */
1834 if (buffer[0] == '0' && tolower(buffer[1]) == 'x') {
1842 /* allow for a single new line before the null terminator */
1843 if (*buffer == '\n') {
1853 /* any chars after our unit indicates a malformed string */
1857 /* ensure we only hit one decimal */
1858 if (*buffer == '.') {
1862 /* if past start, there's a whole part */
1863 if (start != buffer)
1869 } else if (!isdigit(*buffer) &&
1870 !(*base == 16 && isxdigit(*buffer))) {
1872 /* if we allow units, attempt to get mult */
1874 rc = get_mult(*buffer, mult);
1878 /* string stops here, but keep processing */
1890 /* hit a decimal, make sure there's a fractional part */
1896 /* didn't hit a decimal, but may have a whole part */
1897 if (start != buffer && *start)
1901 /* malformed string if we didn't get anything */
1902 if (!*frac && !*whole)
1909 * Parses a numeric string which can contain a whole and fraction portion
1910 * into a __u64. Accepts a multiplier to apply to the value parsed. Also
1911 * allows the string to have a unit at the end. The function handles
1912 * wrapping of the final unsigned value.
1914 static int str_to_u64_parse(char *buffer, unsigned long count,
1915 __u64 *val, __u64 def_mult, bool allow_units)
1919 unsigned int frac_d = 1;
1920 __u64 wrap_indicator = ULLONG_MAX;
1925 unsigned int base = 10;
1927 rc = preprocess_numeric_str(buffer, &mult, def_mult, allow_units,
1928 &strwhole, &strfrac, &base);
1938 /* the multiplier limits how large the value can be */
1939 wrap_indicator = div64_u64(wrap_indicator, mult);
1942 rc = kstrtoull(strwhole, base, &whole);
1946 if (whole > wrap_indicator)
1953 if (strlen(strfrac) > 10)
1956 rc = kstrtoull(strfrac, base, &frac);
1960 /* determine power of fractional portion */
1966 /* fractional portion is too large to perform calculation */
1967 if (frac > wrap_indicator)
1971 do_div(frac, frac_d);
1974 /* check that the sum of whole and fraction fits in u64 */
1975 if (whole > (ULLONG_MAX - frac))
1978 *val = whole + frac;
1984 * This function parses numeric/hex strings into __s64. It accepts a multiplier
1985 * which will apply to the value parsed. It also can allow the string to
1986 * have a unit as the last character. The function handles overflow/underflow
1987 * of the signed integer.
1989 static int str_to_s64_internal(const char __user *buffer, unsigned long count,
1990 __s64 *val, __u64 def_mult, bool allow_units)
1994 unsigned int offset = 0;
1995 int signed sign = 1;
1996 __u64 max = LLONG_MAX;
1999 if (count > (sizeof(kernbuf) - 1))
2002 if (copy_from_user(kernbuf, buffer, count))
2005 kernbuf[count] = '\0';
2007 /* keep track of our sign */
2008 if (*kernbuf == '-') {
2011 /* equivalent to max = -LLONG_MIN, avoids overflow */
2015 rc = str_to_u64_parse(kernbuf + offset, count - offset,
2016 &tmp, def_mult, allow_units);
2020 /* check for overflow/underflow */
2024 *val = (__s64)tmp * sign;
2030 * Convert a user string into a signed 64 bit number. This function produces
2031 * an error when the value parsed from the string times multiplier underflows or
2032 * overflows. This function only accepts strings that contains digits, an
2033 * optional decimal, and a char representing a unit at the end. If a unit is
2034 * specified in the string, the multiplier provided by the caller is ignored.
2035 * This function can also accept hexadecimal strings which are prefixed with
2038 * \param[in] buffer string consisting of numbers, a decimal, and a unit
2039 * \param[in] count buffer length
2040 * \param[in] val if successful, the value represented by the string
2041 * \param[in] defunit default unit if string doesn't contain one
2043 * \retval 0 on success
2044 * \retval negative number on error
2046 int lprocfs_str_with_units_to_s64(const char __user *buffer,
2047 unsigned long count, __s64 *val, char defunit)
2052 if (defunit != '1') {
2053 rc = get_mult(defunit, &mult);
2058 return str_to_s64_internal(buffer, count, val, mult, true);
2060 EXPORT_SYMBOL(lprocfs_str_with_units_to_s64);
2062 char *lprocfs_strnstr(const char *s1, const char *s2, size_t len)
2071 if (!memcmp(s1, s2, l2))
2077 EXPORT_SYMBOL(lprocfs_strnstr);
2080 * Find the string \a name in the input \a buffer, and return a pointer to the
2081 * value immediately following \a name, reducing \a count appropriately.
2082 * If \a name is not found the original \a buffer is returned.
2084 char *lprocfs_find_named_value(const char *buffer, const char *name,
2088 size_t buflen = *count;
2090 /* there is no strnstr() in rhel5 and ubuntu kernels */
2091 val = lprocfs_strnstr(buffer, name, buflen);
2093 return (char *)buffer;
2095 val += strlen(name); /* skip prefix */
2096 while (val < buffer + buflen && isspace(*val)) /* skip separator */
2100 while (val < buffer + buflen && isalnum(*val)) {
2105 return val - *count;
2107 EXPORT_SYMBOL(lprocfs_find_named_value);
2109 int ldebugfs_seq_create(struct dentry *parent, const char *name, umode_t mode,
2110 const struct file_operations *seq_fops, void *data)
2112 struct dentry *entry;
2114 /* Disallow secretly (un)writable entries. */
2115 LASSERT((!seq_fops->write) == (!(mode & 0222)));
2117 entry = debugfs_create_file(name, mode, parent, data, seq_fops);
2118 if (IS_ERR_OR_NULL(entry))
2119 return entry ? PTR_ERR(entry) : -ENOMEM;
2123 EXPORT_SYMBOL_GPL(ldebugfs_seq_create);
2125 int lprocfs_seq_create(struct proc_dir_entry *parent,
2128 const struct file_operations *seq_fops,
2131 struct proc_dir_entry *entry;
2134 /* Disallow secretly (un)writable entries. */
2135 LASSERT((seq_fops->write == NULL) == ((mode & 0222) == 0));
2137 entry = proc_create_data(name, mode, parent, seq_fops, data);
2144 EXPORT_SYMBOL(lprocfs_seq_create);
2146 int lprocfs_obd_seq_create(struct obd_device *dev,
2149 const struct file_operations *seq_fops,
2152 return (lprocfs_seq_create(dev->obd_proc_entry, name,
2153 mode, seq_fops, data));
2155 EXPORT_SYMBOL(lprocfs_obd_seq_create);
2157 void lprocfs_oh_tally(struct obd_histogram *oh, unsigned int value)
2159 if (value >= OBD_HIST_MAX)
2160 value = OBD_HIST_MAX - 1;
2162 spin_lock(&oh->oh_lock);
2163 oh->oh_buckets[value]++;
2164 spin_unlock(&oh->oh_lock);
2166 EXPORT_SYMBOL(lprocfs_oh_tally);
2168 void lprocfs_oh_tally_log2(struct obd_histogram *oh, unsigned int value)
2170 unsigned int val = 0;
2172 if (likely(value != 0))
2173 val = min(fls(value - 1), OBD_HIST_MAX);
2175 lprocfs_oh_tally(oh, val);
2177 EXPORT_SYMBOL(lprocfs_oh_tally_log2);
2179 unsigned long lprocfs_oh_sum(struct obd_histogram *oh)
2181 unsigned long ret = 0;
2184 for (i = 0; i < OBD_HIST_MAX; i++)
2185 ret += oh->oh_buckets[i];
2188 EXPORT_SYMBOL(lprocfs_oh_sum);
2190 void lprocfs_oh_clear(struct obd_histogram *oh)
2192 spin_lock(&oh->oh_lock);
2193 memset(oh->oh_buckets, 0, sizeof(oh->oh_buckets));
2194 spin_unlock(&oh->oh_lock);
2196 EXPORT_SYMBOL(lprocfs_oh_clear);
2198 ssize_t lustre_attr_show(struct kobject *kobj,
2199 struct attribute *attr, char *buf)
2201 struct lustre_attr *a = container_of(attr, struct lustre_attr, attr);
2203 return a->show ? a->show(kobj, attr, buf) : 0;
2205 EXPORT_SYMBOL_GPL(lustre_attr_show);
2207 ssize_t lustre_attr_store(struct kobject *kobj, struct attribute *attr,
2208 const char *buf, size_t len)
2210 struct lustre_attr *a = container_of(attr, struct lustre_attr, attr);
2212 return a->store ? a->store(kobj, attr, buf, len) : len;
2214 EXPORT_SYMBOL_GPL(lustre_attr_store);
2216 const struct sysfs_ops lustre_sysfs_ops = {
2217 .show = lustre_attr_show,
2218 .store = lustre_attr_store,
2220 EXPORT_SYMBOL_GPL(lustre_sysfs_ops);
2222 int lprocfs_obd_max_pages_per_rpc_seq_show(struct seq_file *m, void *data)
2224 struct obd_device *dev = data;
2225 struct client_obd *cli = &dev->u.cli;
2227 spin_lock(&cli->cl_loi_list_lock);
2228 seq_printf(m, "%d\n", cli->cl_max_pages_per_rpc);
2229 spin_unlock(&cli->cl_loi_list_lock);
2232 EXPORT_SYMBOL(lprocfs_obd_max_pages_per_rpc_seq_show);
2234 ssize_t lprocfs_obd_max_pages_per_rpc_seq_write(struct file *file,
2235 const char __user *buffer,
2236 size_t count, loff_t *off)
2238 struct obd_device *dev =
2239 ((struct seq_file *)file->private_data)->private;
2240 struct client_obd *cli = &dev->u.cli;
2241 struct obd_connect_data *ocd = &cli->cl_import->imp_connect_data;
2245 rc = lprocfs_str_with_units_to_s64(buffer, count, &val, '1');
2251 /* if the max_pages is specified in bytes, convert to pages */
2252 if (val >= ONE_MB_BRW_SIZE)
2255 LPROCFS_CLIMP_CHECK(dev);
2257 chunk_mask = ~((1 << (cli->cl_chunkbits - PAGE_SHIFT)) - 1);
2258 /* max_pages_per_rpc must be chunk aligned */
2259 val = (val + ~chunk_mask) & chunk_mask;
2260 if (val == 0 || (ocd->ocd_brw_size != 0 &&
2261 val > ocd->ocd_brw_size >> PAGE_SHIFT)) {
2262 LPROCFS_CLIMP_EXIT(dev);
2265 spin_lock(&cli->cl_loi_list_lock);
2266 cli->cl_max_pages_per_rpc = val;
2267 client_adjust_max_dirty(cli);
2268 spin_unlock(&cli->cl_loi_list_lock);
2270 LPROCFS_CLIMP_EXIT(dev);
2273 EXPORT_SYMBOL(lprocfs_obd_max_pages_per_rpc_seq_write);
2275 ssize_t short_io_bytes_show(struct kobject *kobj, struct attribute *attr,
2278 struct obd_device *dev = container_of(kobj, struct obd_device,
2280 struct client_obd *cli = &dev->u.cli;
2283 spin_lock(&cli->cl_loi_list_lock);
2284 rc = sprintf(buf, "%d\n", cli->cl_max_short_io_bytes);
2285 spin_unlock(&cli->cl_loi_list_lock);
2288 EXPORT_SYMBOL(short_io_bytes_show);
2290 /* Used to catch people who think they're specifying pages. */
2291 #define MIN_SHORT_IO_BYTES 64U
2293 ssize_t short_io_bytes_store(struct kobject *kobj, struct attribute *attr,
2294 const char *buffer, size_t count)
2296 struct obd_device *dev = container_of(kobj, struct obd_device,
2298 struct client_obd *cli = &dev->u.cli;
2302 LPROCFS_CLIMP_CHECK(dev);
2304 rc = kstrtouint(buffer, 0, &val);
2308 if (val && (val < MIN_SHORT_IO_BYTES || val > OBD_MAX_SHORT_IO_BYTES))
2309 GOTO(out, rc = -ERANGE);
2313 spin_lock(&cli->cl_loi_list_lock);
2314 if (val > (cli->cl_max_pages_per_rpc << PAGE_SHIFT))
2317 cli->cl_max_short_io_bytes = val;
2318 spin_unlock(&cli->cl_loi_list_lock);
2321 LPROCFS_CLIMP_EXIT(dev);
2324 EXPORT_SYMBOL(short_io_bytes_store);
2326 int lprocfs_wr_root_squash(const char __user *buffer, unsigned long count,
2327 struct root_squash_info *squash, char *name)
2330 char kernbuf[64], *tmp, *errmsg;
2331 unsigned long uid, gid;
2334 if (count >= sizeof(kernbuf)) {
2335 errmsg = "string too long";
2336 GOTO(failed_noprint, rc = -EINVAL);
2338 if (copy_from_user(kernbuf, buffer, count)) {
2339 errmsg = "bad address";
2340 GOTO(failed_noprint, rc = -EFAULT);
2342 kernbuf[count] = '\0';
2344 /* look for uid gid separator */
2345 tmp = strchr(kernbuf, ':');
2347 errmsg = "needs uid:gid format";
2348 GOTO(failed, rc = -EINVAL);
2354 if (kstrtoul(kernbuf, 0, &uid) != 0) {
2356 GOTO(failed, rc = -EINVAL);
2360 if (kstrtoul(tmp, 0, &gid) != 0) {
2362 GOTO(failed, rc = -EINVAL);
2365 squash->rsi_uid = uid;
2366 squash->rsi_gid = gid;
2368 LCONSOLE_INFO("%s: root_squash is set to %u:%u\n",
2369 name, squash->rsi_uid, squash->rsi_gid);
2377 CWARN("%s: failed to set root_squash to \"%s\", %s, rc = %d\n",
2378 name, kernbuf, errmsg, rc);
2381 CWARN("%s: failed to set root_squash due to %s, rc = %d\n",
2385 EXPORT_SYMBOL(lprocfs_wr_root_squash);
2388 int lprocfs_wr_nosquash_nids(const char __user *buffer, unsigned long count,
2389 struct root_squash_info *squash, char *name)
2392 char *kernbuf = NULL;
2394 struct list_head tmp;
2399 errmsg = "string too long";
2400 GOTO(failed, rc = -EINVAL);
2403 OBD_ALLOC(kernbuf, count + 1);
2405 errmsg = "no memory";
2406 GOTO(failed, rc = -ENOMEM);
2408 if (copy_from_user(kernbuf, buffer, count)) {
2409 errmsg = "bad address";
2410 GOTO(failed, rc = -EFAULT);
2412 kernbuf[count] = '\0';
2414 if (count > 0 && kernbuf[count - 1] == '\n')
2417 if ((len == 4 && strncmp(kernbuf, "NONE", len) == 0) ||
2418 (len == 5 && strncmp(kernbuf, "clear", len) == 0)) {
2419 /* empty string is special case */
2420 down_write(&squash->rsi_sem);
2421 if (!list_empty(&squash->rsi_nosquash_nids))
2422 cfs_free_nidlist(&squash->rsi_nosquash_nids);
2423 up_write(&squash->rsi_sem);
2424 LCONSOLE_INFO("%s: nosquash_nids is cleared\n", name);
2425 OBD_FREE(kernbuf, count + 1);
2429 INIT_LIST_HEAD(&tmp);
2430 if (cfs_parse_nidlist(kernbuf, count, &tmp) <= 0) {
2431 errmsg = "can't parse";
2432 GOTO(failed, rc = -EINVAL);
2434 LCONSOLE_INFO("%s: nosquash_nids set to %s\n",
2436 OBD_FREE(kernbuf, count + 1);
2439 down_write(&squash->rsi_sem);
2440 if (!list_empty(&squash->rsi_nosquash_nids))
2441 cfs_free_nidlist(&squash->rsi_nosquash_nids);
2442 list_splice(&tmp, &squash->rsi_nosquash_nids);
2443 up_write(&squash->rsi_sem);
2449 CWARN("%s: failed to set nosquash_nids to \"%s\", %s rc = %d\n",
2450 name, kernbuf, errmsg, rc);
2451 OBD_FREE(kernbuf, count + 1);
2453 CWARN("%s: failed to set nosquash_nids due to %s rc = %d\n",
2458 EXPORT_SYMBOL(lprocfs_wr_nosquash_nids);
2460 #endif /* CONFIG_PROC_FS*/