4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.gnu.org/licenses/gpl-2.0.html
23 * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2011, 2017, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
31 * lustre/obdclass/lprocfs_status.c
33 * Author: Hariharan Thantry <thantry@users.sourceforge.net>
36 #define DEBUG_SUBSYSTEM S_CLASS
38 #include <obd_class.h>
39 #include <lprocfs_status.h>
/*
 * Module parameter (mode 0644).  When non-zero, lprocfs_alloc_stats() adds
 * LPROCFS_STATS_FLAG_NOPERCPU to the requested flags.
 */
43 static int lprocfs_no_percpu_stats = 0;
44 module_param(lprocfs_no_percpu_stats, int, 0644);
45 MODULE_PARM_DESC(lprocfs_no_percpu_stats, "Do not alloc percpu data for lprocfs stats");
/* Size basis for the symlink target buffer in lprocfs_add_symlink(). */
47 #define MAX_STRING_SIZE 128
/* Release handler that simply forwards to single_release(). */
49 int lprocfs_single_release(struct inode *inode, struct file *file)
51 return single_release(inode, file);
53 EXPORT_SYMBOL(lprocfs_single_release);
/* Release handler that simply forwards to seq_release(). */
55 int lprocfs_seq_release(struct inode *inode, struct file *file)
57 return seq_release(inode, file);
59 EXPORT_SYMBOL(lprocfs_seq_release);
/*
 * Derive a file mode from \a ops.  Callers in this file pass the returned
 * umode_t as the mode argument of proc_create_data().
 * NOTE(review): the function body is not visible in this extract, so how the
 * mode is derived from \a ops cannot be stated here -- confirm in full source.
 */
61 static umode_t default_mode(const struct proc_ops *ops)
/*
 * Create one proc entry called \a name under \a root, using \a fops as its
 * operations and \a data as its private data.
 *
 * Returns ERR_PTR(-EINVAL) when \a root, \a name or \a fops is NULL.  An
 * ERR_PTR(-ENOMEM) return follows the "No memory" CERROR below.
 * NOTE(review): the condition guarding that error path and the success
 * return are not visible in this extract.
 */
73 struct proc_dir_entry *
74 lprocfs_add_simple(struct proc_dir_entry *root, char *name,
75 void *data, const struct proc_ops *fops)
77 struct proc_dir_entry *proc;
/* All three of root, name and fops are mandatory. */
80 if (!root || !name || !fops)
81 return ERR_PTR(-EINVAL);
/* The file mode comes from default_mode(fops). */
83 mode = default_mode(fops);
84 proc = proc_create_data(name, mode, root, fops, data);
86 CERROR("LprocFS: No memory to create /proc entry %s\n",
88 return ERR_PTR(-ENOMEM);
92 EXPORT_SYMBOL(lprocfs_add_simple);
/*
 * Create a proc symlink called \a name under \a parent.  The link target is
 * built from the printf-style \a format and its variadic arguments.
 *
 * The target is formatted into a temporary buffer of MAX_STRING_SIZE + 1
 * bytes, which is freed again before the function ends.
 * NOTE(review): the return statements are not visible in this extract.
 */
94 struct proc_dir_entry *lprocfs_add_symlink(const char *name,
95 struct proc_dir_entry *parent,
96 const char *format, ...)
98 struct proc_dir_entry *entry;
102 if (!parent || !format)
105 OBD_ALLOC_WAIT(dest, MAX_STRING_SIZE + 1);
109 va_start(ap, format);
/* Output is bounded to MAX_STRING_SIZE; the buffer is one byte larger. */
110 vsnprintf(dest, MAX_STRING_SIZE, format, ap);
113 entry = proc_symlink(name, parent, dest);
115 CERROR("LprocFS: Could not create symbolic link from "
116 "%s to %s\n", name, dest);
/* The free size matches the OBD_ALLOC_WAIT() size above. */
118 OBD_FREE(dest, MAX_STRING_SIZE + 1);
121 EXPORT_SYMBOL(lprocfs_add_symlink);
/* Empty operations table; ldebugfs_add_vars() uses it when an entry has no fops. */
123 static const struct file_operations ldebugfs_empty_ops = { };
/*
 * Create debugfs files under \a parent for the entries described by \a list.
 *
 * Does nothing useful when \a parent or \a list is NULL or an error pointer
 * (the statement taken in that case is not visible in this extract).
 * An entry's explicit proc_mode is used when non-zero; otherwise the mode
 * depends on whether its fops provide read and/or write handlers.
 * NOTE(review): the loop header, the third parameter and the mode values
 * assigned in the read/write branches are not visible here.
 */
125 void ldebugfs_add_vars(struct dentry *parent, struct ldebugfs_vars *list,
128 if (IS_ERR_OR_NULL(parent) || IS_ERR_OR_NULL(list))
134 if (list->proc_mode != 0000) {
135 mode = list->proc_mode;
136 } else if (list->fops) {
137 if (list->fops->read)
139 if (list->fops->write)
142 debugfs_create_file(list->name, mode, parent,
/* Fall back to the empty ops table when the entry supplies no fops. */
144 list->fops ? : &ldebugfs_empty_ops);
148 EXPORT_SYMBOL_GPL(ldebugfs_add_vars);
/* Empty operations table; lprocfs_add_vars() uses it when an entry has no fops. */
150 static const struct proc_ops lprocfs_empty_ops = { };
155 * \param root [in] The parent proc entry on which new entry will be added.
156 * \param list [in] Array of proc entries to be added.
157 * \param data [in] The argument to be passed when entries read/write routines
158 * are called through /proc file.
160 * \retval 0 on success
/*
 * For each processed entry of \a list, create a proc file under \a root with
 * proc_create_data().  The mode is either the entry's proc_mode or the value
 * of default_mode() for its fops; entries without fops get lprocfs_empty_ops.
 * NOTE(review): the loop, the condition choosing between the two mode
 * assignments, and the error handling are not visible in this extract.
 */
164 lprocfs_add_vars(struct proc_dir_entry *root, struct lprocfs_vars *list,
171 struct proc_dir_entry *proc;
175 mode = list->proc_mode;
177 mode = default_mode(list->fops);
178 proc = proc_create_data(list->name, mode, root,
179 list->fops ?: &lprocfs_empty_ops,
187 EXPORT_SYMBOL(lprocfs_add_vars);
/*
 * Remove the proc entry referenced through \a rooth.  Callers in this file
 * pass the address of their proc_dir_entry pointer.
 * NOTE(review): the body is not visible in this extract; whether *rooth is
 * reset by this function should be confirmed in the full source.
 */
189 void lprocfs_remove(struct proc_dir_entry **rooth)
194 EXPORT_SYMBOL(lprocfs_remove);
/*
 * Remove the proc entry \a name from \a parent via remove_proc_entry().
 * \a parent must not be NULL (enforced with LASSERT).
 */
196 void lprocfs_remove_proc_entry(const char *name, struct proc_dir_entry *parent)
198 LASSERT(parent != NULL);
199 remove_proc_entry(name, parent);
201 EXPORT_SYMBOL(lprocfs_remove_proc_entry);
/*
 * Create the proc directory \a name under \a parent and populate it from
 * \a list with lprocfs_add_vars(), passing \a data through.
 *
 * ERR_PTR(-ENOMEM) is returned on the proc_mkdir() failure path, and the new
 * directory is removed again on the lprocfs_add_vars() failure path.
 * NOTE(review): the conditions guarding both error paths and the final
 * return are not visible in this extract.
 */
203 struct proc_dir_entry *
204 lprocfs_register(const char *name, struct proc_dir_entry *parent,
205 struct lprocfs_vars *list, void *data)
207 struct proc_dir_entry *newchild;
209 newchild = proc_mkdir(name, parent);
211 return ERR_PTR(-ENOMEM);
214 int rc = lprocfs_add_vars(newchild, list, data);
/* Undo the directory creation when adding the entries failed. */
216 lprocfs_remove(&newchild);
222 EXPORT_SYMBOL(lprocfs_register);
224 /* Generic callbacks */
/*
 * seq_file show callback: print the UUID of the obd_device passed as \a data,
 * followed by a newline.  \a data must not be NULL (LASSERT).
 */
225 int lprocfs_uuid_seq_show(struct seq_file *m, void *data)
227 struct obd_device *obd = data;
229 LASSERT(obd != NULL);
230 seq_printf(m, "%s\n", obd->obd_uuid.uuid);
233 EXPORT_SYMBOL(lprocfs_uuid_seq_show);
/*
 * sysfs show handler for the "uuid" attribute: writes the device UUID and a
 * newline into \a buf and returns the sprintf() result.  The obd_device is
 * recovered from \a kobj with container_of().
 */
235 static ssize_t uuid_show(struct kobject *kobj, struct attribute *attr,
238 struct obd_device *obd = container_of(kobj, struct obd_device,
241 return sprintf(buf, "%s\n", obd->obd_uuid.uuid);
243 LUSTRE_RO_ATTR(uuid);
/*
 * sysfs show handler for "blocksize": queries obd_statfs() on the device's
 * self export and prints osfs.os_bsize.
 * The age argument is "now minus OBD_STATFS_CACHE_SECONDS".
 * NOTE(review): the rc check and the error return are not visible here.
 */
245 static ssize_t blocksize_show(struct kobject *kobj, struct attribute *attr,
248 struct obd_device *obd = container_of(kobj, struct obd_device,
250 struct obd_statfs osfs;
253 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
254 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
257 return sprintf(buf, "%u\n", osfs.os_bsize);
261 LUSTRE_RO_ATTR(blocksize);
/*
 * sysfs show handler for "kbytestotal": prints osfs.os_blocks scaled by the
 * block size expressed in units of 1024 bytes (os_bsize >> 10).
 * NOTE(review): the rc check and the error return are not visible here.
 */
263 static ssize_t kbytestotal_show(struct kobject *kobj, struct attribute *attr,
266 struct obd_device *obd = container_of(kobj, struct obd_device,
268 struct obd_statfs osfs;
271 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
272 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
275 u32 blk_size = osfs.os_bsize >> 10;
276 u64 result = osfs.os_blocks;
/*
 * "blk_size ?: 1" substitutes 1 when the block size is below 1024 bytes;
 * the multiplier is then rounded down to a power of two.
 */
278 result *= rounddown_pow_of_two(blk_size ?: 1);
279 return sprintf(buf, "%llu\n", result);
284 LUSTRE_RO_ATTR(kbytestotal);
/*
 * sysfs show handler for "kbytesfree": prints a value derived from
 * osfs.os_bfree and the block size in units of 1024 bytes (os_bsize >> 10).
 * NOTE(review): the body of the "while (blk_size >>= 1)" loop, the rc check
 * and the error return are not visible here.  Presumably the loop scales
 * result by the power-of-two block size -- confirm in full source.
 */
286 static ssize_t kbytesfree_show(struct kobject *kobj, struct attribute *attr,
289 struct obd_device *obd = container_of(kobj, struct obd_device,
291 struct obd_statfs osfs;
294 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
295 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
298 u32 blk_size = osfs.os_bsize >> 10;
299 u64 result = osfs.os_bfree;
/* Runs once per halving of blk_size until it reaches zero. */
301 while (blk_size >>= 1)
304 return sprintf(buf, "%llu\n", result);
309 LUSTRE_RO_ATTR(kbytesfree);
/*
 * sysfs show handler for "kbytesavail": prints a value derived from
 * osfs.os_bavail and the block size in units of 1024 bytes (os_bsize >> 10).
 * NOTE(review): the body of the "while (blk_size >>= 1)" loop, the rc check
 * and the error return are not visible here.  Presumably the loop scales
 * result by the power-of-two block size -- confirm in full source.
 */
311 static ssize_t kbytesavail_show(struct kobject *kobj, struct attribute *attr,
314 struct obd_device *obd = container_of(kobj, struct obd_device,
316 struct obd_statfs osfs;
319 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
320 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
323 u32 blk_size = osfs.os_bsize >> 10;
324 u64 result = osfs.os_bavail;
/* Runs once per halving of blk_size until it reaches zero. */
326 while (blk_size >>= 1)
329 return sprintf(buf, "%llu\n", result);
334 LUSTRE_RO_ATTR(kbytesavail);
/*
 * sysfs show handler for "filestotal": queries obd_statfs() on the device's
 * self export and prints osfs.os_files.
 * NOTE(review): the rc check and the error return are not visible here.
 */
336 static ssize_t filestotal_show(struct kobject *kobj, struct attribute *attr,
339 struct obd_device *obd = container_of(kobj, struct obd_device,
341 struct obd_statfs osfs;
344 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
345 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
348 return sprintf(buf, "%llu\n", osfs.os_files);
352 LUSTRE_RO_ATTR(filestotal);
/*
 * sysfs show handler for "filesfree": queries obd_statfs() on the device's
 * self export and prints osfs.os_ffree.
 * NOTE(review): the rc check and the error return are not visible here.
 */
354 static ssize_t filesfree_show(struct kobject *kobj, struct attribute *attr,
357 struct obd_device *obd = container_of(kobj, struct obd_device,
359 struct obd_statfs osfs;
362 rc = obd_statfs(NULL, obd->obd_self_export, &osfs,
363 ktime_get_seconds() - OBD_STATFS_CACHE_SECONDS,
366 return sprintf(buf, "%llu\n", osfs.os_ffree);
370 LUSTRE_RO_ATTR(filesfree);
/*
 * sysfs show handler that writes the remote UUID of the import's current
 * connection into \a buf, or "<none>" on the alternative branch.
 * The import is accessed inside with_imp_locked(), which also receives
 * "count" as its third argument.
 * NOTE(review): the condition selecting between the two sprintf() calls and
 * the return statement are not visible in this extract.
 */
372 ssize_t conn_uuid_show(struct kobject *kobj, struct attribute *attr, char *buf)
374 struct obd_device *obd = container_of(kobj, struct obd_device,
376 struct obd_import *imp;
377 struct ptlrpc_connection *conn;
380 with_imp_locked(obd, imp, count) {
381 conn = imp->imp_connection;
383 count = sprintf(buf, "%s\n", conn->c_remote_uuid.uuid);
385 count = sprintf(buf, "%s\n", "<none>");
390 EXPORT_SYMBOL(conn_uuid_show);
/*
 * seq_file show callback: print one line containing obd2cli_tgt(obd), the
 * import state name and, when imp_deactive is set, a "\tDEACTIVATED" suffix.
 * \a data is the obd_device and must not be NULL (LASSERT).
 * NOTE(review): the return statement is not visible in this extract.
 */
392 int lprocfs_server_uuid_seq_show(struct seq_file *m, void *data)
394 struct obd_device *obd = data;
395 struct obd_import *imp;
396 const char *imp_state_name = NULL;
399 LASSERT(obd != NULL);
400 with_imp_locked(obd, imp, rc) {
401 imp_state_name = ptlrpc_import_state_name(imp->imp_state);
402 seq_printf(m, "%s\t%s%s\n", obd2cli_tgt(obd), imp_state_name,
403 imp->imp_deactive ? "\tDEACTIVATED" : "");
408 EXPORT_SYMBOL(lprocfs_server_uuid_seq_show);
410 /** add up per-cpu counters */
413 * Lock statistics structure for access, possibly only on this CPU.
415 * The statistics struct may be allocated with per-CPU structures for
416 * efficient concurrent update (usually only on server-wide stats), or
417 * as a single global struct (e.g. for per-client or per-job statistics),
418 * so the required locking depends on the type of structure allocated.
420 * For per-CPU statistics, pin the thread to the current cpuid so that
421 * it will only access the statistics for that CPU. If the stats structure
422 * for the current CPU has not been allocated (or previously freed),
423 * allocate it now. The per-CPU statistics do not need locking since
424 * the thread is pinned to the CPU during update.
426 * For global statistics, lock the stats structure to prevent concurrent update.
428 * \param[in] stats statistics structure to lock
429 * \param[in] opc type of operation:
430 * LPROCFS_GET_SMP_ID: "lock" and return current CPU index
431 * for incrementing statistics for that CPU
432 * LPROCFS_GET_NUM_CPU: "lock" and return number of used
433 * CPU indices to iterate over all indices
434 * \param[out] flags CPU interrupt saved state for IRQ-safe locking
436 * \retval cpuid of current thread or number of allocated structs
437 * \retval negative on error (only for opc LPROCFS_GET_SMP_ID + per-CPU stats)
/*
 * Implementation summary, from the visible lines:
 *  - NOPERCPU stats: take ls_lock (the irqsave variant when the stats are
 *    flagged IRQ_SAFE) and return 1 for LPROCFS_GET_NUM_CPU, otherwise 0.
 *  - per-CPU stats, LPROCFS_GET_SMP_ID: call get_cpu() and allocate this
 *    CPU's slot with lprocfs_stats_alloc_one() if it is still NULL.
 *  - per-CPU stats, LPROCFS_GET_NUM_CPU: return ls_biggest_alloc_num.
 * NOTE(review): the switch header, the handling of a failed allocation and
 * the LPROCFS_GET_SMP_ID return value are not visible in this extract.
 */
439 int lprocfs_stats_lock(struct lprocfs_stats *stats,
440 enum lprocfs_stats_lock_ops opc,
441 unsigned long *flags)
443 if (stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU) {
444 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
445 spin_lock_irqsave(&stats->ls_lock, *flags);
447 spin_lock(&stats->ls_lock);
/* A NOPERCPU stats structure has exactly one slot, at index 0. */
448 return opc == LPROCFS_GET_NUM_CPU ? 1 : 0;
452 case LPROCFS_GET_SMP_ID: {
453 unsigned int cpuid = get_cpu();
/* Allocate this CPU's counters on first use. */
455 if (unlikely(!stats->ls_percpu[cpuid])) {
456 int rc = lprocfs_stats_alloc_one(stats, cpuid);
465 case LPROCFS_GET_NUM_CPU:
466 return stats->ls_biggest_alloc_num;
473 * Unlock statistics structure after access.
475 * Unlock the lock acquired via lprocfs_stats_lock() for global statistics,
476 * or unpin this thread from the current cpuid for per-CPU statistics.
478 * This function must be called using the same arguments as used when calling
479 * lprocfs_stats_lock() so that the correct operation can be performed.
481 * \param[in] stats statistics structure to unlock
482 * \param[in] opc type of operation (current cpuid or number of structs)
483 * \param[in] flags CPU interrupt saved state for IRQ-safe locking
/*
 * Implementation summary, from the visible lines: for NOPERCPU stats release
 * ls_lock with the unlock variant matching the IRQ_SAFE flag; otherwise only
 * the LPROCFS_GET_SMP_ID operation has work to do.
 * NOTE(review): the statement in the LPROCFS_GET_SMP_ID branch is not
 * visible in this extract.
 */
485 void lprocfs_stats_unlock(struct lprocfs_stats *stats,
486 enum lprocfs_stats_lock_ops opc,
487 unsigned long *flags)
489 if (stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU) {
490 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
491 spin_unlock_irqrestore(&stats->ls_lock, *flags);
493 spin_unlock(&stats->ls_lock);
494 } else if (opc == LPROCFS_GET_SMP_ID) {
499 /** add up per-cpu counters */
/*
 * Aggregate counter \a idx of \a stats over all allocated slots into \a cnt.
 *
 * \a cnt is zeroed first and lc_min starts at LC_MIN_INIT.  Under
 * lprocfs_stats_lock(LPROCFS_GET_NUM_CPU), lc_count, lc_sum and lc_sumsquare
 * are summed, lc_min takes the smallest and lc_max the largest per-slot value.
 * NOTE(review): the statements around the "set count to 1" comment (lines
 * not visible) appear to handle a special case before the lock is taken --
 * confirm in full source.
 */
500 void lprocfs_stats_collect(struct lprocfs_stats *stats, int idx,
501 struct lprocfs_counter *cnt)
503 unsigned int num_entry;
504 struct lprocfs_counter *percpu_cntr;
506 unsigned long flags = 0;
508 memset(cnt, 0, sizeof(*cnt));
511 /* set count to 1 to avoid divide-by-zero errs in callers */
516 cnt->lc_min = LC_MIN_INIT;
518 num_entry = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
520 for (i = 0; i < num_entry; i++) {
/* Slots that were never allocated are tested for here. */
521 if (!stats->ls_percpu[i])
523 percpu_cntr = lprocfs_stats_counter_get(stats, i, idx);
525 cnt->lc_count += percpu_cntr->lc_count;
526 cnt->lc_sum += percpu_cntr->lc_sum;
527 if (percpu_cntr->lc_min < cnt->lc_min)
528 cnt->lc_min = percpu_cntr->lc_min;
529 if (percpu_cntr->lc_max > cnt->lc_max)
530 cnt->lc_max = percpu_cntr->lc_max;
531 cnt->lc_sumsquare += percpu_cntr->lc_sumsquare;
534 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
/*
 * Print the import flags of \a imp to \a m.  "no_recov" is printed when the
 * owning obd has obd_no_recov set, then flag2str() is invoked for each of
 * the import flags listed below.
 * NOTE(review): flag2str is not defined in the visible lines, so the exact
 * output format per flag cannot be stated here.
 */
537 static void obd_import_flags2str(struct obd_import *imp, struct seq_file *m)
541 if (imp->imp_obd->obd_no_recov) {
542 seq_printf(m, "no_recov");
546 flag2str(imp, invalid);
547 flag2str(imp, deactive);
548 flag2str(imp, replayable);
549 flag2str(imp, delayed_recovery);
550 flag2str(imp, vbr_failed);
551 flag2str(imp, pingable);
552 flag2str(imp, resend_replay);
553 flag2str(imp, no_pinger_recover);
554 flag2str(imp, connect_tried);
/*
 * Names of the connect flags, indexed by bit position.  The printing
 * functions in this file use indices 0..63 for the bits of "flags" and
 * indices from 64 onward for the bits of "flags2", stopping at the first
 * NULL entry.  The hex value in each trailing comment is that entry's
 * flags2 bit mask.
 * NOTE(review): many entries are not visible in this extract.
 */
557 static const char *const obd_connect_names[] = {
576 "remote_client_by_force",
585 "mds_mds_connection",
588 "alt_checksum_algorithm",
624 "file_secctx", /* 0x01 */
625 "lockaheadv2", /* 0x02 */
626 "dir_migrate", /* 0x04 */
627 "sum_statfs", /* 0x08 */
628 "overstriping", /* 0x10 */
631 "lock_convert", /* 0x80 */
632 "archive_id_array", /* 0x100 */
633 "increasing_xid", /* 0x200 */
634 "selinux_policy", /* 0x400 */
637 "crush", /* 0x2000 */
638 "async_discard", /* 0x4000 */
639 "client_encryption", /* 0x8000 */
640 "fidmap", /* 0x10000 */
641 "getattr_pfid", /* 0x20000 */
642 "lseek", /* 0x40000 */
643 "dom_lvb", /* 0x80000 */
644 "reply_mbits", /* 0x100000 */
645 "mode_convert", /* 0x200000 */
646 "batch_rpc", /* 0x400000 */
647 "pcc_ro", /* 0x800000 */
648 "mne_nid_type", /* 0x1000000 */
649 "lock_contend", /* 0x2000000 */
650 "atomic_open_lock", /* 0x4000000 */
651 "name_encryption", /* 0x8000000 */
/*
 * Print the names of the connect flags in \a flags and \a flags2 to \a m,
 * separated by sep (the separator is omitted before the first item).
 *
 * The first loop walks the 64 bits of \a flags using obd_connect_names[0..63].
 * The second loop walks \a flags2 from obd_connect_names[64] until the NULL
 * terminator and is only reached when OBD_CONNECT_FLAGS2 is set in \a flags
 * and \a flags2 is non-zero.  Bits at or above the final mask that are still
 * set are printed as "unknown_<hex>" / "unknown2_<hex>".
 * NOTE(review): the per-bit test inside both loops and the updates of
 * "first" are not visible in this extract.
 */
655 void obd_connect_seq_flags2str(struct seq_file *m, __u64 flags, __u64 flags2,
662 for (i = 0, mask = 1; i < 64; i++, mask <<= 1) {
664 seq_printf(m, "%s%s",
665 first ? "" : sep, obd_connect_names[i]);
/* Any bits not covered by the loop above are reported numerically. */
670 if (flags & ~(mask - 1)) {
671 seq_printf(m, "%sunknown_%#llx",
672 first ? "" : sep, flags & ~(mask - 1));
676 if (!(flags & OBD_CONNECT_FLAGS2) || flags2 == 0)
679 for (i = 64, mask = 1; obd_connect_names[i] != NULL; i++, mask <<= 1) {
681 seq_printf(m, "%s%s",
682 first ? "" : sep, obd_connect_names[i]);
687 if (flags2 & ~(mask - 1)) {
688 seq_printf(m, "%sunknown2_%#llx",
689 first ? "" : sep, flags2 & ~(mask - 1));
693 EXPORT_SYMBOL(obd_connect_seq_flags2str);
/*
 * Buffer variant of obd_connect_seq_flags2str(): append the names of the
 * connect flags in \a flags and \a flags2 to \a page (capacity \a count),
 * separated by sep, accumulating the snprintf() results in ret.
 *
 * NOTE(review): snprintf() returns the length that would have been written,
 * so after truncation ret can exceed \a count and "count - ret" becomes
 * negative before it is passed as the size.  Consider scnprintf() -- confirm
 * against the full source, since parts of this function are not visible here
 * (per-bit tests, the format strings of the "unknown" cases, the returns).
 */
695 int obd_connect_flags2str(char *page, int count, __u64 flags, __u64 flags2,
701 for (i = 0, mask = 1; i < 64; i++, mask <<= 1) {
703 ret += snprintf(page + ret, count - ret, "%s%s",
704 ret ? sep : "", obd_connect_names[i]);
/* Bits not covered by the loop above. */
707 if (flags & ~(mask - 1))
708 ret += snprintf(page + ret, count - ret,
710 ret ? sep : "", flags & ~(mask - 1));
/* flags2 is only decoded when OBD_CONNECT_FLAGS2 is set and flags2 != 0. */
712 if (!(flags & OBD_CONNECT_FLAGS2) || flags2 == 0)
715 for (i = 64, mask = 1; obd_connect_names[i] != NULL; i++, mask <<= 1) {
717 ret += snprintf(page + ret, count - ret, "%s%s",
718 ret ? sep : "", obd_connect_names[i]);
721 if (flags2 & ~(mask - 1))
722 ret += snprintf(page + ret, count - ret,
724 ret ? sep : "", flags2 & ~(mask - 1));
728 EXPORT_SYMBOL(obd_connect_flags2str);
/*
 * Print the fields of the connect data \a ocd to \a m.  After the
 * "connect_data:" header, each field is printed only when the matching
 * OBD_CONNECT_* bit is set in ocd->ocd_connect_flags.
 * \a ocd must not be NULL (LASSERT).
 * NOTE(review): some format lines and arguments are not visible here.
 */
731 obd_connect_data_seqprint(struct seq_file *m, struct obd_connect_data *ocd)
735 LASSERT(ocd != NULL);
736 flags = ocd->ocd_connect_flags;
738 seq_printf(m, " connect_data:\n"
741 ocd->ocd_connect_flags,
743 if (flags & OBD_CONNECT_VERSION)
744 seq_printf(m, " target_version: %u.%u.%u.%u\n",
745 OBD_OCD_VERSION_MAJOR(ocd->ocd_version),
746 OBD_OCD_VERSION_MINOR(ocd->ocd_version),
747 OBD_OCD_VERSION_PATCH(ocd->ocd_version),
748 OBD_OCD_VERSION_FIX(ocd->ocd_version));
/* With OBD_CONNECT_MDS set, ocd_group is reported as the MDT index. */
749 if (flags & OBD_CONNECT_MDS)
750 seq_printf(m, " mdt_index: %d\n", ocd->ocd_group);
751 if (flags & OBD_CONNECT_GRANT)
752 seq_printf(m, " initial_grant: %d\n", ocd->ocd_grant);
753 if (flags & OBD_CONNECT_INDEX)
754 seq_printf(m, " target_index: %u\n", ocd->ocd_index);
755 if (flags & OBD_CONNECT_BRW_SIZE)
756 seq_printf(m, " max_brw_size: %d\n", ocd->ocd_brw_size);
757 if (flags & OBD_CONNECT_IBITS)
758 seq_printf(m, " ibits_known: %#llx\n",
759 ocd->ocd_ibits_known);
/*
 * Grant parameters are stored as bit counts / block counts / KiB and are
 * converted by shifting before printing.
 */
760 if (flags & OBD_CONNECT_GRANT_PARAM)
761 seq_printf(m, " grant_block_size: %d\n"
762 " grant_inode_size: %d\n"
763 " grant_max_extent_size: %d\n"
764 " grant_extent_tax: %d\n",
765 1 << ocd->ocd_grant_blkbits,
766 1 << ocd->ocd_grant_inobits,
767 ocd->ocd_grant_max_blks << ocd->ocd_grant_blkbits,
768 ocd->ocd_grant_tax_kb << 10);
769 if (flags & OBD_CONNECT_TRANSNO)
770 seq_printf(m, " first_transno: %#llx\n",
772 if (flags & OBD_CONNECT_CKSUM)
773 seq_printf(m, " cksum_types: %#x\n",
774 ocd->ocd_cksum_types);
775 if (flags & OBD_CONNECT_MAX_EASIZE)
776 seq_printf(m, " max_easize: %d\n", ocd->ocd_max_easize);
777 if (flags & OBD_CONNECT_MAXBYTES)
778 seq_printf(m, " max_object_bytes: %llu\n",
780 if (flags & OBD_CONNECT_MULTIMODRPCS)
781 seq_printf(m, " max_mod_rpcs: %hu\n",
782 ocd->ocd_maxmodrpcs);
/*
 * Print a multi-section report about import \a imp of \a obd to \a m:
 * connect flags and connect data, import flags, failover NIDs and current
 * connection, RPC counters with average wait time, service estimates,
 * transaction numbers, and per-direction (read/write) data averages.
 *
 * Called from lprocfs_import_seq_show() inside with_imp_locked().
 * NOTE(review): several statements, conditions and printf arguments are not
 * visible in this extract; the comments below describe visible lines only.
 */
785 static void lprocfs_import_seq_show_locked(struct seq_file *m,
786 struct obd_device *obd,
787 struct obd_import *imp)
789 char nidstr[LNET_NIDSTR_SIZE];
790 struct lprocfs_counter ret;
791 struct lprocfs_counter_header *header;
792 struct obd_import_conn *conn;
793 struct obd_connect_data *ocd;
798 ocd = &imp->imp_connect_data;
800 seq_printf(m, "import:\n"
804 " connect_flags: [ ",
807 ptlrpc_import_state_name(imp->imp_state));
808 obd_connect_seq_flags2str(m, imp->imp_connect_data.ocd_connect_flags,
809 imp->imp_connect_data.ocd_connect_flags2,
811 seq_printf(m, " ]\n");
812 obd_connect_data_seqprint(m, ocd);
813 seq_printf(m, " import_flags: [ ");
814 obd_import_flags2str(imp, m);
818 " failover_nids: [ ");
/* imp_lock is held while the connection list and current connection are read. */
819 spin_lock(&imp->imp_lock);
821 list_for_each_entry(conn, &imp->imp_conn_list, oic_item) {
822 libcfs_nidstr_r(&conn->oic_conn->c_peer.nid,
823 nidstr, sizeof(nidstr));
/* j serves as the "not the first item" indicator for the separator. */
824 seq_printf(m, "%s%s", j ? ", " : "", nidstr);
827 if (imp->imp_connection)
828 libcfs_nidstr_r(&imp->imp_connection->c_peer.nid,
829 nidstr, sizeof(nidstr));
831 strncpy(nidstr, "<none>", sizeof(nidstr));
833 " current_connection: %s\n"
834 " connection_attempts: %u\n"
836 " in-progress_invalidations: %u\n"
841 atomic_read(&imp->imp_inval_count),
842 ktime_get_real_seconds() - imp->imp_last_reply_time);
843 spin_unlock(&imp->imp_lock);
845 if (!obd->obd_svc_stats)
/* Average request wait time: the collected sum divided by the sample count. */
848 header = &obd->obd_svc_stats->ls_cnt_header[PTLRPC_REQWAIT_CNTR];
849 lprocfs_stats_collect(obd->obd_svc_stats, PTLRPC_REQWAIT_CNTR, &ret);
850 if (ret.lc_count != 0)
851 ret.lc_sum = div64_s64(ret.lc_sum, ret.lc_count);
854 seq_printf(m, " rpcs:\n"
856 " unregistering: %u\n"
858 " avg_waittime: %llu %s\n",
859 atomic_read(&imp->imp_inflight),
860 atomic_read(&imp->imp_unregistering),
861 atomic_read(&imp->imp_timeouts),
862 ret.lc_sum, header->lc_units);
/* k becomes the largest service estimate over the portals examined. */
865 for(j = 0; j < IMP_AT_MAX_PORTALS; j++) {
866 if (imp->imp_at.iat_portal[j] == 0)
868 k = max_t(unsigned int, k,
869 at_get(&imp->imp_at.iat_service_estimate[j]));
871 seq_printf(m, " service_estimates:\n"
872 " services: %u sec\n"
873 " network: %d sec\n",
875 at_get(&imp->imp_at.iat_net_latency));
877 seq_printf(m, " transactions:\n"
878 " last_replay: %llu\n"
879 " peer_committed: %llu\n"
880 " last_checked: %llu\n",
881 imp->imp_last_replay_transno,
882 imp->imp_peer_committed_transno,
883 imp->imp_last_transno_checked);
/* rw == 0 reports read averages, rw == 1 write averages. */
886 for (rw = 0; rw <= 1; rw++) {
887 lprocfs_stats_collect(obd->obd_svc_stats,
888 PTLRPC_LAST_CNTR + BRW_READ_BYTES + rw,
890 if (ret.lc_sum > 0 && ret.lc_count > 0) {
891 ret.lc_sum = div64_s64(ret.lc_sum, ret.lc_count);
892 seq_printf(m, " %s_data_averages:\n"
893 " bytes_per_rpc: %llu\n",
894 rw ? "write" : "read",
898 j = opcode_offset(OST_READ + rw) + EXTRA_MAX_OPCODES;
899 header = &obd->obd_svc_stats->ls_cnt_header[j];
900 lprocfs_stats_collect(obd->obd_svc_stats, j, &ret);
901 if (ret.lc_sum > 0 && ret.lc_count != 0) {
902 ret.lc_sum = div64_s64(ret.lc_sum, ret.lc_count);
903 seq_printf(m, " %s_per_rpc: %llu\n",
904 header->lc_units, ret.lc_sum);
/*
 * NOTE(review): k / j divides by j; the assignments to k and j and any
 * guard against j == 0 are not visible in this extract -- confirm.
 */
907 seq_printf(m, " MB_per_sec: %u.%.02u\n",
908 k / j, (100 * k / j) % 100);
/*
 * seq_file show callback for the import report: runs
 * lprocfs_import_seq_show_locked() inside with_imp_locked() for the
 * obd_device passed as \a data, which must not be NULL (LASSERT).
 * NOTE(review): the return statement is not visible in this extract.
 */
913 int lprocfs_import_seq_show(struct seq_file *m, void *data)
915 struct obd_device *obd = (struct obd_device *)data;
916 struct obd_import *imp;
919 LASSERT(obd != NULL);
920 with_imp_locked(obd, imp, rv)
921 lprocfs_import_seq_show_locked(m, obd, imp);
924 EXPORT_SYMBOL(lprocfs_import_seq_show);
/*
 * seq_file show callback: print the import's current state name followed by
 * its state history as "[ time, state ]" entries.
 *
 * The history is treated as a ring of IMP_STATE_HIST_LEN entries and is
 * walked starting at imp_state_hist_idx.
 * NOTE(review): the statement taken for entries with ish_state == 0 and the
 * return statement are not visible in this extract.
 */
926 int lprocfs_state_seq_show(struct seq_file *m, void *data)
928 struct obd_device *obd = (struct obd_device *)data;
929 struct obd_import *imp;
933 LASSERT(obd != NULL);
934 with_imp_locked(obd, imp, rc) {
935 seq_printf(m, "current_state: %s\n",
936 ptlrpc_import_state_name(imp->imp_state));
937 seq_printf(m, "state_history:\n");
938 k = imp->imp_state_hist_idx;
939 for (j = 0; j < IMP_STATE_HIST_LEN; j++) {
/* Index wraps around the ring, starting at position k. */
940 struct import_state_hist *ish =
941 &imp->imp_state_hist[(k + j) % IMP_STATE_HIST_LEN];
942 if (ish->ish_state == 0)
944 seq_printf(m, " - [ %lld, %s ]\n", (s64)ish->ish_time,
945 ptlrpc_import_state_name(ish->ish_state));
951 EXPORT_SYMBOL(lprocfs_state_seq_show);
/*
 * Print the AT_BINS history values of adaptive timeout \a at to \a m, each
 * as a 3-wide unsigned number followed by a space.
 * NOTE(review): anything printed after the loop and the return value are
 * not visible in this extract.
 */
953 int lprocfs_at_hist_helper(struct seq_file *m, struct adaptive_timeout *at)
956 for (i = 0; i < AT_BINS; i++)
957 seq_printf(m, "%3u ", at->at_hist[i]);
961 EXPORT_SYMBOL(lprocfs_at_hist_helper);
963 /* See also ptlrpc_lprocfs_timeouts_show_seq */
/*
 * Print adaptive-timeout information for import \a imp to \a m: the time of
 * the last reply, the network latency estimate, and one line per portal
 * with a non-zero iat_portal entry.  Each estimate line shows the current
 * and worst timeout, when the worst occurred, and the history bins.
 * \a obd must not be NULL (LASSERT).
 * NOTE(review): the statement taken for unused portals (iat_portal == 0) is
 * not visible in this extract.
 */
964 static void lprocfs_timeouts_seq_show_locked(struct seq_file *m,
965 struct obd_device *obd,
966 struct obd_import *imp)
968 timeout_t cur_timeout, worst_timeout;
969 time64_t now, worst_timestamp;
972 LASSERT(obd != NULL);
/* "now" is sampled once and used for every "ago" value below. */
974 now = ktime_get_real_seconds();
976 /* Some network health info for kicks */
977 seq_printf(m, "%-10s : %lld, %llds ago\n",
978 "last reply", (s64)imp->imp_last_reply_time,
979 (s64)(now - imp->imp_last_reply_time));
981 cur_timeout = at_get(&imp->imp_at.iat_net_latency);
982 worst_timeout = imp->imp_at.iat_net_latency.at_worst_timeout_ever;
983 worst_timestamp = imp->imp_at.iat_net_latency.at_worst_timestamp;
984 seq_printf(m, "%-10s : cur %3u worst %3u (at %lld, %llds ago) ",
985 "network", cur_timeout, worst_timeout, worst_timestamp,
986 now - worst_timestamp);
987 lprocfs_at_hist_helper(m, &imp->imp_at.iat_net_latency);
989 for(i = 0; i < IMP_AT_MAX_PORTALS; i++) {
990 struct adaptive_timeout *service_est;
992 if (imp->imp_at.iat_portal[i] == 0)
995 service_est = &imp->imp_at.iat_service_estimate[i];
996 cur_timeout = at_get(service_est);
997 worst_timeout = service_est->at_worst_timeout_ever;
998 worst_timestamp = service_est->at_worst_timestamp;
999 seq_printf(m, "portal %-2d : cur %3u worst %3u (at %lld, %llds ago) ",
1000 imp->imp_at.iat_portal[i], cur_timeout,
1001 worst_timeout, worst_timestamp,
1002 now - worst_timestamp);
1003 lprocfs_at_hist_helper(m, service_est);
/*
 * seq_file show callback for the timeouts report: runs
 * lprocfs_timeouts_seq_show_locked() inside with_imp_locked() for the
 * obd_device passed as \a data.
 * NOTE(review): the return statement is not visible in this extract.
 */
1007 int lprocfs_timeouts_seq_show(struct seq_file *m, void *data)
1009 struct obd_device *obd = (struct obd_device *)data;
1010 struct obd_import *imp;
1013 with_imp_locked(obd, imp, rc)
1014 lprocfs_timeouts_seq_show_locked(m, obd, imp);
1017 EXPORT_SYMBOL(lprocfs_timeouts_seq_show);
/*
 * seq_file show callback: print the import's connect flags as
 * "flags=<hex>" and "flags2=<hex>", followed by the flag names one per line
 * (obd_connect_seq_flags2str() with "\n" as separator) and a final newline.
 * NOTE(review): the return statement is not visible in this extract.
 */
1019 int lprocfs_connect_flags_seq_show(struct seq_file *m, void *data)
1021 struct obd_device *obd = data;
1024 struct obd_import *imp;
1027 with_imp_locked(obd, imp, rc) {
1028 flags = imp->imp_connect_data.ocd_connect_flags;
1029 flags2 = imp->imp_connect_data.ocd_connect_flags2;
1030 seq_printf(m, "flags=%#llx\n", flags);
1031 seq_printf(m, "flags2=%#llx\n", flags2);
1032 obd_connect_seq_flags2str(m, flags, flags2, "\n");
1033 seq_printf(m, "\n");
1038 EXPORT_SYMBOL(lprocfs_connect_flags_seq_show);
/* Attribute list containing the uuid attribute; one of the two lists lprocfs_obd_setup() installs. */
1040 static const struct attribute *obd_def_uuid_attrs[] = {
1041 &lustre_attr_uuid.attr,
/*
 * Attribute list with the statfs-derived attributes plus uuid; one of the
 * two lists lprocfs_obd_setup() installs.
 */
1045 static const struct attribute *obd_def_attrs[] = {
1046 &lustre_attr_blocksize.attr,
1047 &lustre_attr_kbytestotal.attr,
1048 &lustre_attr_kbytesfree.attr,
1049 &lustre_attr_kbytesavail.attr,
1050 &lustre_attr_filestotal.attr,
1051 &lustre_attr_filesfree.attr,
1052 &lustre_attr_uuid.attr,
/*
 * kobject release callback (installed as obd_ktype.release): signals
 * obd_kobj_unregister, which lprocfs_obd_cleanup() waits on after
 * kset_unregister().
 */
1056 static void obd_sysfs_release(struct kobject *kobj)
1058 struct obd_device *obd = container_of(kobj, struct obd_device,
1061 complete(&obd->obd_kobj_unregister);
/*
 * Register the sysfs, debugfs and procfs entries for \a obd.
 *
 * Visible steps: name and register obd_kset under the type's kobject, create
 * the sysfs attribute files, create the debugfs directory and its entries,
 * then register the proc directory unless one already exists or the type has
 * no typ_procroot.  If lprocfs_register() fails, the debugfs directory, the
 * sysfs files and the kset are torn down again.
 * NOTE(review): the condition that selects between the two attribute lists
 * (presumably \a uuid_only), several rc checks and the return statements are
 * not visible in this extract.
 */
1064 int lprocfs_obd_setup(struct obd_device *obd, bool uuid_only)
1066 struct ldebugfs_vars *debugfs_vars = NULL;
1069 if (!obd || obd->obd_magic != OBD_DEVICE_MAGIC)
1072 rc = kobject_set_name(&obd->obd_kset.kobj, "%s", obd->obd_name);
1076 obd->obd_ktype.sysfs_ops = &lustre_sysfs_ops;
1077 obd->obd_ktype.release = obd_sysfs_release;
1079 obd->obd_kset.kobj.parent = &obd->obd_type->typ_kobj;
1080 obd->obd_kset.kobj.ktype = &obd->obd_ktype;
/* Completed by obd_sysfs_release() when the kobject is released. */
1081 init_completion(&obd->obd_kobj_unregister);
1082 rc = kset_register(&obd->obd_kset);
1087 obd->obd_attrs = obd_def_uuid_attrs;
1089 obd->obd_attrs = obd_def_attrs;
1091 rc = sysfs_create_files(&obd->obd_kset.kobj, obd->obd_attrs);
1093 kset_unregister(&obd->obd_kset);
/* debugfs variables are only used when the type has no proc root. */
1097 if (!obd->obd_type->typ_procroot)
1098 debugfs_vars = obd->obd_debugfs_vars;
1099 obd->obd_debugfs_entry = debugfs_create_dir(
1100 obd->obd_name, obd->obd_type->typ_debugfs_entry);
1101 ldebugfs_add_vars(obd->obd_debugfs_entry, debugfs_vars, obd);
/* Skip proc registration if already registered or no proc root exists. */
1103 if (obd->obd_proc_entry || !obd->obd_type->typ_procroot)
1104 GOTO(already_registered, rc);
1106 obd->obd_proc_entry = lprocfs_register(obd->obd_name,
1107 obd->obd_type->typ_procroot,
1108 obd->obd_vars, obd);
1109 if (IS_ERR(obd->obd_proc_entry)) {
1110 rc = PTR_ERR(obd->obd_proc_entry);
1111 CERROR("error %d setting up lprocfs for %s\n",rc,obd->obd_name);
1112 obd->obd_proc_entry = NULL;
/* Unwind what was set up earlier in this function. */
1114 debugfs_remove_recursive(obd->obd_debugfs_entry);
1115 obd->obd_debugfs_entry = NULL;
1117 sysfs_remove_files(&obd->obd_kset.kobj, obd->obd_attrs);
1118 obd->obd_attrs = NULL;
1119 kset_unregister(&obd->obd_kset);
1125 EXPORT_SYMBOL(lprocfs_obd_setup);
/*
 * Remove the procfs, debugfs and sysfs entries of \a obd and clear the
 * corresponding pointers.  After kset_unregister() the function waits for
 * obd_kobj_unregister, which obd_sysfs_release() completes.
 * NOTE(review): the initial argument check, the statement taken when the
 * kset was never initialized, and the return values are not visible here.
 */
1127 int lprocfs_obd_cleanup(struct obd_device *obd)
1132 if (obd->obd_proc_exports_entry) {
1133 /* Should be no exports left */
1134 lprocfs_remove(&obd->obd_proc_exports_entry);
1135 obd->obd_proc_exports_entry = NULL;
1138 if (obd->obd_proc_entry) {
1139 lprocfs_remove(&obd->obd_proc_entry);
1140 obd->obd_proc_entry = NULL;
1143 debugfs_remove_recursive(obd->obd_debugfs_entry);
1144 obd->obd_debugfs_entry = NULL;
1146 /* obd device never allocated a kset */
1147 if (!obd->obd_kset.kobj.state_initialized)
1150 if (obd->obd_attrs) {
1151 sysfs_remove_files(&obd->obd_kset.kobj, obd->obd_attrs);
1152 obd->obd_attrs = NULL;
1155 kset_unregister(&obd->obd_kset);
/* Block until the kobject release callback has run. */
1156 wait_for_completion(&obd->obd_kobj_unregister);
1159 EXPORT_SYMBOL(lprocfs_obd_cleanup);
/*
 * Allocate the counter slot ls_percpu[\a cpuid] of per-CPU \a stats.
 *
 * Preconditions (LASSERT): the slot is still NULL and the stats are not
 * NOPERCPU.  On successful allocation, ls_biggest_alloc_num is raised to
 * cpuid + 1 if needed, and each counter's lc_min is set to LC_MIN_INIT.
 * NOTE(review): the return value and the handling of a failed allocation
 * are not visible in this extract; lprocfs_alloc_stats() treats a negative
 * return as failure.
 */
1161 int lprocfs_stats_alloc_one(struct lprocfs_stats *stats, unsigned int cpuid)
1163 struct lprocfs_counter *cntr;
1164 unsigned int percpusize;
1166 unsigned long flags = 0;
1169 LASSERT(stats->ls_percpu[cpuid] == NULL);
1170 LASSERT((stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU) == 0);
1172 percpusize = lprocfs_stats_counter_size(stats);
1173 LIBCFS_ALLOC_ATOMIC(stats->ls_percpu[cpuid], percpusize);
1174 if (stats->ls_percpu[cpuid]) {
/*
 * Checked once without the lock, then re-checked under ls_lock before
 * the update.
 */
1176 if (unlikely(stats->ls_biggest_alloc_num <= cpuid)) {
1177 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
1178 spin_lock_irqsave(&stats->ls_lock, flags);
1180 spin_lock(&stats->ls_lock);
1181 if (stats->ls_biggest_alloc_num <= cpuid)
1182 stats->ls_biggest_alloc_num = cpuid + 1;
1183 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE) {
1184 spin_unlock_irqrestore(&stats->ls_lock, flags);
1186 spin_unlock(&stats->ls_lock);
1189 /* initialize the ls_percpu[cpuid] non-zero counter */
1190 for (i = 0; i < stats->ls_num; ++i) {
1191 cntr = lprocfs_stats_counter_get(stats, cpuid, i);
1192 cntr->lc_min = LC_MIN_INIT;
/*
 * Allocate a statistics structure with \a num counters.
 *
 * The lprocfs_no_percpu_stats module parameter forces
 * LPROCFS_STATS_FLAG_NOPERCPU.  The structure is sized for num_entry
 * ls_percpu pointers.  NOPERCPU stats allocate their single counter set
 * immediately; IRQ_SAFE per-CPU stats allocate every slot up front.
 * lprocfs_free_stats() is called on the failure path.
 * NOTE(review): the argument checks, the num_entry value chosen for
 * NOPERCPU, the goto/return statements and the success return are not
 * visible in this extract.
 */
1198 struct lprocfs_stats *lprocfs_alloc_stats(unsigned int num,
1199 enum lprocfs_stats_flags flags)
1201 struct lprocfs_stats *stats;
1202 unsigned int num_entry;
1203 unsigned int percpusize = 0;
1209 if (lprocfs_no_percpu_stats != 0)
1210 flags |= LPROCFS_STATS_FLAG_NOPERCPU;
1212 if (flags & LPROCFS_STATS_FLAG_NOPERCPU)
1215 num_entry = num_possible_cpus();
1217 /* alloc percpu pointers for all possible cpu slots */
1218 LIBCFS_ALLOC(stats, offsetof(typeof(*stats), ls_percpu[num_entry]));
1222 stats->ls_num = num;
1223 stats->ls_flags = flags;
1224 stats->ls_init = ktime_get_real();
1225 spin_lock_init(&stats->ls_lock);
1227 /* alloc num of counter headers */
1228 CFS_ALLOC_PTR_ARRAY(stats->ls_cnt_header, stats->ls_num);
1229 if (!stats->ls_cnt_header)
1232 if ((flags & LPROCFS_STATS_FLAG_NOPERCPU) != 0) {
1233 /* contains only one set of counters */
1234 percpusize = lprocfs_stats_counter_size(stats);
1235 LIBCFS_ALLOC_ATOMIC(stats->ls_percpu[0], percpusize);
1236 if (!stats->ls_percpu[0])
1238 stats->ls_biggest_alloc_num = 1;
1239 } else if ((flags & LPROCFS_STATS_FLAG_IRQ_SAFE) != 0) {
1240 /* alloc all percpu data, currently only obd_memory uses this */
1241 for (i = 0; i < num_entry; ++i)
1242 if (lprocfs_stats_alloc_one(stats, i) < 0)
1249 lprocfs_free_stats(&stats);
1252 EXPORT_SYMBOL(lprocfs_alloc_stats);
/*
 * Free the statistics structure referenced by *\a statsh: every allocated
 * ls_percpu slot, the counter header array, and the structure itself (sized
 * by the same offsetof() expression used at allocation).
 * Nothing is freed when *statsh is NULL or has ls_num == 0 (the statement
 * taken in that case is not visible in this extract).
 * NOTE(review): whether *statsh is reset and the num_entry value used for
 * NOPERCPU stats are not visible here.
 */
1254 void lprocfs_free_stats(struct lprocfs_stats **statsh)
1256 struct lprocfs_stats *stats = *statsh;
1257 unsigned int num_entry;
1258 unsigned int percpusize;
1261 if (!stats || stats->ls_num == 0)
1265 if (stats->ls_flags & LPROCFS_STATS_FLAG_NOPERCPU)
1268 num_entry = num_possible_cpus();
1270 percpusize = lprocfs_stats_counter_size(stats);
1271 for (i = 0; i < num_entry; i++)
1272 if (stats->ls_percpu[i])
1273 LIBCFS_FREE(stats->ls_percpu[i], percpusize);
1274 if (stats->ls_cnt_header)
1275 CFS_FREE_PTR_ARRAY(stats->ls_cnt_header, stats->ls_num);
1276 LIBCFS_FREE(stats, offsetof(typeof(*stats), ls_percpu[num_entry]));
1278 EXPORT_SYMBOL(lprocfs_free_stats);
/*
 * Sum one \a field of counter \a idx over all allocated slots of \a stats,
 * using lprocfs_read_helper() per slot, while holding
 * lprocfs_stats_lock(LPROCFS_GET_NUM_CPU).
 * NOTE(review): the initial checks, the initialization of ret and the
 * return statement are not visible in this extract.
 */
1280 u64 lprocfs_stats_collector(struct lprocfs_stats *stats, int idx,
1281 enum lprocfs_fields_flags field)
1283 unsigned long flags = 0;
1284 unsigned int num_cpu;
1290 num_cpu = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
1291 for (i = 0; i < num_cpu; i++) {
1292 struct lprocfs_counter *cntr;
1294 if (!stats->ls_percpu[i])
1297 cntr = lprocfs_stats_counter_get(stats, i, idx);
1298 ret += lprocfs_read_helper(cntr, &stats->ls_cnt_header[idx],
1299 stats->ls_flags, field);
1301 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
1304 EXPORT_SYMBOL(lprocfs_stats_collector);
/*
 * Reset every counter in every allocated slot of \a stats: count, max, sum
 * and sumsquare go to 0 and min to LC_MIN_INIT (lc_sum_irq as well for
 * IRQ_SAFE stats).  ls_init is set to the current real time.  All of this
 * happens under lprocfs_stats_lock(LPROCFS_GET_NUM_CPU).
 */
1306 void lprocfs_clear_stats(struct lprocfs_stats *stats)
1308 struct lprocfs_counter *percpu_cntr;
1311 unsigned int num_entry;
1312 unsigned long flags = 0;
1314 num_entry = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
1316 for (i = 0; i < num_entry; i++) {
1317 if (!stats->ls_percpu[i])
1319 for (j = 0; j < stats->ls_num; j++) {
1320 percpu_cntr = lprocfs_stats_counter_get(stats, i, j);
1321 percpu_cntr->lc_count = 0;
1322 percpu_cntr->lc_min = LC_MIN_INIT;
1323 percpu_cntr->lc_max = 0;
1324 percpu_cntr->lc_sumsquare = 0;
1325 percpu_cntr->lc_sum = 0;
1326 if (stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE)
1327 percpu_cntr->lc_sum_irq = 0;
/* Restart the "start_time" reported in the stats header. */
1330 stats->ls_init = ktime_get_real();
1332 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
1334 EXPORT_SYMBOL(lprocfs_clear_stats);
/*
 * Write handler for a stats file: clears the statistics attached to the
 * seq_file with lprocfs_clear_stats().  The written data in \a buf is not
 * used by the visible lines.
 * NOTE(review): the return statement is not visible in this extract.
 */
1336 static ssize_t lprocfs_stats_seq_write(struct file *file,
1337 const char __user *buf,
1338 size_t len, loff_t *off)
1340 struct seq_file *seq = file->private_data;
1341 struct lprocfs_stats *stats = seq->private;
1343 lprocfs_clear_stats(stats);
/*
 * seq_file start callback: the iterator is the position pointer itself.
 * Returns \a pos while *pos is a valid counter index (< ls_num), else NULL.
 */
1348 static void *lprocfs_stats_seq_start(struct seq_file *p, loff_t *pos)
1350 struct lprocfs_stats *stats = p->private;
1352 return (*pos < stats->ls_num) ? pos : NULL;
/*
 * seq_file stop callback for the stats iterator.
 * NOTE(review): the body is not visible in this extract.
 */
1355 static void lprocfs_stats_seq_stop(struct seq_file *p, void *v)
/*
 * seq_file next callback: re-evaluates the position through
 * lprocfs_stats_seq_start().
 * NOTE(review): the statement that advances *pos is not visible in this
 * extract -- confirm in full source.
 */
1359 static void *lprocfs_stats_seq_next(struct seq_file *p, void *v, loff_t *pos)
1363 return lprocfs_stats_seq_start(p, pos);
1367 * print header of stats including snapshot_time, start_time and elapsed_time.
1369 * \param seq the file to print content to
1370 * \param now end time to calculate elapsed_time
1371 * \param ts_init start time to calculate elapsed_time
1372 * \param width the width of key to align them well
1373 * \param colon "" or ":"
1374 * \param show_units show units or not
1375 * \param prefix prefix (indent) before printing each line of header
1376 * to align them with other content
/*
 * Implementation notes, from the visible lines:
 *  - three lines are printed: snapshot_time (\a now), start_time
 *    (\a ts_init) and elapsed_time (now - ts_init), each as
 *    seconds.nanoseconds;
 *  - the key carries a trailing ':' only when \a colon is a non-empty string;
 *  - " secs.nsecs" is appended when \a show_units is true.
 * NOTE(review): tv_sec is cast to s64 but printed with %llu, so a negative
 * value (e.g. a negative elapsed time) would print as a large unsigned
 * number -- %lld would match the cast.
 */
1378 void lprocfs_stats_header(struct seq_file *seq, ktime_t now, ktime_t ts_init,
1379 int width, const char *colon, bool show_units,
1382 const char *units = show_units ? " secs.nsecs" : "";
1383 struct timespec64 ts;
1386 field = (colon && colon[0]) ? "snapshot_time:" : "snapshot_time";
1387 ts = ktime_to_timespec64(now);
1388 seq_printf(seq, "%s%-*s %llu.%09lu%s\n", prefix, width, field,
1389 (s64)ts.tv_sec, ts.tv_nsec, units);
1391 field = (colon && colon[0]) ? "start_time:" : "start_time";
1392 ts = ktime_to_timespec64(ts_init);
1393 seq_printf(seq, "%s%-*s %llu.%09lu%s\n", prefix, width, field,
1394 (s64)ts.tv_sec, ts.tv_nsec, units);
1396 field = (colon && colon[0]) ? "elapsed_time:" : "elapsed_time";
1397 ts = ktime_to_timespec64(ktime_sub(now, ts_init));
1398 seq_printf(seq, "%s%-*s %llu.%09lu%s\n", prefix, width, field,
1399 (s64)ts.tv_sec, ts.tv_nsec, units);
1401 EXPORT_SYMBOL(lprocfs_stats_header);
1403 /* seq file export of one lprocfs counter */
1404 static int lprocfs_stats_seq_show(struct seq_file *p, void *v)
1406 struct lprocfs_stats *stats = p->private;
1407 struct lprocfs_counter_header *hdr;
1408 struct lprocfs_counter ctr;
1409 int idx = *(loff_t *)v;
1412 lprocfs_stats_header(p, ktime_get_real(), stats->ls_init, 25,
1415 hdr = &stats->ls_cnt_header[idx];
1416 lprocfs_stats_collect(stats, idx, &ctr);
1418 if (ctr.lc_count == 0)
1421 seq_printf(p, "%-25s %lld samples [%s]", hdr->lc_name,
1422 ctr.lc_count, hdr->lc_units);
1424 if ((hdr->lc_config & LPROCFS_CNTR_AVGMINMAX) && ctr.lc_count > 0) {
1425 seq_printf(p, " %lld %lld %lld",
1426 ctr.lc_min, ctr.lc_max, ctr.lc_sum);
1427 if (hdr->lc_config & LPROCFS_CNTR_STDDEV)
1428 seq_printf(p, " %llu", ctr.lc_sumsquare);
1434 static const struct seq_operations lprocfs_stats_seq_sops = {
1435 .start = lprocfs_stats_seq_start,
1436 .stop = lprocfs_stats_seq_stop,
1437 .next = lprocfs_stats_seq_next,
1438 .show = lprocfs_stats_seq_show,
1441 static int lprocfs_stats_seq_open(struct inode *inode, struct file *file)
1443 struct seq_file *seq;
1446 rc = seq_open(file, &lprocfs_stats_seq_sops);
1449 seq = file->private_data;
1450 seq->private = inode->i_private ? inode->i_private : pde_data(inode);
1454 const struct file_operations ldebugfs_stats_seq_fops = {
1455 .owner = THIS_MODULE,
1456 .open = lprocfs_stats_seq_open,
1458 .write = lprocfs_stats_seq_write,
1459 .llseek = seq_lseek,
1460 .release = lprocfs_seq_release,
1462 EXPORT_SYMBOL(ldebugfs_stats_seq_fops);
1464 static const struct proc_ops lprocfs_stats_seq_fops = {
1465 PROC_OWNER(THIS_MODULE)
1466 .proc_open = lprocfs_stats_seq_open,
1467 .proc_read = seq_read,
1468 .proc_write = lprocfs_stats_seq_write,
1469 .proc_lseek = seq_lseek,
1470 .proc_release = lprocfs_seq_release,
1473 int lprocfs_register_stats(struct proc_dir_entry *root, const char *name,
1474 struct lprocfs_stats *stats)
1476 struct proc_dir_entry *entry;
1477 LASSERT(root != NULL);
1479 entry = proc_create_data(name, 0644, root,
1480 &lprocfs_stats_seq_fops, stats);
1485 EXPORT_SYMBOL(lprocfs_register_stats);
1487 void lprocfs_counter_init(struct lprocfs_stats *stats, int index,
1488 unsigned conf, const char *name, const char *units)
1490 struct lprocfs_counter_header *header;
1491 struct lprocfs_counter *percpu_cntr;
1492 unsigned long flags = 0;
1494 unsigned int num_cpu;
1496 LASSERT(stats != NULL);
1498 header = &stats->ls_cnt_header[index];
1499 LASSERTF(header != NULL, "Failed to allocate stats header:[%d]%s/%s\n",
1500 index, name, units);
1502 header->lc_config = conf;
1503 header->lc_name = name;
1504 header->lc_units = units;
1506 num_cpu = lprocfs_stats_lock(stats, LPROCFS_GET_NUM_CPU, &flags);
1507 for (i = 0; i < num_cpu; ++i) {
1508 if (!stats->ls_percpu[i])
1510 percpu_cntr = lprocfs_stats_counter_get(stats, i, index);
1511 percpu_cntr->lc_count = 0;
1512 percpu_cntr->lc_min = LC_MIN_INIT;
1513 percpu_cntr->lc_max = 0;
1514 percpu_cntr->lc_sumsquare = 0;
1515 percpu_cntr->lc_sum = 0;
1516 if ((stats->ls_flags & LPROCFS_STATS_FLAG_IRQ_SAFE) != 0)
1517 percpu_cntr->lc_sum_irq = 0;
1519 lprocfs_stats_unlock(stats, LPROCFS_GET_NUM_CPU, &flags);
1521 EXPORT_SYMBOL(lprocfs_counter_init);
1523 static const char * const mps_stats[] = {
1524 [LPROC_MD_CLOSE] = "close",
1525 [LPROC_MD_CREATE] = "create",
1526 [LPROC_MD_ENQUEUE] = "enqueue",
1527 [LPROC_MD_GETATTR] = "getattr",
1528 [LPROC_MD_INTENT_LOCK] = "intent_lock",
1529 [LPROC_MD_LINK] = "link",
1530 [LPROC_MD_RENAME] = "rename",
1531 [LPROC_MD_SETATTR] = "setattr",
1532 [LPROC_MD_FSYNC] = "fsync",
1533 [LPROC_MD_READ_PAGE] = "read_page",
1534 [LPROC_MD_UNLINK] = "unlink",
1535 [LPROC_MD_SETXATTR] = "setxattr",
1536 [LPROC_MD_GETXATTR] = "getxattr",
1537 [LPROC_MD_INTENT_GETATTR_ASYNC] = "intent_getattr_async",
1538 [LPROC_MD_REVALIDATE_LOCK] = "revalidate_lock",
1541 int lprocfs_alloc_md_stats(struct obd_device *obd,
1542 unsigned int num_private_stats)
1544 struct lprocfs_stats *stats;
1545 unsigned int num_stats;
1549 * TODO Ensure that this function is only used where
1550 * appropriate by adding an assertion to the effect that
1551 * obd->obd_type->typ_md_ops is not NULL. We can't do this now
1552 * because mdt_procfs_init() uses this function to allocate
1553 * the stats backing /proc/fs/lustre/mdt/.../md_stats but the
1554 * mdt layer does not use the md_ops interface. This is
1555 * confusing and a waste of memory. See LU-2484.
1557 LASSERT(obd->obd_proc_entry != NULL);
1558 LASSERT(obd->obd_md_stats == NULL);
1560 num_stats = ARRAY_SIZE(mps_stats) + num_private_stats;
1561 stats = lprocfs_alloc_stats(num_stats, 0);
1565 for (i = 0; i < ARRAY_SIZE(mps_stats); i++) {
1566 lprocfs_counter_init(stats, i, 0, mps_stats[i], "reqs");
1567 if (!stats->ls_cnt_header[i].lc_name) {
1568 CERROR("Missing md_stat initializer md_op operation at offset %d. Aborting.\n",
1574 rc = lprocfs_register_stats(obd->obd_proc_entry, "md_stats", stats);
1576 lprocfs_free_stats(&stats);
1578 obd->obd_md_stats = stats;
1583 EXPORT_SYMBOL(lprocfs_alloc_md_stats);
1585 void lprocfs_free_md_stats(struct obd_device *obd)
1587 struct lprocfs_stats *stats = obd->obd_md_stats;
1590 obd->obd_md_stats = NULL;
1591 lprocfs_free_stats(&stats);
1594 EXPORT_SYMBOL(lprocfs_free_md_stats);
1596 void lprocfs_init_ldlm_stats(struct lprocfs_stats *ldlm_stats)
1598 lprocfs_counter_init(ldlm_stats,
1599 LDLM_ENQUEUE - LDLM_FIRST_OPC,
1600 0, "ldlm_enqueue", "reqs");
1601 lprocfs_counter_init(ldlm_stats,
1602 LDLM_CONVERT - LDLM_FIRST_OPC,
1603 0, "ldlm_convert", "reqs");
1604 lprocfs_counter_init(ldlm_stats,
1605 LDLM_CANCEL - LDLM_FIRST_OPC,
1606 0, "ldlm_cancel", "reqs");
1607 lprocfs_counter_init(ldlm_stats,
1608 LDLM_BL_CALLBACK - LDLM_FIRST_OPC,
1609 0, "ldlm_bl_callback", "reqs");
1610 lprocfs_counter_init(ldlm_stats,
1611 LDLM_CP_CALLBACK - LDLM_FIRST_OPC,
1612 0, "ldlm_cp_callback", "reqs");
1613 lprocfs_counter_init(ldlm_stats,
1614 LDLM_GL_CALLBACK - LDLM_FIRST_OPC,
1615 0, "ldlm_gl_callback", "reqs");
1617 EXPORT_SYMBOL(lprocfs_init_ldlm_stats);
1619 __s64 lprocfs_read_helper(struct lprocfs_counter *lc,
1620 struct lprocfs_counter_header *header,
1621 enum lprocfs_stats_flags flags,
1622 enum lprocfs_fields_flags field)
1630 case LPROCFS_FIELDS_FLAGS_CONFIG:
1631 ret = header->lc_config;
1633 case LPROCFS_FIELDS_FLAGS_SUM:
1635 if ((flags & LPROCFS_STATS_FLAG_IRQ_SAFE) != 0)
1636 ret += lc->lc_sum_irq;
1638 case LPROCFS_FIELDS_FLAGS_MIN:
1641 case LPROCFS_FIELDS_FLAGS_MAX:
1644 case LPROCFS_FIELDS_FLAGS_AVG:
1645 ret = (lc->lc_max - lc->lc_min) / 2;
1647 case LPROCFS_FIELDS_FLAGS_SUMSQUARE:
1648 ret = lc->lc_sumsquare;
1650 case LPROCFS_FIELDS_FLAGS_COUNT:
1658 EXPORT_SYMBOL(lprocfs_read_helper);
1661 * string_to_size - convert ASCII string representing a numerical
1662 * value with optional units to 64-bit binary value
1664 * @size: The numerical value extract out of @buffer
1665 * @buffer: passed in string to parse
1666 * @count: length of the @buffer
1668 * This function returns a 64-bit binary value if @buffer contains a valid
1669 * numerical string. The string is parsed to 3 significant figures after
1670 * the decimal point. Support the string containing an optional units at
1671 * the end which can be base 2 or base 10 in value. If no units are given
1672 * the string is assumed to just a numerical value.
1674 * Returns: @count if the string is successfully parsed,
1675 * -errno on invalid input strings. Error values:
1677 * - ``-EINVAL``: @buffer is not a proper numerical string
1678 * - ``-EOVERFLOW``: results does not fit into 64 bits.
1679 * - ``-E2BIG ``: @buffer is too large (not a valid number)
1681 int string_to_size(u64 *size, const char *buffer, size_t count)
1683 /* For string_get_size() it can support values above exabytes,
1684 * (ZiB, YiB) due to breaking the return value into a size and
1685 * bulk size to avoid 64 bit overflow. We don't break the size
1686 * up into block size units so we don't support ZiB or YiB.
1688 static const char *const units_10[] = {
1689 "kB", "MB", "GB", "TB", "PB", "EB",
1691 static const char *const units_2[] = {
1692 "K", "M", "G", "T", "P", "E",
1694 static const char *const *const units_str[] = {
1695 [STRING_UNITS_2] = units_2,
1696 [STRING_UNITS_10] = units_10,
1698 static const unsigned int coeff[] = {
1699 [STRING_UNITS_10] = 1000,
1700 [STRING_UNITS_2] = 1024,
1702 enum string_size_units unit = STRING_UNITS_2;
1703 u64 whole, blk_size = 1;
1704 char kernbuf[22], *end;
1709 if (count >= sizeof(kernbuf)) {
1710 CERROR("count %zd > buffer %zd\n", count, sizeof(kernbuf));
1715 /* The "iB" suffix is optionally allowed for indicating base-2 numbers.
1716 * If suffix is only "B" and not "iB" then we treat it as base-10.
1718 end = strstr(buffer, "B");
1719 if (end && *(end - 1) != 'i')
1720 unit = STRING_UNITS_10;
1722 i = unit == STRING_UNITS_2 ? ARRAY_SIZE(units_2) - 1 :
1723 ARRAY_SIZE(units_10) - 1;
1725 end = strnstr(buffer, units_str[unit][i], count);
1728 blk_size *= coeff[unit];
1734 /* as 'B' is a substring of all units, we need to handle it
1738 /* 'B' is only acceptable letter at this point */
1739 end = strnchr(buffer, count, 'B');
1743 if (count - len > 2 ||
1744 (count - len == 2 && strcmp(end, "B\n") != 0)) {
1745 CDEBUG(D_INFO, "unknown suffix '%s'\n", buffer);
1749 /* kstrtoull will error out if it has non digits */
1753 end = strnchr(buffer, count, '.');
1755 /* need to limit 3 decimal places */
1756 char rem[4] = "000";
1763 /* limit to 3 decimal points */
1764 off = min_t(size_t, 3, strspn(end, "0123456789"));
1765 /* need to limit frac_d to a u32 */
1766 memcpy(rem, end, off);
1767 rc = kstrtoull(rem, 10, &frac);
1771 if (fls64(frac) + fls64(blk_size) - 1 > 64)
1779 snprintf(kernbuf, sizeof(kernbuf), "%.*s", (int)len, buffer);
1780 rc = kstrtoull(kernbuf, 10, &whole);
1784 if (whole != 0 && fls64(whole) + fls64(blk_size) - 1 > 64)
1787 *size += whole * blk_size;
1791 EXPORT_SYMBOL(string_to_size);
1794 * sysfs_memparse - parse a ASCII string to 64-bit binary value,
1795 * with optional units
1797 * @buffer: kernel pointer to input string
1798 * @count: number of bytes in the input @buffer
1799 * @val: (output) binary value returned to caller
1800 * @defunit: default unit suffix to use if none is provided
1802 * Parses a string into a number. The number stored at @buffer is
1803 * potentially suffixed with K, M, G, T, P, E. Besides these other
1804 * valid suffix units are shown in the string_to_size() function.
1805 * If the string lacks a suffix then the defunit is used. The defunit
1806 * should be given as a binary unit (e.g. MiB) as that is the standard
1807 * for tunables in Lustre. If no unit suffix is given (e.g. 'G'), then
1808 * it is assumed to be in binary units.
1810 * Returns: 0 on success or -errno on failure.
1812 int sysfs_memparse(const char *buffer, size_t count, u64 *val,
1813 const char *defunit)
1815 const char *param = buffer;
1819 count = strlen(buffer);
1820 while (count > 0 && isspace(buffer[count - 1]))
1826 /* If there isn't already a unit on this value, append @defunit.
1827 * Units of 'B' don't affect the value, so don't bother adding.
1829 if (!isalpha(buffer[count - 1]) && defunit[0] != 'B') {
1830 if (count + 3 >= sizeof(tmp_buf)) {
1831 CERROR("count %zd > size %zd\n", count, sizeof(param));
1835 scnprintf(tmp_buf, sizeof(tmp_buf), "%.*s%s", (int)count,
1838 count = strlen(param);
1841 rc = string_to_size(val, param, count);
1843 return rc < 0 ? rc : 0;
1845 EXPORT_SYMBOL(sysfs_memparse);
/*
 * Find the first occurrence of the string @s2 within the first @len bytes
 * of @s1.  The comparison is done with memcmp(), so a NUL byte in @s1 does
 * not end the search.
 *
 * Returns a pointer to the match, @s1 itself when @s2 is empty, or NULL
 * when @s2 does not occur completely inside the first @len bytes.
 */
char *lprocfs_strnstr(const char *s1, const char *s2, size_t len)
{
	const size_t needle_len = strlen(s2);
	const char *cursor;

	if (needle_len == 0)
		return (char *)s1;

	for (cursor = s1; len >= needle_len; cursor++, len--) {
		if (memcmp(cursor, s2, needle_len) == 0)
			return (char *)cursor;
	}

	return NULL;
}
1862 EXPORT_SYMBOL(lprocfs_strnstr);
/**
 * Find the string \a name in the input \a buffer, and return a pointer to the
 * value immediately following \a name, reducing \a count appropriately.
 * If \a name is not found the original \a buffer is returned.
 *
 * Whitespace between \a name and the value is skipped.  The value is the
 * run of alphanumeric characters that follows; on a match \a count is set
 * to its length, otherwise \a count is left unchanged.
 */
char *lprocfs_find_named_value(const char *buffer, const char *name,
				size_t *count)
{
	const char *limit = buffer + *count;
	size_t value_len = 0;
	char *cur;

	/* there is no strnstr() in rhel5 and ubuntu kernels */
	cur = lprocfs_strnstr(buffer, name, *count);
	if (cur == NULL)
		return (char *)buffer;

	cur += strlen(name);			/* skip prefix */
	while (cur < limit && isspace(*cur))	/* skip separator */
		cur++;

	for (; cur < limit && isalnum(*cur); cur++)
		value_len++;

	*count = value_len;

	return cur - value_len;
}
EXPORT_SYMBOL(lprocfs_find_named_value);
/*
 * Create a proc entry under parent with proc_create_data(), passing it
 * name, mode, seq_fops and data.
 *
 * The LASSERT requires the write bits of mode (0222) to agree with whether
 * seq_fops provides a proc_write handler.
 *
 * NOTE(review): the remaining parameter declarations and the return
 * handling are not visible in this excerpt -- confirm against the full
 * file before relying on them.
 */
1894 int lprocfs_seq_create(struct proc_dir_entry *parent,
1897 const struct proc_ops *seq_fops,
1900 struct proc_dir_entry *entry;
1903 /* Disallow secretly (un)writable entries. */
1904 LASSERT(!seq_fops->proc_write == !(mode & 0222));
1906 entry = proc_create_data(name, mode, parent, seq_fops, data);
1913 EXPORT_SYMBOL(lprocfs_seq_create);
/*
 * Convenience wrapper: create a seq-file proc entry below the proc
 * directory of obd (obd->obd_proc_entry) by forwarding name, mode,
 * seq_fops and data to lprocfs_seq_create() and returning its result.
 */
1915 int lprocfs_obd_seq_create(struct obd_device *obd,
1918 const struct proc_ops *seq_fops,
1921 return lprocfs_seq_create(obd->obd_proc_entry, name,
1922 mode, seq_fops, data);
1924 EXPORT_SYMBOL(lprocfs_obd_seq_create);
1926 void lprocfs_oh_tally(struct obd_histogram *oh, unsigned int value)
1928 if (value >= OBD_HIST_MAX)
1929 value = OBD_HIST_MAX - 1;
1931 spin_lock(&oh->oh_lock);
1932 oh->oh_buckets[value]++;
1933 spin_unlock(&oh->oh_lock);
1935 EXPORT_SYMBOL(lprocfs_oh_tally);
1937 void lprocfs_oh_tally_log2(struct obd_histogram *oh, unsigned int value)
1939 unsigned int val = 0;
1941 if (likely(value != 0))
1942 val = min(fls(value - 1), OBD_HIST_MAX);
1944 lprocfs_oh_tally(oh, val);
1946 EXPORT_SYMBOL(lprocfs_oh_tally_log2);
1948 unsigned long lprocfs_oh_sum(struct obd_histogram *oh)
1950 unsigned long ret = 0;
1953 for (i = 0; i < OBD_HIST_MAX; i++)
1954 ret += oh->oh_buckets[i];
1957 EXPORT_SYMBOL(lprocfs_oh_sum);
1959 void lprocfs_oh_clear(struct obd_histogram *oh)
1961 spin_lock(&oh->oh_lock);
1962 memset(oh->oh_buckets, 0, sizeof(oh->oh_buckets));
1963 spin_unlock(&oh->oh_lock);
1965 EXPORT_SYMBOL(lprocfs_oh_clear);
1967 void lprocfs_oh_tally_pcpu(struct obd_hist_pcpu *oh,
1970 if (value >= OBD_HIST_MAX)
1971 value = OBD_HIST_MAX - 1;
1973 percpu_counter_inc(&oh->oh_pc_buckets[value]);
1975 EXPORT_SYMBOL(lprocfs_oh_tally_pcpu);
1977 void lprocfs_oh_tally_log2_pcpu(struct obd_hist_pcpu *oh,
1980 unsigned int val = 0;
1982 if (likely(value != 0))
1983 val = min(fls(value - 1), OBD_HIST_MAX);
1985 lprocfs_oh_tally_pcpu(oh, val);
1987 EXPORT_SYMBOL(lprocfs_oh_tally_log2_pcpu);
1989 unsigned long lprocfs_oh_counter_pcpu(struct obd_hist_pcpu *oh,
1992 return percpu_counter_sum(&oh->oh_pc_buckets[value]);
1994 EXPORT_SYMBOL(lprocfs_oh_counter_pcpu);
1996 unsigned long lprocfs_oh_sum_pcpu(struct obd_hist_pcpu *oh)
1998 unsigned long ret = 0;
2001 for (i = 0; i < OBD_HIST_MAX; i++)
2002 ret += percpu_counter_sum(&oh->oh_pc_buckets[i]);
2006 EXPORT_SYMBOL(lprocfs_oh_sum_pcpu);
2008 int lprocfs_oh_alloc_pcpu(struct obd_hist_pcpu *oh)
2012 if (oh->oh_initialized)
2015 for (i = 0; i < OBD_HIST_MAX; i++) {
2016 rc = percpu_counter_init(&oh->oh_pc_buckets[i], 0, GFP_KERNEL);
2021 oh->oh_initialized = true;
2026 for (i--; i >= 0; i--)
2027 percpu_counter_destroy(&oh->oh_pc_buckets[i]);
2031 EXPORT_SYMBOL(lprocfs_oh_alloc_pcpu);
2033 void lprocfs_oh_clear_pcpu(struct obd_hist_pcpu *oh)
2037 for (i = 0; i < OBD_HIST_MAX; i++)
2038 percpu_counter_set(&oh->oh_pc_buckets[i], 0);
2040 EXPORT_SYMBOL(lprocfs_oh_clear_pcpu);
2042 void lprocfs_oh_release_pcpu(struct obd_hist_pcpu *oh)
2046 if (!oh->oh_initialized)
2049 for (i = 0; i < OBD_HIST_MAX; i++)
2050 percpu_counter_destroy(&oh->oh_pc_buckets[i]);
2052 oh->oh_initialized = false;
2054 EXPORT_SYMBOL(lprocfs_oh_release_pcpu);
2056 ssize_t lustre_attr_show(struct kobject *kobj,
2057 struct attribute *attr, char *buf)
2059 struct lustre_attr *a = container_of(attr, struct lustre_attr, attr);
2061 return a->show ? a->show(kobj, attr, buf) : 0;
2063 EXPORT_SYMBOL_GPL(lustre_attr_show);
2065 ssize_t lustre_attr_store(struct kobject *kobj, struct attribute *attr,
2066 const char *buf, size_t len)
2068 struct lustre_attr *a = container_of(attr, struct lustre_attr, attr);
2070 return a->store ? a->store(kobj, attr, buf, len) : len;
2072 EXPORT_SYMBOL_GPL(lustre_attr_store);
2074 const struct sysfs_ops lustre_sysfs_ops = {
2075 .show = lustre_attr_show,
2076 .store = lustre_attr_store,
2078 EXPORT_SYMBOL_GPL(lustre_sysfs_ops);
2080 int lprocfs_obd_max_pages_per_rpc_seq_show(struct seq_file *m, void *data)
2082 struct obd_device *obd = data;
2083 struct client_obd *cli = &obd->u.cli;
2085 spin_lock(&cli->cl_loi_list_lock);
2086 seq_printf(m, "%d\n", cli->cl_max_pages_per_rpc);
2087 spin_unlock(&cli->cl_loi_list_lock);
2090 EXPORT_SYMBOL(lprocfs_obd_max_pages_per_rpc_seq_show);
/*
 * Write handler for max_pages_per_rpc of a client obd.
 *
 * The user string is copied into a local buffer and parsed with
 * sysfs_memparse() using "B" as the default unit.  The parsed value is then
 * rounded up to a chunk multiple and range checked against the connect
 * data of the import before it is stored, under cl_loi_list_lock, in
 * cli->cl_max_pages_per_rpc, after which client_adjust_max_dirty() is
 * called.
 *
 * NOTE(review): several lines of this function (local declarations, the
 * error returns and the final return) are not visible in this excerpt.
 */
2092 ssize_t lprocfs_obd_max_pages_per_rpc_seq_write(struct file *file,
2093 const char __user *buffer,
2094 size_t count, loff_t *off)
2096 struct seq_file *m = file->private_data;
2097 struct obd_device *obd = m->private;
2098 struct client_obd *cli = &obd->u.cli;
2099 struct obd_import *imp;
2100 struct obd_connect_data *ocd;
/* leave room for the terminating NUL written below */
2105 if (count > sizeof(kernbuf) - 1)
2108 if (copy_from_user(kernbuf, buffer, count))
2111 kernbuf[count] = '\0';
2113 rc = sysfs_memparse(kernbuf, count, &val, "B");
2117 /* if the max_pages is specified in bytes, convert to pages */
2118 if (val >= ONE_MB_BRW_SIZE)
2121 with_imp_locked(obd, imp, rc) {
2122 ocd = &imp->imp_connect_data;
/* mask that clears the low (cl_chunkbits - PAGE_SHIFT) bits */
2123 chunk_mask = ~((1 << (cli->cl_chunkbits - PAGE_SHIFT)) - 1);
2124 /* max_pages_per_rpc must be chunk aligned */
2125 val = (val + ~chunk_mask) & chunk_mask;
/* reject 0 and anything above ocd_brw_size (in pages) when that is set */
2126 if (val == 0 || (ocd->ocd_brw_size != 0 &&
2127 val > ocd->ocd_brw_size >> PAGE_SHIFT)) {
2130 spin_lock(&cli->cl_loi_list_lock);
2131 cli->cl_max_pages_per_rpc = val;
2132 client_adjust_max_dirty(cli);
2133 spin_unlock(&cli->cl_loi_list_lock);
2139 EXPORT_SYMBOL(lprocfs_obd_max_pages_per_rpc_seq_write);
2141 ssize_t short_io_bytes_show(struct kobject *kobj, struct attribute *attr,
2144 struct obd_device *obd = container_of(kobj, struct obd_device,
2146 struct client_obd *cli = &obd->u.cli;
2149 spin_lock(&cli->cl_loi_list_lock);
2150 rc = sprintf(buf, "%d\n", cli->cl_max_short_io_bytes);
2151 spin_unlock(&cli->cl_loi_list_lock);
2154 EXPORT_SYMBOL(short_io_bytes_show);
2156 /* Used to catch people who think they're specifying pages. */
2157 #define MIN_SHORT_IO_BYTES 64U
2159 ssize_t short_io_bytes_store(struct kobject *kobj, struct attribute *attr,
2160 const char *buffer, size_t count)
2162 struct obd_device *obd = container_of(kobj, struct obd_device,
2164 struct client_obd *cli = &obd->u.cli;
2168 if (strcmp(buffer, "-1") == 0) {
2169 val = OBD_DEF_SHORT_IO_BYTES;
2171 rc = sysfs_memparse(buffer, count, &val, "B");
2176 if (val && (val < MIN_SHORT_IO_BYTES || val > LNET_MTU))
2177 GOTO(out, rc = -ERANGE);
2181 spin_lock(&cli->cl_loi_list_lock);
2182 cli->cl_max_short_io_bytes = min_t(u64, val, OST_MAX_SHORT_IO_BYTES);
2183 spin_unlock(&cli->cl_loi_list_lock);
2188 EXPORT_SYMBOL(short_io_bytes_store);
2190 int lprocfs_wr_root_squash(const char __user *buffer, unsigned long count,
2191 struct root_squash_info *squash, char *name)
2194 char kernbuf[64], *tmp, *errmsg;
2195 unsigned long uid, gid;
2198 if (count >= sizeof(kernbuf)) {
2199 errmsg = "string too long";
2200 GOTO(failed_noprint, rc = -EINVAL);
2202 if (copy_from_user(kernbuf, buffer, count)) {
2203 errmsg = "bad address";
2204 GOTO(failed_noprint, rc = -EFAULT);
2206 kernbuf[count] = '\0';
2208 /* look for uid gid separator */
2209 tmp = strchr(kernbuf, ':');
2211 errmsg = "needs uid:gid format";
2212 GOTO(failed, rc = -EINVAL);
2218 if (kstrtoul(kernbuf, 0, &uid) != 0) {
2220 GOTO(failed, rc = -EINVAL);
2224 if (kstrtoul(tmp, 0, &gid) != 0) {
2226 GOTO(failed, rc = -EINVAL);
2229 squash->rsi_uid = uid;
2230 squash->rsi_gid = gid;
2232 LCONSOLE_INFO("%s: root_squash is set to %u:%u\n",
2233 name, squash->rsi_uid, squash->rsi_gid);
2241 CWARN("%s: failed to set root_squash to \"%s\", %s, rc = %d\n",
2242 name, kernbuf, errmsg, rc);
2245 CWARN("%s: failed to set root_squash due to %s, rc = %d\n",
2249 EXPORT_SYMBOL(lprocfs_wr_root_squash);
/*
 * Replace the nosquash NID list of squash with the list written from user
 * space.
 *
 * The input is copied into a kernel buffer of count + 1 bytes.  "NONE" or
 * "clear" (with or without one trailing newline) empties the list; any
 * other input is parsed with cfs_parse_nidlist() into a temporary list
 * that then replaces squash->rsi_nosquash_nids under rsi_lock.
 *
 * NOTE(review): the size limit, some declarations and the return
 * statements are not visible in this excerpt.
 */
2252 int lprocfs_wr_nosquash_nids(const char __user *buffer, unsigned long count,
2253 struct root_squash_info *squash, char *name)
2256 char *kernbuf = NULL;
2263 errmsg = "string too long";
2264 GOTO(failed, rc = -EINVAL);
2267 OBD_ALLOC(kernbuf, count + 1);
2269 errmsg = "no memory";
2270 GOTO(failed, rc = -ENOMEM);
2272 if (copy_from_user(kernbuf, buffer, count)) {
2273 errmsg = "bad address";
2274 GOTO(failed, rc = -EFAULT);
2276 kernbuf[count] = '\0';
/* a single trailing newline is tolerated when matching the keywords */
2278 if (count > 0 && kernbuf[count - 1] == '\n')
2281 if ((len == 4 && strncmp(kernbuf, "NONE", len) == 0) ||
2282 (len == 5 && strncmp(kernbuf, "clear", len) == 0)) {
2283 /* empty string is special case */
2284 spin_lock(&squash->rsi_lock);
2285 if (!list_empty(&squash->rsi_nosquash_nids))
2286 cfs_free_nidlist(&squash->rsi_nosquash_nids);
2287 spin_unlock(&squash->rsi_lock);
2288 LCONSOLE_INFO("%s: nosquash_nids is cleared\n", name);
2289 OBD_FREE(kernbuf, count + 1);
/* parse into the temporary list first; the live list is untouched on error */
2293 if (cfs_parse_nidlist(kernbuf, count, &tmp) <= 0) {
2294 errmsg = "can't parse";
2295 GOTO(failed, rc = -EINVAL);
2297 LCONSOLE_INFO("%s: nosquash_nids set to %s\n",
2299 OBD_FREE(kernbuf, count + 1);
/* swap in the new list: drop the old entries, then splice the parsed ones */
2302 spin_lock(&squash->rsi_lock);
2303 if (!list_empty(&squash->rsi_nosquash_nids))
2304 cfs_free_nidlist(&squash->rsi_nosquash_nids);
2305 list_splice(&tmp, &squash->rsi_nosquash_nids);
2306 spin_unlock(&squash->rsi_lock);
/* error reporting: one message quotes the input, the other does not */
2312 CWARN("%s: failed to set nosquash_nids to \"%s\", %s rc = %d\n",
2313 name, kernbuf, errmsg, rc);
2314 OBD_FREE(kernbuf, count + 1);
2316 CWARN("%s: failed to set nosquash_nids due to %s rc = %d\n",
2321 EXPORT_SYMBOL(lprocfs_wr_nosquash_nids);
2323 #endif /* CONFIG_PROC_FS*/