4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
20 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
21 * CA 95054 USA or visit www.sun.com if you need additional information or
27 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
28 * Use is subject to license terms.
30 * Copyright (c) 2011, 2015, Intel Corporation.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
36 * lustre/osd/osd_lproc.c
38 * Author: Mikhail Pershin <tappro@sun.com>
41 #define DEBUG_SUBSYSTEM S_OSD
43 #include <lprocfs_status.h>
44 #include <lustre/lustre_idl.h>
46 #include "osd_internal.h"
/*
 * Record one bulk I/O, described by @iobuf, in the brw_stats histograms of
 * @osd (osd->od_brw_stats).
 *
 * Three histograms are updated, each indexed as a BRW_R_ slot plus
 * iobuf->dr_rw: pages per I/O (log2 buckets), discontiguous pages and
 * discontiguous blocks.
 *
 * NOTE(review): this listing does not show every original line (braces and
 * the statements guarded by the bare `if` lines are absent); the counter
 * increments presumably live there -- confirm against the full file.
 */
50 void osd_brw_stats_update(struct osd_device *osd, struct osd_iobuf *iobuf)
52 struct brw_stats *s = &osd->od_brw_stats;
53 sector_t *last_block = NULL;
54 struct page **pages = iobuf->dr_pages;
55 struct page *last_page = NULL;
56 unsigned long discont_pages = 0;
57 unsigned long discont_blocks = 0;
58 sector_t *blocks = iobuf->dr_blocks;
59 int i, nr_pages = iobuf->dr_npages;
61 int rw = iobuf->dr_rw;
/* An empty I/O is checked first; the guarded statement is not shown here. */
63 if (unlikely(nr_pages == 0))
/* Blocks per page: PAGE_CACHE_SIZE shifted down by the block-size bits. */
66 blocks_per_page = PAGE_CACHE_SIZE >> osd_sb(osd)->s_blocksize_bits;
68 lprocfs_oh_tally_log2(&s->hist[BRW_R_PAGES+rw], nr_pages);
/* Walk every page of the I/O, and every block within each page. */
70 while (nr_pages-- > 0) {
/* Discontiguity test: this page's index is not the previous index + 1. */
71 if (last_page && (*pages)->index != (last_page->index + 1))
75 for (i = 0; i < blocks_per_page; i++) {
/* Same test for blocks: block number is not the previous block + 1. */
76 if (last_block && *blocks != (*last_block + 1))
/* Remember the block just examined, then advance to the next one. */
78 last_block = blocks++;
82 lprocfs_oh_tally(&s->hist[BRW_R_DISCONT_PAGES+rw], discont_pages);
83 lprocfs_oh_tally(&s->hist[BRW_R_DISCONT_BLOCKS+rw], discont_blocks);
/*
 * pct(a, b): integer percentage of @a relative to @b, or 0 when @b is 0.
 *
 * Every argument is parenthesized so that expression arguments such as
 * pct(x + y, total) expand with the intended precedence. @b is evaluated
 * twice, so do not pass expressions with side effects.
 */
#define pct(a, b) ((b) ? (a) * 100 / (b) : 0)
/*
 * Print one table comparing a read histogram with a write histogram.
 *
 * @seq:   seq_file receiving the output
 * @name, @units: not referenced by the visible lines; presumably they are
 *         the arguments of the column-header seq_printf below, whose
 *         argument line is missing from this listing -- TODO confirm
 * @read, @write: histograms for the two directions
 * @scale: used for row labels; a label is either the raw bucket index or
 *         scale shifted left by the index, with K/M forms that shift by
 *         10 or 20 bits less
 *
 * For each bucket the row holds the count, its percentage of that
 * direction's total and the cumulative percentage.
 */
88 static void display_brw_stats(struct seq_file *seq, char *name, char *units,
89 struct obd_histogram *read, struct obd_histogram *write, int scale)
91 unsigned long read_tot, write_tot, r, w, read_cum = 0, write_cum = 0;
/* Two header lines: direction titles, then column titles. */
94 seq_printf(seq, "\n%26s read | write\n", " ");
95 seq_printf(seq, "%-22s %-5s %% cum %% | %-11s %% cum %%\n",
/* Totals are the denominators for every percentage below. */
98 read_tot = lprocfs_oh_sum(read);
99 write_tot = lprocfs_oh_sum(write);
100 for (i = 0; i < OBD_HIST_MAX; i++) {
101 r = read->oh_buckets[i];
102 w = write->oh_buckets[i];
/* Test for "nothing accumulated yet in either direction" (body not shown). */
105 if (read_cum == 0 && write_cum == 0)
/* Row label: one of these four forms; the selection logic is not shown. */
109 seq_printf(seq, "%u", i);
111 seq_printf(seq, "%u", scale << i);
113 seq_printf(seq, "%uK", scale << (i-10));
115 seq_printf(seq, "%uM", scale << (i-20));
/* Row data: count, percent and cumulative percent for reads, then writes. */
117 seq_printf(seq, ":\t\t%10lu %3lu %3lu | %4lu %3lu %3lu\n",
118 r, pct(r, read_tot), pct(read_cum, read_tot),
119 w, pct(w, write_tot), pct(write_cum, write_tot));
/* Test for "both directions fully accounted for" (body not shown). */
121 if (read_cum == read_tot && write_cum == write_tot)
126 static void brw_stats_show(struct seq_file *seq, struct brw_stats *brw_stats)
130 /* this sampling races with updates */
131 do_gettimeofday(&now);
132 seq_printf(seq, "snapshot_time: %lu.%lu (secs.usecs)\n",
133 now.tv_sec, now.tv_usec);
135 display_brw_stats(seq, "pages per bulk r/w", "rpcs",
136 &brw_stats->hist[BRW_R_PAGES],
137 &brw_stats->hist[BRW_W_PAGES], 1);
139 display_brw_stats(seq, "discontiguous pages", "rpcs",
140 &brw_stats->hist[BRW_R_DISCONT_PAGES],
141 &brw_stats->hist[BRW_W_DISCONT_PAGES], 0);
143 display_brw_stats(seq, "discontiguous blocks", "rpcs",
144 &brw_stats->hist[BRW_R_DISCONT_BLOCKS],
145 &brw_stats->hist[BRW_W_DISCONT_BLOCKS], 0);
147 display_brw_stats(seq, "disk fragmented I/Os", "ios",
148 &brw_stats->hist[BRW_R_DIO_FRAGS],
149 &brw_stats->hist[BRW_W_DIO_FRAGS], 0);
151 display_brw_stats(seq, "disk I/Os in flight", "ios",
152 &brw_stats->hist[BRW_R_RPC_HIST],
153 &brw_stats->hist[BRW_W_RPC_HIST], 0);
155 display_brw_stats(seq, "I/O time (1/1000s)", "ios",
156 &brw_stats->hist[BRW_R_IO_TIME],
157 &brw_stats->hist[BRW_W_IO_TIME],
158 jiffies_to_msecs(1000) / MSEC_PER_SEC);
160 display_brw_stats(seq, "disk I/O size", "ios",
161 &brw_stats->hist[BRW_R_DISK_IOSIZE],
162 &brw_stats->hist[BRW_W_DISK_IOSIZE], 1);
/*
 * seq_file show callback for the brw_stats entry: seq->private carries the
 * osd_device whose od_brw_stats is printed through brw_stats_show().
 * (The return statement is not visible in this listing.)
 */
167 static int osd_brw_stats_seq_show(struct seq_file *seq, void *v)
169 struct osd_device *osd = seq->private;
171 brw_stats_show(seq, &osd->od_brw_stats);
/*
 * seq_file write callback for the brw_stats entry: clears every histogram
 * in osd->od_brw_stats (indices 0 .. BRW_LAST - 1). None of the visible
 * lines reads @buf, so the written content does not appear to matter; the
 * return statement is not shown -- TODO confirm.
 */
176 static ssize_t osd_brw_stats_seq_write(struct file *file,
177 const char __user *buf,
178 size_t len, loff_t *off)
180 struct seq_file *seq = file->private_data;
181 struct osd_device *osd = seq->private;
184 for (i = 0; i < BRW_LAST; i++)
185 lprocfs_oh_clear(&osd->od_brw_stats.hist[i]);
/*
 * Presumably expands to the osd_brw_stats_fops file operations (used by
 * osd_stats_init()) built from the seq_show/seq_write pair above; the macro
 * is defined outside this file -- verify.
 */
190 LPROC_SEQ_FOPS(osd_brw_stats);
/*
 * Set up the statistics of @osd: the histogram locks, the "stats" counter
 * set and the "brw_stats" proc entry.
 *
 * NOTE(review): error handling and the return statement are not visible in
 * this listing.
 */
192 static int osd_stats_init(struct osd_device *osd)
/* Each brw_stats histogram carries its own spinlock. */
197 for (i = 0; i < BRW_LAST; i++)
198 spin_lock_init(&osd->od_brw_stats.hist[i].oh_lock);
/* Counter set sized by LPROC_OSD_LAST, registered as "stats" if allocated. */
200 osd->od_stats = lprocfs_alloc_stats(LPROC_OSD_LAST, 0);
201 if (osd->od_stats != NULL) {
202 result = lprocfs_register_stats(osd->od_proc_entry, "stats",
/* Per-counter setup: counter index, flags, then display name and unit. */
207 lprocfs_counter_init(osd->od_stats, LPROC_OSD_GET_PAGE,
208 LPROCFS_CNTR_AVGMINMAX|LPROCFS_CNTR_STDDEV,
210 lprocfs_counter_init(osd->od_stats, LPROC_OSD_NO_PAGE,
211 LPROCFS_CNTR_AVGMINMAX,
212 "get_page_failures", "num");
213 lprocfs_counter_init(osd->od_stats, LPROC_OSD_CACHE_ACCESS,
214 LPROCFS_CNTR_AVGMINMAX,
215 "cache_access", "pages");
216 lprocfs_counter_init(osd->od_stats, LPROC_OSD_CACHE_HIT,
217 LPROCFS_CNTR_AVGMINMAX,
218 "cache_hit", "pages");
219 lprocfs_counter_init(osd->od_stats, LPROC_OSD_CACHE_MISS,
220 LPROCFS_CNTR_AVGMINMAX,
221 "cache_miss", "pages");
/* thandle timing counters (unit "usec"), only with OSD_THANDLE_STATS. */
222 #if OSD_THANDLE_STATS
223 lprocfs_counter_init(osd->od_stats, LPROC_OSD_THANDLE_STARTING,
224 LPROCFS_CNTR_AVGMINMAX,
225 "thandle starting", "usec");
226 lprocfs_counter_init(osd->od_stats, LPROC_OSD_THANDLE_OPEN,
227 LPROCFS_CNTR_AVGMINMAX,
228 "thandle open", "usec");
229 lprocfs_counter_init(osd->od_stats, LPROC_OSD_THANDLE_CLOSING,
230 LPROCFS_CNTR_AVGMINMAX,
231 "thandle closing", "usec");
/* "brw_stats" is created with mode 0644; @osd is passed as its data. */
233 result = lprocfs_seq_create(osd->od_proc_entry, "brw_stats",
234 0644, &osd_brw_stats_fops, osd);
/*
 * seq_file show callback: always prints the literal "ldiskfs". The
 * osd_device is derived from m->private only to assert it is non-NULL.
 * (The return statement is not visible in this listing.)
 */
242 static int ldiskfs_osd_fstype_seq_show(struct seq_file *m, void *data)
244 struct osd_device *osd = osd_dt_dev((struct dt_device *)m->private);
246 LASSERT(osd != NULL);
247 seq_puts(m, "ldiskfs\n");
/*
 * Presumably defines the read-only ldiskfs_osd_fstype_fops referenced by
 * lprocfs_osd_obd_vars; the macro is defined elsewhere -- verify.
 */
250 LPROC_SEQ_FOPS_RO(ldiskfs_osd_fstype);
/*
 * seq_file show callback: prints osd->od_mntdev followed by a newline.
 * m->private is a dt_device that osd_dt_dev() converts to the osd_device.
 * A NULL od_mnt is tested first; the guarded statement and the return are
 * not visible in this listing.
 */
252 static int ldiskfs_osd_mntdev_seq_show(struct seq_file *m, void *data)
254 struct osd_device *osd = osd_dt_dev((struct dt_device *)m->private);
256 LASSERT(osd != NULL);
257 if (unlikely(osd->od_mnt == NULL))
260 seq_printf(m, "%s\n", osd->od_mntdev);
/*
 * Presumably defines the read-only ldiskfs_osd_mntdev_fops referenced by
 * lprocfs_osd_obd_vars; the macro is defined elsewhere -- verify.
 */
263 LPROC_SEQ_FOPS_RO(ldiskfs_osd_mntdev);
/*
 * seq_file show callback: prints osd->od_read_cache as an unsigned integer.
 * A NULL od_mnt is tested first; the guarded statement and the return are
 * not visible in this listing.
 */
265 static int ldiskfs_osd_cache_seq_show(struct seq_file *m, void *data)
267 struct osd_device *osd = osd_dt_dev((struct dt_device *)m->private);
269 LASSERT(osd != NULL);
270 if (unlikely(osd->od_mnt == NULL))
273 seq_printf(m, "%u\n", osd->od_read_cache);
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer and stores its truth value (!!val) in osd->od_read_cache.
 *
 * NOTE(review): the return-type line, the check of rc after parsing and the
 * return statements are not visible in this listing.
 */
278 ldiskfs_osd_cache_seq_write(struct file *file, const char __user *buffer,
279 size_t count, loff_t *off)
281 struct seq_file *m = file->private_data;
282 struct dt_device *dt = m->private;
283 struct osd_device *osd = osd_dt_dev(dt);
287 LASSERT(osd != NULL);
288 if (unlikely(osd->od_mnt == NULL))
291 rc = lprocfs_str_to_s64(buffer, count, &val);
/* Any non-zero value becomes 1, zero stays 0. */
295 osd->od_read_cache = !!val;
/*
 * Presumably defines ldiskfs_osd_cache_fops, which lprocfs_osd_obd_vars
 * binds to "read_cache_enable"; the macro is defined elsewhere -- verify.
 */
298 LPROC_SEQ_FOPS(ldiskfs_osd_cache);
/*
 * seq_file show callback: prints osd->od_writethrough_cache as an unsigned
 * integer. A NULL od_mnt is tested first; the guarded statement and the
 * return are not visible in this listing.
 */
300 static int ldiskfs_osd_wcache_seq_show(struct seq_file *m, void *data)
302 struct osd_device *osd = osd_dt_dev((struct dt_device *)m->private);
304 LASSERT(osd != NULL);
305 if (unlikely(osd->od_mnt == NULL))
308 seq_printf(m, "%u\n", osd->od_writethrough_cache);
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer and stores its truth value (!!val) in
 * osd->od_writethrough_cache.
 *
 * NOTE(review): the return-type line, the check of rc after parsing and the
 * return statements are not visible in this listing.
 */
313 ldiskfs_osd_wcache_seq_write(struct file *file, const char __user *buffer,
314 size_t count, loff_t *off)
316 struct seq_file *m = file->private_data;
317 struct dt_device *dt = m->private;
318 struct osd_device *osd = osd_dt_dev(dt);
322 LASSERT(osd != NULL);
323 if (unlikely(osd->od_mnt == NULL))
326 rc = lprocfs_str_to_s64(buffer, count, &val);
/* Any non-zero value becomes 1, zero stays 0. */
330 osd->od_writethrough_cache = !!val;
/*
 * Presumably defines ldiskfs_osd_wcache_fops, which lprocfs_osd_obd_vars
 * binds to "writethrough_cache_enable"; macro defined elsewhere -- verify.
 */
333 LPROC_SEQ_FOPS(ldiskfs_osd_wcache);
/*
 * Write callback backing force_sync: initializes a local lu_env with
 * LCT_LOCAL and calls dt_sync() on the device. Returns @count when rc is
 * 0, otherwise rc. The visible lines never read @buffer, so the written
 * content does not appear to matter.
 *
 * NOTE(review): the return-type line, the handling of a failed
 * lu_env_init() and any teardown of env are not visible in this listing --
 * confirm against the full file.
 */
336 lprocfs_osd_force_sync_seq_write(struct file *file, const char __user *buffer,
337 size_t count, loff_t *off)
339 struct seq_file *m = file->private_data;
340 struct dt_device *dt = m->private;
341 struct osd_device *osd = osd_dt_dev(dt);
345 LASSERT(osd != NULL);
346 if (unlikely(osd->od_mnt == NULL))
349 rc = lu_env_init(&env, LCT_LOCAL);
352 rc = dt_sync(&env, dt);
355 return rc == 0 ? count : rc;
/*
 * Presumably defines the write-only ldiskfs_osd_force_sync_fops (bound to
 * "force_sync" in lprocfs_osd_obd_vars) around the lprocfs_-prefixed
 * function above; the macro is defined elsewhere -- verify.
 */
357 LPROC_SEQ_FOPS_WO_TYPE(ldiskfs, osd_force_sync);
/*
 * seq_file show callback: prints "ON" when ldiskfs_pdo is non-zero and
 * "OFF" otherwise. (The return statement is not visible in this listing.)
 */
359 static int ldiskfs_osd_pdo_seq_show(struct seq_file *m, void *data)
361 seq_printf(m, "%s\n", ldiskfs_pdo ? "ON" : "OFF");
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer into pdo.
 *
 * NOTE(review): the return-type line, the declarations, the check of rc and
 * what is done with the parsed value (presumably an update of ldiskfs_pdo)
 * are not visible in this listing -- confirm.
 */
366 ldiskfs_osd_pdo_seq_write(struct file *file, const char __user *buffer,
367 size_t count, loff_t *off)
372 rc = lprocfs_str_to_s64(buffer, count, &pdo);
/*
 * Presumably defines the ldiskfs_osd_pdo_fops referenced by
 * lprocfs_osd_obd_vars; the macro is defined elsewhere -- verify.
 */
380 LPROC_SEQ_FOPS(ldiskfs_osd_pdo);
/*
 * seq_file show callback: prints the logical negation of dev->od_noscrub,
 * i.e. 1 when od_noscrub is zero and 0 otherwise. A NULL od_mnt is tested
 * first; the guarded statement and the return are not visible here.
 */
382 static int ldiskfs_osd_auto_scrub_seq_show(struct seq_file *m, void *data)
384 struct osd_device *dev = osd_dt_dev((struct dt_device *)m->private);
386 LASSERT(dev != NULL);
387 if (unlikely(dev->od_mnt == NULL))
390 seq_printf(m, "%d\n", !dev->od_noscrub);
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer and stores its negation in dev->od_noscrub, so writing 0 sets
 * od_noscrub and writing any non-zero value clears it.
 *
 * NOTE(review): the return-type line, the check of rc after parsing and the
 * return statements are not visible in this listing.
 */
395 ldiskfs_osd_auto_scrub_seq_write(struct file *file, const char __user *buffer,
396 size_t count, loff_t *off)
398 struct seq_file *m = file->private_data;
399 struct dt_device *dt = m->private;
400 struct osd_device *dev = osd_dt_dev(dt);
404 LASSERT(dev != NULL);
405 if (unlikely(dev->od_mnt == NULL))
408 rc = lprocfs_str_to_s64(buffer, count, &val);
/* The stored flag has the opposite sense of the value written. */
412 dev->od_noscrub = !val;
/*
 * Presumably defines ldiskfs_osd_auto_scrub_fops, which
 * lprocfs_osd_obd_vars binds to "auto_scrub"; macro defined elsewhere --
 * verify.
 */
415 LPROC_SEQ_FOPS(ldiskfs_osd_auto_scrub);
/*
 * seq_file show callback: prints dev->od_full_scrub_ratio with the LPU64
 * format. A NULL od_mnt is tested first; the guarded statement and the
 * return are not visible in this listing.
 */
417 static int ldiskfs_osd_full_scrub_ratio_seq_show(struct seq_file *m, void *data)
419 struct osd_device *dev = osd_dt_dev((struct dt_device *)m->private);
421 LASSERT(dev != NULL);
422 if (unlikely(dev->od_mnt == NULL))
425 seq_printf(m, LPU64"\n", dev->od_full_scrub_ratio);
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer and stores it in dev->od_full_scrub_ratio.
 *
 * NOTE(review): several original lines between the parse and the
 * assignment are missing from this listing (presumably rc and range
 * checks), as are the return-type line and return statements -- confirm.
 */
430 ldiskfs_osd_full_scrub_ratio_seq_write(struct file *file,
431 const char __user *buffer,
432 size_t count, loff_t *off)
434 struct seq_file *m = file->private_data;
435 struct dt_device *dt = m->private;
436 struct osd_device *dev = osd_dt_dev(dt);
440 LASSERT(dev != NULL);
441 if (unlikely(dev->od_mnt == NULL))
444 rc = lprocfs_str_to_s64(buffer, count, &val);
451 dev->od_full_scrub_ratio = val;
/*
 * Presumably defines ldiskfs_osd_full_scrub_ratio_fops, which
 * lprocfs_osd_obd_vars binds to "full_scrub_ratio"; macro defined
 * elsewhere -- verify.
 */
454 LPROC_SEQ_FOPS(ldiskfs_osd_full_scrub_ratio);
/*
 * seq_file show callback: prints dev->od_full_scrub_threshold_rate followed
 * by the text " (bad OI mappings/minute)". A NULL od_mnt is tested first;
 * the guarded statement, the second parameter line and the return are not
 * visible in this listing.
 */
456 static int ldiskfs_osd_full_scrub_threshold_rate_seq_show(struct seq_file *m,
459 struct osd_device *dev = osd_dt_dev((struct dt_device *)m->private);
461 LASSERT(dev != NULL);
462 if (unlikely(dev->od_mnt == NULL))
465 seq_printf(m, LPU64" (bad OI mappings/minute)\n",
466 dev->od_full_scrub_threshold_rate);
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer and stores it in dev->od_full_scrub_threshold_rate.
 *
 * NOTE(review): several original lines between the parse and the
 * assignment are missing from this listing (presumably rc and range
 * checks), as are the return-type line and return statements -- confirm.
 */
471 ldiskfs_osd_full_scrub_threshold_rate_seq_write(struct file *file,
472 const char __user *buffer,
473 size_t count, loff_t *off)
475 struct seq_file *m = file->private_data;
476 struct dt_device *dt = m->private;
477 struct osd_device *dev = osd_dt_dev(dt);
481 LASSERT(dev != NULL);
482 if (unlikely(dev->od_mnt == NULL))
485 rc = lprocfs_str_to_s64(buffer, count, &val);
492 dev->od_full_scrub_threshold_rate = val;
/*
 * Presumably defines ldiskfs_osd_full_scrub_threshold_rate_fops, which
 * lprocfs_osd_obd_vars binds to "full_scrub_threshold_rate"; macro defined
 * elsewhere -- verify.
 */
495 LPROC_SEQ_FOPS(ldiskfs_osd_full_scrub_threshold_rate);
/*
 * seq_file show callback: prints the value of ldiskfs_track_declares_assert
 * as a decimal integer. (The return-type line and the return statement are
 * not visible in this listing.)
 */
498 ldiskfs_osd_track_declares_assert_seq_show(struct seq_file *m, void *data)
500 seq_printf(m, "%d\n", ldiskfs_track_declares_assert);
/*
 * seq_file write callback: parses the user buffer as a signed 64-bit
 * integer and stores its truth value in ldiskfs_track_declares_assert.
 *
 * NOTE(review): the return-type line, the check of rc after parsing and the
 * return statements are not visible in this listing.
 */
505 ldiskfs_osd_track_declares_assert_seq_write(struct file *file,
506 const char __user *buffer,
507 size_t count, loff_t *off)
509 __s64 track_declares_assert;
512 rc = lprocfs_str_to_s64(buffer, count, &track_declares_assert);
/* Any non-zero value becomes 1, zero stays 0. */
516 ldiskfs_track_declares_assert = !!track_declares_assert;
/*
 * Presumably defines ldiskfs_osd_track_declares_assert_fops, which
 * lprocfs_osd_module_vars binds to "track_declares_assert"; macro defined
 * elsewhere -- verify.
 */
520 LPROC_SEQ_FOPS(ldiskfs_osd_track_declares_assert);
/*
 * seq_file show callback: delegates to osd_scrub_dump() for the device and
 * returns its result. A NULL od_mnt is tested first; the guarded statement
 * is not visible in this listing.
 */
522 static int ldiskfs_osd_oi_scrub_seq_show(struct seq_file *m, void *data)
524 struct osd_device *dev = osd_dt_dev((struct dt_device *)m->private);
526 LASSERT(dev != NULL);
527 if (unlikely(dev->od_mnt == NULL))
530 return osd_scrub_dump(m, dev);
/*
 * Presumably defines the read-only ldiskfs_osd_oi_scrub_fops, which
 * lprocfs_osd_obd_vars binds to "oi_scrub"; macro defined elsewhere --
 * verify.
 */
532 LPROC_SEQ_FOPS_RO(ldiskfs_osd_oi_scrub);
/*
 * seq_file show callback: prints osd->od_readcache_max_filesize with the
 * LPU64 format. A NULL od_mnt is tested first; the guarded statement and
 * the return are not visible in this listing.
 */
534 static int ldiskfs_osd_readcache_seq_show(struct seq_file *m, void *data)
536 struct osd_device *osd = osd_dt_dev((struct dt_device *)m->private);
538 LASSERT(osd != NULL);
539 if (unlikely(osd->od_mnt == NULL))
542 seq_printf(m, LPU64"\n", osd->od_readcache_max_filesize);
/*
 * seq_file write callback: parses the user buffer with
 * lprocfs_str_with_units_to_s64() and stores the result in
 * osd->od_readcache_max_filesize, capped at OSD_MAX_CACHE_SIZE.
 *
 * NOTE(review): lines between the parse and the assignment are missing from
 * this listing (presumably the rc check and handling of negative input), as
 * are the return-type line and return statements -- confirm.
 */
547 ldiskfs_osd_readcache_seq_write(struct file *file, const char __user *buffer,
548 size_t count, loff_t *off)
550 struct seq_file *m = file->private_data;
551 struct dt_device *dt = m->private;
552 struct osd_device *osd = osd_dt_dev(dt);
556 LASSERT(osd != NULL);
557 if (unlikely(osd->od_mnt == NULL))
/* '1' is presumably the default unit used when no suffix is given -- verify. */
560 rc = lprocfs_str_with_units_to_s64(buffer, count, &val, '1');
/* Values above OSD_MAX_CACHE_SIZE are clamped to it. */
566 osd->od_readcache_max_filesize = val > OSD_MAX_CACHE_SIZE ?
567 OSD_MAX_CACHE_SIZE : val;
/*
 * Presumably defines ldiskfs_osd_readcache_fops, which lprocfs_osd_obd_vars
 * binds to "readcache_max_filesize"; macro defined elsewhere -- verify.
 */
570 LPROC_SEQ_FOPS(ldiskfs_osd_readcache);
/*
 * The index_in_idif code that follows is compiled only while
 * LUSTRE_VERSION_CODE is below OBD_OCD_VERSION(3, 0, 52, 0). The matching
 * end of this conditional is not visible in this listing.
 */
572 #if LUSTRE_VERSION_CODE < OBD_OCD_VERSION(3, 0, 52, 0)
/*
 * seq_file show callback: prints dev->od_index_in_idif cast to int. A NULL
 * od_mnt is tested first; the guarded statement and the return are not
 * visible in this listing.
 */
573 static int ldiskfs_osd_index_in_idif_seq_show(struct seq_file *m, void *data)
575 struct osd_device *dev = osd_dt_dev((struct dt_device *)m->private);
577 LASSERT(dev != NULL);
578 if (unlikely(dev->od_mnt == NULL))
581 seq_printf(m, "%d\n", (int)(dev->od_index_in_idif));
/*
 * seq_file write callback for the "OST-index in IDIF" switch.
 *
 * Visible steps: parse the user buffer as a signed 64-bit integer; inside
 * the branch taken when od_index_in_idif is already set, a console warning
 * states the feature cannot be reverted; otherwise a lu_env is initialized
 * with LCT_DT_THREAD, OBD_ROCOMPAT_IDX_IN_IDIF is OR-ed into the target's
 * lsd_feature_rocompat, tgt_server_data_update() is called (presumably to
 * persist it), a console message is emitted and od_index_in_idif is set
 * to 1.
 *
 * NOTE(review): the return-type line, all rc checks, the exact conditions
 * around the warning, env teardown and the return statements are not
 * visible in this listing -- confirm against the full file.
 */
586 ldiskfs_osd_index_in_idif_seq_write(struct file *file,
587 const char __user *buffer,
588 size_t count, loff_t *off)
591 struct seq_file *m = file->private_data;
592 struct dt_device *dt = m->private;
593 struct osd_device *dev = osd_dt_dev(dt);
594 struct lu_target *tgt;
598 LASSERT(dev != NULL);
599 if (unlikely(dev->od_mnt == NULL))
602 rc = lprocfs_str_to_s64(buffer, count, &val);
/* Already enabled: the messages below say this setting is one-way. */
606 if (dev->od_index_in_idif) {
610 LCONSOLE_WARN("%s: OST-index in IDIF has been enabled, "
611 "it cannot be reverted back.\n", osd_name(dev));
618 rc = lu_env_init(&env, LCT_DT_THREAD);
/* The target is reached through the device's lu_site (ls_tgt). */
622 tgt = dev->od_dt_dev.dd_lu_dev.ld_site->ls_tgt;
623 tgt->lut_lsd.lsd_feature_rocompat |= OBD_ROCOMPAT_IDX_IN_IDIF;
624 rc = tgt_server_data_update(&env, tgt, 1);
629 LCONSOLE_INFO("%s: enable OST-index in IDIF successfully, "
630 "it cannot be reverted back.\n", osd_name(dev));
632 dev->od_index_in_idif = 1;
/*
 * Presumably defines ldiskfs_osd_index_in_idif_fops, used by
 * osd_register_proc_index_in_idif(); macro defined elsewhere -- verify.
 */
635 LPROC_SEQ_FOPS(ldiskfs_osd_index_in_idif);
/*
 * Create the "index_in_idif" proc entry under osd->od_proc_entry, using
 * ldiskfs_osd_index_in_idif_fops. The mode argument passed to
 * proc_create_data() is 0.
 *
 * NOTE(review): the last argument of the call, the check of its result and
 * the return statement are not visible in this listing.
 */
637 int osd_register_proc_index_in_idif(struct osd_device *osd)
639 struct proc_dir_entry *proc;
641 proc = proc_create_data("index_in_idif", 0, osd->od_proc_entry,
642 &ldiskfs_osd_index_in_idif_fops,
/*
 * Read-only file operations for the generic dt_device statistics. Each
 * line presumably defines the ldiskfs_dt_..._fops object of the same name
 * that lprocfs_osd_obd_vars references, backed by a show routine defined
 * outside this file -- verify against the macro definition.
 */
651 LPROC_SEQ_FOPS_RO_TYPE(ldiskfs, dt_blksize);
652 LPROC_SEQ_FOPS_RO_TYPE(ldiskfs, dt_kbytestotal);
653 LPROC_SEQ_FOPS_RO_TYPE(ldiskfs, dt_kbytesfree);
654 LPROC_SEQ_FOPS_RO_TYPE(ldiskfs, dt_kbytesavail);
655 LPROC_SEQ_FOPS_RO_TYPE(ldiskfs, dt_filestotal);
656 LPROC_SEQ_FOPS_RO_TYPE(ldiskfs, dt_filesfree);
/*
 * Per-device proc entries: each element pairs an entry name with the file
 * operations that serve it. osd_procfs_init() passes this table to
 * lprocfs_register().
 *
 * NOTE(review): three elements below (fstype, mntdev and pdo fops) show
 * only their .fops line, and the end of the array is not visible; the
 * missing .name lines are absent from this listing, not from the code --
 * confirm against the full file.
 */
658 struct lprocfs_vars lprocfs_osd_obd_vars[] = {
659 { .name = "blocksize",
660 .fops = &ldiskfs_dt_blksize_fops },
661 { .name = "kbytestotal",
662 .fops = &ldiskfs_dt_kbytestotal_fops },
663 { .name = "kbytesfree",
664 .fops = &ldiskfs_dt_kbytesfree_fops },
665 { .name = "kbytesavail",
666 .fops = &ldiskfs_dt_kbytesavail_fops },
667 { .name = "filestotal",
668 .fops = &ldiskfs_dt_filestotal_fops },
669 { .name = "filesfree",
670 .fops = &ldiskfs_dt_filesfree_fops },
672 .fops = &ldiskfs_osd_fstype_fops },
674 .fops = &ldiskfs_osd_mntdev_fops },
675 { .name = "force_sync",
676 .fops = &ldiskfs_osd_force_sync_fops },
678 .fops = &ldiskfs_osd_pdo_fops },
679 { .name = "auto_scrub",
680 .fops = &ldiskfs_osd_auto_scrub_fops },
681 { .name = "full_scrub_ratio",
682 .fops = &ldiskfs_osd_full_scrub_ratio_fops },
683 { .name = "full_scrub_threshold_rate",
684 .fops = &ldiskfs_osd_full_scrub_threshold_rate_fops },
685 { .name = "oi_scrub",
686 .fops = &ldiskfs_osd_oi_scrub_fops },
687 { .name = "read_cache_enable",
688 .fops = &ldiskfs_osd_cache_fops },
689 { .name = "writethrough_cache_enable",
690 .fops = &ldiskfs_osd_wcache_fops },
691 { .name = "readcache_max_filesize",
692 .fops = &ldiskfs_osd_readcache_fops },
/*
 * Proc entries that are not tied to a single device (judging by the table
 * name, module-wide -- where it is registered is not visible in this
 * file). The only visible element binds "track_declares_assert" to its
 * file operations; the end of the array is not shown in this listing.
 */
696 struct lprocfs_vars lprocfs_osd_module_vars[] = {
697 { .name = "track_declares_assert",
698 .fops = &ldiskfs_osd_track_declares_assert_fops },
/*
 * Create the proc directory and the statistics entries for @osd.
 *
 * @osd:  device to set up; osd->od_proc_entry receives the new directory
 * @name: name of the directory, asserted to be non-NULL
 *
 * The directory is registered under the procroot of the obd_type found for
 * LUSTRE_OSD_LDISKFS_NAME and populated from lprocfs_osd_obd_vars; then
 * osd_stats_init() adds the statistics. osd_procfs_fini() is called from
 * this function as well, presumably on the failure path.
 *
 * NOTE(review): the statement guarded by the od_proc_entry test, the
 * conditions around the cleanup call and the return statements are not
 * visible in this listing -- confirm against the full file.
 */
703 int osd_procfs_init(struct osd_device *osd, const char *name)
705 struct obd_type *type;
/* An already-set od_proc_entry is special-cased (guarded line not shown). */
709 if (osd->od_proc_entry)
712 /* at the moment there is no linkage between lu_type
713 * and obd_type, so we lookup obd_type this way */
714 type = class_search_type(LUSTRE_OSD_LDISKFS_NAME);
716 LASSERT(name != NULL);
717 LASSERT(type != NULL);
719 /* Find the type procroot and add the proc entry for this device */
720 osd->od_proc_entry = lprocfs_register(name, type->typ_procroot,
721 lprocfs_osd_obd_vars,
/* On failure: keep the error code, log it and reset the pointer to NULL. */
723 if (IS_ERR(osd->od_proc_entry)) {
724 rc = PTR_ERR(osd->od_proc_entry);
725 CERROR("Error %d setting up lprocfs for %s\n",
727 osd->od_proc_entry = NULL;
731 rc = osd_stats_init(osd);
736 osd_procfs_fini(osd);
/*
 * Tear down what osd_procfs_init() created for @osd: free the od_stats
 * counter set (only the call is visible; any condition on it is not) and
 * remove the proc directory when od_proc_entry is set. Both helpers
 * receive the address of the field, presumably so they can reset it --
 * verify.
 * (The return statement is not visible in this listing.)
 */
740 int osd_procfs_fini(struct osd_device *osd)
743 lprocfs_free_stats(&osd->od_stats);
745 if (osd->od_proc_entry)
746 lprocfs_remove(&osd->od_proc_entry);