4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.gnu.org/licenses/gpl-2.0.html
23 * Copyright (c) 2008, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2012, 2017, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
31 * lustre/osd-zfs/osd_lproc.c
33 * Author: Alex Zhuravlev <bzzz@whamcloud.com>
34 * Author: Mike Pershin <tappro@whamcloud.com>
37 #define DEBUG_SUBSYSTEM S_OSD
40 #include <obd_class.h>
41 #include <lprocfs_status.h>
42 #include <lustre_scrub.h>
44 #include "osd_internal.h"
/*
 * Print one read/write histogram pair into @seq as a table.
 *
 * @seq:   seq_file receiving the output
 * @name:  title printed in the first column of the header row
 * @units: unit label for the count columns (its use is on a header
 *         continuation line not shown here)
 * @read:  histogram whose buckets fill the "read" columns
 * @write: histogram whose buckets fill the "write" columns
 * @scale: value shifted by the bucket index to build the row label
 *
 * Each row shows the bucket count, that count as a percentage of the
 * histogram total, and the cumulative percentage, for both histograms.
 */
48 static void display_brw_stats(struct seq_file *seq, char *name, char *units,
49 struct obd_histogram *read,
50 struct obd_histogram *write, int scale)
52 unsigned long read_tot, write_tot, r, w, read_cum = 0, write_cum = 0;
/* Two header rows: the read/write banner, then the column titles. */
55 seq_printf(seq, "\n%26s read | write\n", " ");
56 seq_printf(seq, "%-22s %-5s %% cum %% | %-11s %% cum %%\n",
/* The totals are the denominators of every percentage column below. */
59 read_tot = lprocfs_oh_sum(read);
60 write_tot = lprocfs_oh_sum(write);
61 for (i = 0; i < OBD_HIST_MAX; i++) {
62 r = read->oh_buckets[i];
63 w = write->oh_buckets[i];
/* True while neither histogram has recorded anything up to this bucket. */
66 if (read_cum == 0 && write_cum == 0)
/*
 * Row label variants: the bare bucket index, scale << i, or the same
 * value reduced by 2^10 ("K") or 2^20 ("M").
 */
70 seq_printf(seq, "%u", i);
72 seq_printf(seq, "%u", scale << i);
74 seq_printf(seq, "%uK", scale << (i-10));
76 seq_printf(seq, "%uM", scale << (i-20));
/* count, percent of total, cumulative percent -- read side then write side */
78 seq_printf(seq, ":\t\t%10lu %3u %3u | %4lu %3u %3u\n",
79 r, pct(r, read_tot), pct(read_cum, read_tot),
80 w, pct(w, write_tot), pct(write_cum, write_tot));
/* True once both cumulative counts have reached their totals. */
82 if (read_cum == read_tot && write_cum == write_tot)
/*
 * Write the common stats header followed by every bulk read/write histogram
 * pair stored in @brw_stats->bs_hist[] to @seq.
 *
 * The final argument of each display_brw_stats() call is its "scale"
 * parameter: 1 for pages per bulk, I/O time and disk I/O size, 0 for the
 * remaining tables.
 */
87 static void brw_stats_show(struct seq_file *seq, struct brw_stats *brw_stats)
89 /* this sampling races with updates */
90 lprocfs_stats_header(seq, ktime_get(), brw_stats->bs_init, 25, ":", 1);
92 display_brw_stats(seq, "pages per bulk r/w", "rpcs",
93 &brw_stats->bs_hist[BRW_R_PAGES],
94 &brw_stats->bs_hist[BRW_W_PAGES], 1);
96 display_brw_stats(seq, "discontiguous pages", "rpcs",
97 &brw_stats->bs_hist[BRW_R_DISCONT_PAGES],
98 &brw_stats->bs_hist[BRW_W_DISCONT_PAGES], 0);
100 display_brw_stats(seq, "discontiguous blocks", "rpcs",
101 &brw_stats->bs_hist[BRW_R_DISCONT_BLOCKS],
102 &brw_stats->bs_hist[BRW_W_DISCONT_BLOCKS], 0);
104 display_brw_stats(seq, "disk fragmented I/Os", "ios",
105 &brw_stats->bs_hist[BRW_R_DIO_FRAGS],
106 &brw_stats->bs_hist[BRW_W_DIO_FRAGS], 0);
108 display_brw_stats(seq, "disk I/Os in flight", "ios",
109 &brw_stats->bs_hist[BRW_R_RPC_HIST],
110 &brw_stats->bs_hist[BRW_W_RPC_HIST], 0);
112 display_brw_stats(seq, "I/O time (1/1000s)", "ios",
113 &brw_stats->bs_hist[BRW_R_IO_TIME],
114 &brw_stats->bs_hist[BRW_W_IO_TIME], 1);
116 display_brw_stats(seq, "disk I/O size", "ios",
117 &brw_stats->bs_hist[BRW_R_DISK_IOSIZE],
118 &brw_stats->bs_hist[BRW_W_DISK_IOSIZE], 1);
/*
 * seq_file show handler: seq->private is the osd_device whose od_brw_stats
 * histograms are printed by brw_stats_show().
 */
121 static int osd_brw_stats_seq_show(struct seq_file *seq, void *v)
123 struct osd_device *osd = seq->private;
125 brw_stats_show(seq, &osd->od_brw_stats);
/*
 * seq_file write handler: clears all BRW_LAST histograms of the osd_device
 * found through file->private_data. The visible code never reads @buf, so
 * the written data appears to be ignored.
 *
 * NOTE(review): only the histogram buckets are cleared here; bs_init, which
 * brw_stats_show() passes to lprocfs_stats_header(), is left untouched --
 * confirm that is intended.
 */
130 static ssize_t osd_brw_stats_seq_write(struct file *file,
131 const char __user *buf,
132 size_t len, loff_t *off)
134 struct seq_file *seq = file->private_data;
135 struct osd_device *osd = seq->private;
138 for (i = 0; i < BRW_LAST; i++)
139 lprocfs_oh_clear(&osd->od_brw_stats.bs_hist[i]);
/* Generates osd_brw_stats_fops, which osd_stats_init() registers. */
144 LPROC_SEQ_FOPS(osd_brw_stats);
/*
 * Set up the statistics of @osd: initialise the per-histogram spinlocks,
 * allocate the counter set, register it as "stats" under osd->od_proc_entry,
 * initialise the individual counters, and create the "brw_stats" file.
 *
 * The counter setup and the "brw_stats" creation only run when
 * lprocfs_alloc_stats() returned a non-NULL pointer.
 */
146 static int osd_stats_init(struct osd_device *osd)
/* Every bulk I/O histogram has its own oh_lock. */
151 for (i = 0; i < BRW_LAST; i++)
152 spin_lock_init(&osd->od_brw_stats.bs_hist[i].oh_lock);
/* Sized by LPROC_OSD_LAST -- presumably one slot per LPROC_OSD_* index. */
154 osd->od_stats = lprocfs_alloc_stats(LPROC_OSD_LAST, 0);
155 if (osd->od_stats != NULL) {
156 result = lprocfs_register_stats(osd->od_proc_entry, "stats",
/* get_page is the only counter that also requests LPROCFS_CNTR_STDDEV. */
161 lprocfs_counter_init(osd->od_stats, LPROC_OSD_GET_PAGE,
162 LPROCFS_CNTR_AVGMINMAX|LPROCFS_CNTR_STDDEV,
164 lprocfs_counter_init(osd->od_stats, LPROC_OSD_NO_PAGE,
165 LPROCFS_CNTR_AVGMINMAX,
166 "get_page_failures", "num");
167 lprocfs_counter_init(osd->od_stats, LPROC_OSD_CACHE_ACCESS,
168 LPROCFS_CNTR_AVGMINMAX,
169 "cache_access", "pages");
170 lprocfs_counter_init(osd->od_stats, LPROC_OSD_CACHE_HIT,
171 LPROCFS_CNTR_AVGMINMAX,
172 "cache_hit", "pages");
173 lprocfs_counter_init(osd->od_stats, LPROC_OSD_CACHE_MISS,
174 LPROCFS_CNTR_AVGMINMAX,
175 "cache_miss", "pages");
176 lprocfs_counter_init(osd->od_stats, LPROC_OSD_COPY_IO,
177 LPROCFS_CNTR_AVGMINMAX,
179 lprocfs_counter_init(osd->od_stats, LPROC_OSD_ZEROCOPY_IO,
180 LPROCFS_CNTR_AVGMINMAX,
181 "zerocopy", "pages");
182 lprocfs_counter_init(osd->od_stats, LPROC_OSD_TAIL_IO,
183 LPROCFS_CNTR_AVGMINMAX,
/* The transaction-handle timing counters need OSD_THANDLE_STATS. */
185 #ifdef OSD_THANDLE_STATS
186 lprocfs_counter_init(osd->od_stats, LPROC_OSD_THANDLE_STARTING,
187 LPROCFS_CNTR_AVGMINMAX,
188 "thandle_starting", "usec");
189 lprocfs_counter_init(osd->od_stats, LPROC_OSD_THANDLE_OPEN,
190 LPROCFS_CNTR_AVGMINMAX,
191 "thandle_open", "usec");
192 lprocfs_counter_init(osd->od_stats, LPROC_OSD_THANDLE_CLOSING,
193 LPROCFS_CNTR_AVGMINMAX,
194 "thandle_closing", "usec");
/* Mode 0644: the file has a write handler (it clears the histograms). */
196 result = lprocfs_seq_create(osd->od_proc_entry, "brw_stats",
197 0644, &osd_brw_stats_fops, osd);
/*
 * seq_file show handler for the "oi_scrub" entry: m->private is the
 * dt_device; its osd_device's od_scrub state is written out by scrub_dump().
 */
206 static int zfs_osd_oi_scrub_seq_show(struct seq_file *m, void *data)
208 struct osd_device *dev = osd_dt_dev((struct dt_device *)m->private);
210 LASSERT(dev != NULL);
214 scrub_dump(m, &dev->od_scrub);
/* Read-only fops; referenced as zfs_osd_oi_scrub_fops in the vars table. */
217 LDEBUGFS_SEQ_FOPS_RO(zfs_osd_oi_scrub);
/*
 * sysfs show handler for "auto_scrub": prints od_scrub.os_auto_scrub_interval
 * as a signed decimal followed by a newline.
 *
 * The osd_device is recovered from @kobj through the embedding dt_device.
 * Output is bounded to PAGE_SIZE by scnprintf().
 */
219 static ssize_t auto_scrub_show(struct kobject *kobj, struct attribute *attr,
222 struct dt_device *dt = container_of(kobj, struct dt_device,
224 struct osd_device *dev = osd_dt_dev(dt);
230 return scnprintf(buf, PAGE_SIZE, "%lld\n",
231 dev->od_scrub.os_auto_scrub_interval);
/*
 * sysfs store handler for "auto_scrub": parses @buffer as an integer
 * (base 0, so the base is taken from the input's prefix) and stores it in
 * od_scrub.os_auto_scrub_interval.
 *
 * NOTE(review): the value is parsed with the unsigned kstrtoull(), while
 * auto_scrub_show() prints the same field with the signed "%lld" -- confirm
 * the declared type of val and whether kstrtoll() is what is wanted.
 */
234 static ssize_t auto_scrub_store(struct kobject *kobj, struct attribute *attr,
235 const char *buffer, size_t count)
237 struct dt_device *dt = container_of(kobj, struct dt_device,
239 struct osd_device *dev = osd_dt_dev(dt);
247 rc = kstrtoull(buffer, 0, &val);
251 dev->od_scrub.os_auto_scrub_interval = val;
/* Defines lustre_attr_auto_scrub, which is listed in zfs_attrs[]. */
254 LUSTRE_RW_ATTR(auto_scrub);
256 static ssize_t fstype_show(struct kobject *kobj, struct attribute *attr,
259 return sprintf(buf, "zfs\n");
261 LUSTRE_RO_ATTR(fstype);
263 static ssize_t mntdev_show(struct kobject *kobj, struct attribute *attr,
266 struct dt_device *dt = container_of(kobj, struct dt_device,
268 struct osd_device *osd = osd_dt_dev(dt);
272 return sprintf(buf, "%s\n", osd->od_mntdev);
274 LUSTRE_RO_ATTR(mntdev);
/*
 * sysfs store handler for "force_sync": any write triggers dt_sync() on the
 * dt_device embedding @kobj. The visible code never reads @buffer.
 *
 * A local lu_env is initialised with LCT_LOCAL for the call. Returns @count
 * when dt_sync() returned 0, otherwise the dt_sync() result.
 *
 * NOTE(review): unlike most sibling handlers this function is not declared
 * static -- confirm whether anything outside this file needs the symbol.
 */
276 ssize_t force_sync_store(struct kobject *kobj, struct attribute *attr,
277 const char *buffer, size_t count)
279 struct dt_device *dt = container_of(kobj, struct dt_device,
284 rc = lu_env_init(&env, LCT_LOCAL);
288 rc = dt_sync(&env, dt);
291 return rc == 0 ? count : rc;
/* Write-only attribute: no matching force_sync_show() exists. */
293 LUSTRE_WO_ATTR(force_sync);
295 static ssize_t sync_on_lseek_show(struct kobject *kobj, struct attribute *attr,
298 struct dt_device *dt = container_of(kobj, struct dt_device, dd_kobj);
299 struct osd_device *osd = osd_dt_dev(dt);
304 return sprintf(buf, "%u\n", osd->od_sync_on_lseek);
/*
 * sysfs store handler for "sync_on_lseek": parses @buffer with kstrtobool()
 * and stores the result, normalised with !!, in osd->od_sync_on_lseek.
 *
 * NOTE(review): unlike sync_on_lseek_show() this function is not declared
 * static -- confirm whether anything outside this file needs the symbol.
 */
307 ssize_t sync_on_lseek_store(struct kobject *kobj, struct attribute *attr,
308 const char *buffer, size_t count)
310 struct dt_device *dt = container_of(kobj, struct dt_device, dd_kobj);
311 struct osd_device *osd = osd_dt_dev(dt);
318 rc = kstrtobool(buffer, &val);
322 osd->od_sync_on_lseek = !!val;
/* Defines lustre_attr_sync_on_lseek, which is listed in zfs_attrs[]. */
326 LUSTRE_RW_ATTR(sync_on_lseek);
328 static ssize_t nonrotational_show(struct kobject *kobj, struct attribute *attr,
331 struct dt_device *dt = container_of(kobj, struct dt_device,
333 struct osd_device *osd = osd_dt_dev(dt);
339 return sprintf(buf, "%u\n", osd->od_nonrotational);
/*
 * sysfs store handler for "nonrotational": parses @buffer with kstrtobool()
 * and stores the result in osd->od_nonrotational.
 */
342 static ssize_t nonrotational_store(struct kobject *kobj,
343 struct attribute *attr, const char *buffer,
346 struct dt_device *dt = container_of(kobj, struct dt_device,
348 struct osd_device *osd = osd_dt_dev(dt);
356 rc = kstrtobool(buffer, &val);
360 osd->od_nonrotational = val;
/* Defines lustre_attr_nonrotational, which is listed in zfs_attrs[]. */
363 LUSTRE_RW_ATTR(nonrotational);
365 static ssize_t index_backup_show(struct kobject *kobj, struct attribute *attr,
368 struct dt_device *dt = container_of(kobj, struct dt_device,
370 struct osd_device *dev = osd_dt_dev(dt);
376 return sprintf(buf, "%d\n", dev->od_index_backup_policy);
/*
 * sysfs store handler for "index_backup": parses @buffer as an int (base 0,
 * so the base is taken from the input's prefix) and stores it in
 * dev->od_index_backup_policy.
 *
 * NOTE(review): no range check on the parsed policy value is visible here --
 * confirm that every int is acceptable to the consumers of this field.
 * NOTE(review): unlike index_backup_show() this function is not declared
 * static -- confirm whether anything outside this file needs the symbol.
 */
379 ssize_t index_backup_store(struct kobject *kobj, struct attribute *attr,
380 const char *buffer, size_t count)
382 struct dt_device *dt = container_of(kobj, struct dt_device,
384 struct osd_device *dev = osd_dt_dev(dt);
392 rc = kstrtoint(buffer, 0, &val);
396 dev->od_index_backup_policy = val;
/* Defines lustre_attr_index_backup, which is listed in zfs_attrs[]. */
399 LUSTRE_RW_ATTR(index_backup);
/*
 * seq_file show handler for "readcache_max_filesize": prints
 * osd->od_readcache_max_filesize as an unsigned decimal followed by a
 * newline. m->private is the dt_device.
 *
 * A NULL osd->od_os is checked for (and treated as unlikely) before the
 * value is printed.
 */
401 static int zfs_osd_readcache_seq_show(struct seq_file *m, void *data)
403 struct osd_device *osd = osd_dt_dev((struct dt_device *)m->private);
405 LASSERT(osd != NULL);
406 if (unlikely(osd->od_os == NULL))
409 seq_printf(m, "%llu\n", osd->od_readcache_max_filesize);
/*
 * seq_file write handler for "readcache_max_filesize".
 *
 * Copies the user input into a 22-byte stack buffer, parses it as a size
 * with sysfs_memparse() (default unit "B"), and stores the result in
 * osd->od_readcache_max_filesize, clamped to at most OSD_MAX_CACHE_SIZE.
 */
414 zfs_osd_readcache_seq_write(struct file *file, const char __user *buffer,
415 size_t count, loff_t *off)
417 struct seq_file *m = file->private_data;
418 struct dt_device *dt = m->private;
419 struct osd_device *osd = osd_dt_dev(dt);
/* Zero-initialised scratch buffer for the user-supplied text. */
420 char kernbuf[22] = "";
424 LASSERT(osd != NULL);
425 if (unlikely(osd->od_os == NULL))
/* The input must be strictly shorter than the buffer. */
428 if (count >= sizeof(kernbuf))
431 if (copy_from_user(kernbuf, buffer, count))
435 rc = sysfs_memparse(kernbuf, count, &val, "B");
/* Values above OSD_MAX_CACHE_SIZE are silently capped rather than rejected. */
439 osd->od_readcache_max_filesize = val > OSD_MAX_CACHE_SIZE ?
440 OSD_MAX_CACHE_SIZE : val;
/* Read/write fops; referenced as zfs_osd_readcache_fops in the vars table. */
443 LDEBUGFS_SEQ_FOPS(zfs_osd_readcache);
/*
 * sysfs attributes of a zfs OSD device; osd_procfs_init() installs this
 * table as dd_ktype.default_attrs of the dt_device. Each entry is the
 * lustre_attr_<name> object defined by the LUSTRE_*_ATTR(<name>) macros
 * earlier in this file.
 */
445 static struct attribute *zfs_attrs[] = {
446 &lustre_attr_fstype.attr,
447 &lustre_attr_mntdev.attr,
448 &lustre_attr_force_sync.attr,
449 &lustre_attr_nonrotational.attr,
450 &lustre_attr_index_backup.attr,
451 &lustre_attr_auto_scrub.attr,
452 &lustre_attr_sync_on_lseek.attr,
/*
 * File name -> file_operations table handed to dt_tunables_init() by
 * osd_procfs_init(): "oi_scrub" uses the read-only scrub fops,
 * "readcache_max_filesize" the read/write readcache fops.
 */
456 struct ldebugfs_vars ldebugfs_osd_obd_vars[] = {
457 { .name = "oi_scrub",
458 .fops = &zfs_osd_oi_scrub_fops },
459 { .name = "readcache_max_filesize",
460 .fops = &zfs_osd_readcache_fops },
/*
 * Create the tunables and statistics entries for @osd under the name @name.
 *
 * Visible steps: look up the zfs OSD obd_type, install zfs_attrs as the
 * dt_device's default sysfs attributes and call dt_tunables_init() with the
 * ldebugfs_osd_obd_vars table, register a procfs directory under
 * type->typ_procroot, then run osd_stats_init(). osd_procfs_fini() is
 * called near the end of the function.
 */
464 int osd_procfs_init(struct osd_device *osd, const char *name)
466 struct obd_type *type;
471 /* at the moment there is no linkage between lu_type
472 * and obd_type, so we lookup obd_type this way
474 type = class_search_type(LUSTRE_OSD_ZFS_NAME);
479 /* put reference taken by class_search_type */
480 kobject_put(&type->typ_kobj);
/*
 * NOTE(review): type is still dereferenced below (dt_tunables_init() and
 * type->typ_procroot) after the reference was dropped above -- confirm
 * something else keeps the obd_type alive for the duration of this call.
 */
482 osd->od_dt_dev.dd_ktype.default_attrs = zfs_attrs;
483 rc = dt_tunables_init(&osd->od_dt_dev, type, name,
484 ldebugfs_osd_obd_vars);
486 CERROR("%s: cannot setup sysfs / debugfs entry: %d\n",
/* A procfs directory has already been registered for this device. */
491 if (osd->od_proc_entry)
494 osd->od_proc_entry = lprocfs_register(name, type->typ_procroot,
495 NULL, &osd->od_dt_dev);
/* Convert the ERR_PTR to an errno and reset the field to NULL. */
496 if (IS_ERR(osd->od_proc_entry)) {
497 rc = PTR_ERR(osd->od_proc_entry);
498 CERROR("Error %d setting up lprocfs for %s\n", rc, name);
499 osd->od_proc_entry = NULL;
503 rc = osd_stats_init(osd);
/* Cleanup is delegated to osd_procfs_fini(). */
508 osd_procfs_fini(osd);
/*
 * Tear down what osd_procfs_init() created for @osd: free the counter set,
 * remove the procfs directory if one is registered, and finalise the
 * dt_device tunables.
 *
 * Returns the result of dt_tunables_fini().
 */
512 int osd_procfs_fini(struct osd_device *osd)
517 lprocfs_free_stats(&osd->od_stats);
519 if (osd->od_proc_entry) {
520 lprocfs_remove(&osd->od_proc_entry);
/* Explicitly reset the pointer so a later call skips this branch. */
521 osd->od_proc_entry = NULL;
524 return dt_tunables_fini(&osd->od_dt_dev);