Whamcloud - gitweb
LU-12616 obclass: fix MDS start/stop race
[fs/lustre-release.git] / lustre / mdc / lproc_mdc.c
1 /*
2  * GPL HEADER START
3  *
4  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License version 2 only,
8  * as published by the Free Software Foundation.
9  *
10  * This program is distributed in the hope that it will be useful, but
11  * WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  * General Public License version 2 for more details (a copy is included
14  * in the LICENSE file that accompanied this code).
15  *
16  * You should have received a copy of the GNU General Public License
17  * version 2 along with this program; If not, see
18  * http://www.gnu.org/licenses/gpl-2.0.html
19  *
20  * GPL HEADER END
21  */
22 /*
23  * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
24  * Use is subject to license terms.
25  *
26  * Copyright (c) 2011, 2017, Intel Corporation.
27  */
28 /*
29  * This file is part of Lustre, http://www.lustre.org/
30  * Lustre is a trademark of Sun Microsystems, Inc.
31  */
32 #define DEBUG_SUBSYSTEM S_CLASS
33
34 #include <linux/vfs.h>
35 #include <obd_class.h>
36 #include <lprocfs_status.h>
37 #include <lustre_osc.h>
38 #include <cl_object.h>
39 #include "mdc_internal.h"
40
41 static ssize_t active_show(struct kobject *kobj, struct attribute *attr,
42                            char *buf)
43 {
44         struct obd_device *dev = container_of(kobj, struct obd_device,
45                                               obd_kset.kobj);
46         ssize_t len;
47
48         LPROCFS_CLIMP_CHECK(dev);
49         len = sprintf(buf, "%d\n", !dev->u.cli.cl_import->imp_deactive);
50         LPROCFS_CLIMP_EXIT(dev);
51         return len;
52 }
53
54 static ssize_t active_store(struct kobject *kobj, struct attribute *attr,
55                             const char *buffer, size_t count)
56 {
57         struct obd_device *dev = container_of(kobj, struct obd_device,
58                                               obd_kset.kobj);
59         bool val;
60         int rc;
61
62         rc = kstrtobool(buffer, &val);
63         if (rc)
64                 return rc;
65
66         /* opposite senses */
67         if (dev->u.cli.cl_import->imp_deactive == val)
68                 rc = ptlrpc_set_import_active(dev->u.cli.cl_import, val);
69         else
70                 CDEBUG(D_CONFIG, "activate %u: ignoring repeat request\n",
71                        val);
72
73         return count;
74 }
75 LUSTRE_RW_ATTR(active);
76
77 static ssize_t max_rpcs_in_flight_show(struct kobject *kobj,
78                                        struct attribute *attr,
79                                        char *buf)
80 {
81         struct obd_device *dev = container_of(kobj, struct obd_device,
82                                               obd_kset.kobj);
83         ssize_t len;
84         u32 max;
85
86         max = obd_get_max_rpcs_in_flight(&dev->u.cli);
87         len = sprintf(buf, "%u\n", max);
88
89         return len;
90 }
91
92 static ssize_t max_rpcs_in_flight_store(struct kobject *kobj,
93                                         struct attribute *attr,
94                                         const char *buffer,
95                                         size_t count)
96 {
97         struct obd_device *dev = container_of(kobj, struct obd_device,
98                                               obd_kset.kobj);
99         unsigned int val;
100         int rc;
101
102         rc = kstrtouint(buffer, 10, &val);
103         if (rc)
104                 return rc;
105
106         rc = obd_set_max_rpcs_in_flight(&dev->u.cli, val);
107         if (rc)
108                 count = rc;
109
110         return count;
111 }
112 LUSTRE_RW_ATTR(max_rpcs_in_flight);
113
114 static ssize_t max_mod_rpcs_in_flight_show(struct kobject *kobj,
115                                            struct attribute *attr,
116                                            char *buf)
117 {
118         struct obd_device *dev = container_of(kobj, struct obd_device,
119                                               obd_kset.kobj);
120         u16 max;
121
122         max = obd_get_max_mod_rpcs_in_flight(&dev->u.cli);
123         return sprintf(buf, "%hu\n", max);
124 }
125
126 static ssize_t max_mod_rpcs_in_flight_store(struct kobject *kobj,
127                                             struct attribute *attr,
128                                             const char *buffer,
129                                             size_t count)
130 {
131         struct obd_device *dev = container_of(kobj, struct obd_device,
132                                               obd_kset.kobj);
133         u16 val;
134         int rc;
135
136         rc = kstrtou16(buffer, 10, &val);
137         if (rc)
138                 return rc;
139
140         rc = obd_set_max_mod_rpcs_in_flight(&dev->u.cli, val);
141         if (rc)
142                 count = rc;
143
144         return count;
145 }
146 LUSTRE_RW_ATTR(max_mod_rpcs_in_flight);
147
148 static int mdc_max_dirty_mb_seq_show(struct seq_file *m, void *v)
149 {
150         struct obd_device *dev = m->private;
151         struct client_obd *cli = &dev->u.cli;
152         unsigned long val;
153
154         spin_lock(&cli->cl_loi_list_lock);
155         val = PAGES_TO_MiB(cli->cl_dirty_max_pages);
156         spin_unlock(&cli->cl_loi_list_lock);
157
158         seq_printf(m, "%lu\n", val);
159         return 0;
160 }
161
162 static ssize_t mdc_max_dirty_mb_seq_write(struct file *file,
163                                           const char __user *buffer,
164                                           size_t count, loff_t *off)
165 {
166         struct seq_file *sfl = file->private_data;
167         struct obd_device *dev = sfl->private;
168         struct client_obd *cli = &dev->u.cli;
169         s64 pages_number;
170         int rc;
171
172         rc = lprocfs_str_with_units_to_s64(buffer, count, &pages_number, 'M');
173         if (rc)
174                 return rc;
175
176         /* MB -> pages */
177         pages_number = round_up(pages_number, 1024 * 1024) >> PAGE_SHIFT;
178         if (pages_number <= 0 ||
179             pages_number >= MiB_TO_PAGES(OSC_MAX_DIRTY_MB_MAX) ||
180             pages_number > cfs_totalram_pages() / 4) /* 1/4 of RAM */
181                 return -ERANGE;
182
183         spin_lock(&cli->cl_loi_list_lock);
184         cli->cl_dirty_max_pages = pages_number;
185         osc_wake_cache_waiters(cli);
186         spin_unlock(&cli->cl_loi_list_lock);
187
188         return count;
189 }
190 LPROC_SEQ_FOPS(mdc_max_dirty_mb);
191
192 static ssize_t contention_seconds_show(struct kobject *kobj,
193                                        struct attribute *attr,
194                                        char *buf)
195 {
196         struct obd_device *obd = container_of(kobj, struct obd_device,
197                                               obd_kset.kobj);
198         struct osc_device *od = obd2osc_dev(obd);
199
200         return sprintf(buf, "%lld\n", od->od_contention_time);
201 }
202
203 static ssize_t contention_seconds_store(struct kobject *kobj,
204                                         struct attribute *attr,
205                                         const char *buffer,
206                                         size_t count)
207 {
208         struct obd_device *obd = container_of(kobj, struct obd_device,
209                                               obd_kset.kobj);
210         struct osc_device *od = obd2osc_dev(obd);
211         time64_t val;
212         int rc;
213
214         rc = kstrtoll(buffer, 0, &val);
215         if (rc)
216                 return rc;
217
218         od->od_contention_time = val;
219
220         return count;
221 }
222 LUSTRE_RW_ATTR(contention_seconds);
223
/*
 * Attribute instantiations whose show/store handlers are not defined in
 * this file.  "mds_conn_uuid" is declared with mode 0444, conn_uuid_show
 * as its show handler and no store handler, i.e. it reuses the same show
 * routine as "conn_uuid".
 * NOTE(review): conn_uuid_show and the ping handlers are presumably
 * provided by shared lprocfs code - confirm where they are declared.
 */
224 LUSTRE_ATTR(mds_conn_uuid, 0444, conn_uuid_show, NULL);
225 LUSTRE_RO_ATTR(conn_uuid);
226
227 LUSTRE_RW_ATTR(ping);
228
229 static int mdc_cached_mb_seq_show(struct seq_file *m, void *v)
230 {
231         struct obd_device *dev = m->private;
232         struct client_obd *cli = &dev->u.cli;
233         int shift = 20 - PAGE_SHIFT;
234
235         seq_printf(m, "used_mb: %ld\n"
236                    "busy_cnt: %ld\n"
237                    "reclaim: %llu\n",
238                    (atomic_long_read(&cli->cl_lru_in_list) +
239                     atomic_long_read(&cli->cl_lru_busy)) >> shift,
240                     atomic_long_read(&cli->cl_lru_busy),
241                    cli->cl_lru_reclaim);
242
243         return 0;
244 }
245
246 /* shrink the number of caching pages to a specific number */
247 static ssize_t
248 mdc_cached_mb_seq_write(struct file *file, const char __user *buffer,
249                         size_t count, loff_t *off)
250 {
251         struct seq_file *sfl = file->private_data;
252         struct obd_device *dev = sfl->private;
253         struct client_obd *cli = &dev->u.cli;
254         __s64 pages_number;
255         long rc;
256         char kernbuf[128];
257
258         if (count >= sizeof(kernbuf))
259                 return -EINVAL;
260
261         if (copy_from_user(kernbuf, buffer, count))
262                 return -EFAULT;
263         kernbuf[count] = 0;
264
265         buffer += lprocfs_find_named_value(kernbuf, "used_mb:", &count) -
266                   kernbuf;
267         rc = lprocfs_str_with_units_to_s64(buffer, count, &pages_number, 'M');
268         if (rc)
269                 return rc;
270
271         pages_number >>= PAGE_SHIFT;
272
273         if (pages_number < 0)
274                 return -ERANGE;
275
276         rc = atomic_long_read(&cli->cl_lru_in_list) - pages_number;
277         if (rc > 0) {
278                 struct lu_env *env;
279                 __u16 refcheck;
280
281                 env = cl_env_get(&refcheck);
282                 if (!IS_ERR(env)) {
283                         (void)osc_lru_shrink(env, cli, rc, true);
284                         cl_env_put(env, &refcheck);
285                 }
286         }
287
288         return count;
289 }
290 LPROC_SEQ_FOPS(mdc_cached_mb);
291
292 static int mdc_unstable_stats_seq_show(struct seq_file *m, void *v)
293 {
294         struct obd_device *dev = m->private;
295         struct client_obd *cli = &dev->u.cli;
296         long pages;
297         int mb;
298
299         pages = atomic_long_read(&cli->cl_unstable_count);
300         mb    = (pages * PAGE_SIZE) >> 20;
301
302         seq_printf(m, "unstable_pages: %20ld\n"
303                    "unstable_mb:              %10d\n", pages, mb);
304         return 0;
305 }
306 LPROC_SEQ_FOPS_RO(mdc_unstable_stats);
307
308 static ssize_t mdc_rpc_stats_seq_write(struct file *file,
309                                        const char __user *buf,
310                                        size_t len, loff_t *off)
311 {
312         struct seq_file *seq = file->private_data;
313         struct obd_device *dev = seq->private;
314         struct client_obd *cli = &dev->u.cli;
315
316         lprocfs_oh_clear(&cli->cl_mod_rpcs_hist);
317
318         lprocfs_oh_clear(&cli->cl_read_rpc_hist);
319         lprocfs_oh_clear(&cli->cl_write_rpc_hist);
320         lprocfs_oh_clear(&cli->cl_read_page_hist);
321         lprocfs_oh_clear(&cli->cl_write_page_hist);
322         lprocfs_oh_clear(&cli->cl_read_offset_hist);
323         lprocfs_oh_clear(&cli->cl_write_offset_hist);
324
325         return len;
326 }
327
328 static int mdc_rpc_stats_seq_show(struct seq_file *seq, void *v)
329 {
330         struct obd_device *dev = seq->private;
331         struct client_obd *cli = &dev->u.cli;
332         unsigned long read_tot = 0, write_tot = 0, read_cum, write_cum;
333         int i;
334
335         obd_mod_rpc_stats_seq_show(&dev->u.cli, seq);
336
337         spin_lock(&cli->cl_loi_list_lock);
338
339         seq_printf(seq, "\nread RPCs in flight:  %d\n",
340                    cli->cl_r_in_flight);
341         seq_printf(seq, "write RPCs in flight: %d\n",
342                    cli->cl_w_in_flight);
343         seq_printf(seq, "pending write pages:  %d\n",
344                    atomic_read(&cli->cl_pending_w_pages));
345         seq_printf(seq, "pending read pages:   %d\n",
346                    atomic_read(&cli->cl_pending_r_pages));
347
348         seq_printf(seq, "\n\t\t\tread\t\t\twrite\n");
349         seq_printf(seq, "pages per rpc         rpcs   %% cum %% |");
350         seq_printf(seq, "       rpcs   %% cum %%\n");
351
352         read_tot = lprocfs_oh_sum(&cli->cl_read_page_hist);
353         write_tot = lprocfs_oh_sum(&cli->cl_write_page_hist);
354
355         read_cum = 0;
356         write_cum = 0;
357         for (i = 0; i < OBD_HIST_MAX; i++) {
358                 unsigned long r = cli->cl_read_page_hist.oh_buckets[i];
359                 unsigned long w = cli->cl_write_page_hist.oh_buckets[i];
360
361                 read_cum += r;
362                 write_cum += w;
363                 seq_printf(seq, "%d:\t\t%10lu %3u %3u   | %10lu %3u %3u\n",
364                            1 << i, r, pct(r, read_tot),
365                            pct(read_cum, read_tot), w,
366                            pct(w, write_tot),
367                            pct(write_cum, write_tot));
368                 if (read_cum == read_tot && write_cum == write_tot)
369                         break;
370         }
371
372         seq_printf(seq, "\n\t\t\tread\t\t\twrite\n");
373         seq_printf(seq, "rpcs in flight        rpcs   %% cum %% |");
374         seq_printf(seq, "       rpcs   %% cum %%\n");
375
376         read_tot = lprocfs_oh_sum(&cli->cl_read_rpc_hist);
377         write_tot = lprocfs_oh_sum(&cli->cl_write_rpc_hist);
378
379         read_cum = 0;
380         write_cum = 0;
381         for (i = 0; i < OBD_HIST_MAX; i++) {
382                 unsigned long r = cli->cl_read_rpc_hist.oh_buckets[i];
383                 unsigned long w = cli->cl_write_rpc_hist.oh_buckets[i];
384
385                 read_cum += r;
386                 write_cum += w;
387                 seq_printf(seq, "%d:\t\t%10lu %3u %3u   | %10lu %3u %3u\n",
388                            i, r, pct(r, read_tot), pct(read_cum, read_tot), w,
389                            pct(w, write_tot), pct(write_cum, write_tot));
390                 if (read_cum == read_tot && write_cum == write_tot)
391                         break;
392         }
393
394         seq_printf(seq, "\n\t\t\tread\t\t\twrite\n");
395         seq_printf(seq, "offset                rpcs   %% cum %% |");
396         seq_printf(seq, "       rpcs   %% cum %%\n");
397
398         read_tot = lprocfs_oh_sum(&cli->cl_read_offset_hist);
399         write_tot = lprocfs_oh_sum(&cli->cl_write_offset_hist);
400
401         read_cum = 0;
402         write_cum = 0;
403         for (i = 0; i < OBD_HIST_MAX; i++) {
404                 unsigned long r = cli->cl_read_offset_hist.oh_buckets[i];
405                 unsigned long w = cli->cl_write_offset_hist.oh_buckets[i];
406
407                 read_cum += r;
408                 write_cum += w;
409                 seq_printf(seq, "%d:\t\t%10lu %3u %3u   | %10lu %3u %3u\n",
410                            (i == 0) ? 0 : 1 << (i - 1),
411                            r, pct(r, read_tot), pct(read_cum, read_tot),
412                            w, pct(w, write_tot), pct(write_cum, write_tot));
413                 if (read_cum == read_tot && write_cum == write_tot)
414                         break;
415         }
416         spin_unlock(&cli->cl_loi_list_lock);
417
418         return 0;
419 }
420 LPROC_SEQ_FOPS(mdc_rpc_stats);
421
422 static int mdc_stats_seq_show(struct seq_file *seq, void *v)
423 {
424         struct timespec64 now;
425         struct obd_device *dev = seq->private;
426         struct osc_stats *stats = &obd2osc_dev(dev)->od_stats;
427
428         ktime_get_real_ts64(&now);
429
430         seq_printf(seq, "snapshot_time:         %lld.%09lu (secs.nsecs)\n",
431                    (s64)now.tv_sec, now.tv_nsec);
432         seq_printf(seq, "lockless_write_bytes\t\t%llu\n",
433                    stats->os_lockless_writes);
434         seq_printf(seq, "lockless_read_bytes\t\t%llu\n",
435                    stats->os_lockless_reads);
436         seq_printf(seq, "lockless_truncate\t\t%llu\n",
437                    stats->os_lockless_truncates);
438         return 0;
439 }
440
441 static ssize_t mdc_stats_seq_write(struct file *file,
442                                    const char __user *buf,
443                                    size_t len, loff_t *off)
444 {
445         struct seq_file *seq = file->private_data;
446         struct obd_device *dev = seq->private;
447         struct osc_stats *stats = &obd2osc_dev(dev)->od_stats;
448
449         memset(stats, 0, sizeof(*stats));
450         return len;
451 }
452 LPROC_SEQ_FOPS(mdc_stats);
453
454 static int mdc_dom_min_repsize_seq_show(struct seq_file *m, void *v)
455 {
456         struct obd_device *dev = m->private;
457
458         seq_printf(m, "%u\n", dev->u.cli.cl_dom_min_inline_repsize);
459
460         return 0;
461 }
462
463 static ssize_t mdc_dom_min_repsize_seq_write(struct file *file,
464                                              const char __user *buffer,
465                                              size_t count, loff_t *off)
466 {
467         struct obd_device *dev;
468         unsigned int val;
469         int rc;
470
471         dev =  ((struct seq_file *)file->private_data)->private;
472         rc = kstrtouint_from_user(buffer, count, 0, &val);
473         if (rc)
474                 return rc;
475
476         if (val > MDC_DOM_MAX_INLINE_REPSIZE)
477                 return -ERANGE;
478
479         dev->u.cli.cl_dom_min_inline_repsize = val;
480         return count;
481 }
482 LPROC_SEQ_FOPS(mdc_dom_min_repsize);
483
/*
 * Macro instantiations for the entries of lprocfs_mdc_obd_vars[] that
 * have no handler written out in this file; that table refers to them
 * as mdc_connect_flags_fops, mdc_server_uuid_fops, mdc_timeouts_fops,
 * mdc_state_fops, mdc_obd_max_pages_per_rpc_fops, mdc_import_fops and
 * mdc_pinger_recov_fops.
 * NOTE(review): the _RO/_RW suffix presumably selects read-only versus
 * read-write file operations - confirm against the macro definitions.
 */
484 LPROC_SEQ_FOPS_RO_TYPE(mdc, connect_flags);
485 LPROC_SEQ_FOPS_RO_TYPE(mdc, server_uuid);
486 LPROC_SEQ_FOPS_RO_TYPE(mdc, timeouts);
487 LPROC_SEQ_FOPS_RO_TYPE(mdc, state);
488 LPROC_SEQ_FOPS_RW_TYPE(mdc, obd_max_pages_per_rpc);
489 LPROC_SEQ_FOPS_RW_TYPE(mdc, import);
490 LPROC_SEQ_FOPS_RW_TYPE(mdc, pinger_recov);
491
492 struct lprocfs_vars lprocfs_mdc_obd_vars[] = {
493         { .name =       "connect_flags",
494           .fops =       &mdc_connect_flags_fops },
495         { .name =       "mds_server_uuid",
496           .fops =       &mdc_server_uuid_fops   },
497         { .name =       "max_pages_per_rpc",
498           .fops =       &mdc_obd_max_pages_per_rpc_fops },
499         { .name =       "max_dirty_mb",
500           .fops =       &mdc_max_dirty_mb_fops          },
501         { .name =       "mdc_cached_mb",
502           .fops =       &mdc_cached_mb_fops             },
503         { .name =       "timeouts",
504           .fops =       &mdc_timeouts_fops              },
505         { .name =       "import",
506           .fops =       &mdc_import_fops                },
507         { .name =       "state",
508           .fops =       &mdc_state_fops                 },
509         { .name =       "pinger_recov",
510           .fops =       &mdc_pinger_recov_fops          },
511         { .name =       "rpc_stats",
512           .fops =       &mdc_rpc_stats_fops             },
513         { .name =       "unstable_stats",
514           .fops =       &mdc_unstable_stats_fops        },
515         { .name =       "mdc_stats",
516           .fops =       &mdc_stats_fops                 },
517         { .name =       "mdc_dom_min_repsize",
518           .fops =       &mdc_dom_min_repsize_fops       },
519         { NULL }
520 };
521
/*
 * NULL-terminated list of the attributes declared above with the
 * LUSTRE_*_ATTR() macros.  mdc_tunables_init() installs it as
 * obd->obd_ktype.default_attrs.
 */
522 static struct attribute *mdc_attrs[] = {
523         &lustre_attr_active.attr,
524         &lustre_attr_max_rpcs_in_flight.attr,
525         &lustre_attr_max_mod_rpcs_in_flight.attr,
526         &lustre_attr_contention_seconds.attr,
527         &lustre_attr_mds_conn_uuid.attr,
528         &lustre_attr_conn_uuid.attr,
529         &lustre_attr_ping.attr,
530         NULL,
531 };
532
533 int mdc_tunables_init(struct obd_device *obd)
534 {
535         int rc;
536
537         obd->obd_ktype.default_attrs = mdc_attrs;
538         obd->obd_vars = lprocfs_mdc_obd_vars;
539
540         rc = lprocfs_obd_setup(obd, false);
541         if (rc)
542                 goto out_failed;
543 #ifdef CONFIG_PROC_FS
544         rc = lprocfs_alloc_md_stats(obd, 0);
545         if (rc) {
546                 lprocfs_obd_cleanup(obd);
547                 goto out_failed;
548         }
549 #endif
550         rc = sptlrpc_lprocfs_cliobd_attach(obd);
551         if (rc) {
552 #ifdef CONFIG_PROC_FS
553                 lprocfs_free_md_stats(obd);
554 #endif
555                 lprocfs_obd_cleanup(obd);
556                 goto out_failed;
557         }
558         ptlrpc_lprocfs_register_obd(obd);
559
560 out_failed:
561         return rc;
562 }