Whamcloud - gitweb
LU-13805 llite: add flag to disable unaligned DIO
[fs/lustre-release.git] / lustre / llite / lproc_llite.c
1 /*
2  * GPL HEADER START
3  *
4  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License version 2 only,
8  * as published by the Free Software Foundation.
9  *
10  * This program is distributed in the hope that it will be useful, but
11  * WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  * General Public License version 2 for more details (a copy is included
14  * in the LICENSE file that accompanied this code).
15  *
16  * You should have received a copy of the GNU General Public License
17  * version 2 along with this program; If not, see
18  * http://www.gnu.org/licenses/gpl-2.0.html
19  *
20  * GPL HEADER END
21  */
22 /*
23  * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
24  * Use is subject to license terms.
25  *
26  * Copyright (c) 2012, 2017, Intel Corporation.
27  */
28 /*
29  * This file is part of Lustre, http://www.lustre.org/
30  */
31 #define DEBUG_SUBSYSTEM S_LLITE
32
33 #include <linux/version.h>
34 #include <linux/user_namespace.h>
35 #include <linux/uidgid.h>
36
37 #include <uapi/linux/lustre/lustre_param.h>
38 #include <lprocfs_status.h>
39 #include <obd_support.h>
40
41 #include "llite_internal.h"
42 #include "lprocfs_status.h"
43 #include "vvp_internal.h"
44
45 static struct kobject *llite_kobj;
46 static struct dentry *llite_root;
47
48 static void llite_kobj_release(struct kobject *kobj)
49 {
50         if (!IS_ERR_OR_NULL(llite_root)) {
51                 debugfs_remove(llite_root);
52                 llite_root = NULL;
53         }
54
55         kfree(kobj);
56 }
57
58 static struct kobj_type llite_kobj_ktype = {
59         .release        = llite_kobj_release,
60         .sysfs_ops      = &lustre_sysfs_ops,
61 };
62
63 int llite_tunables_register(void)
64 {
65         int rc;
66
67         llite_kobj = kzalloc(sizeof(*llite_kobj), GFP_KERNEL);
68         if (!llite_kobj)
69                 return -ENOMEM;
70
71         llite_kobj->kset = lustre_kset;
72         rc = kobject_init_and_add(llite_kobj, &llite_kobj_ktype,
73                                   &lustre_kset->kobj, "%s", "llite");
74         if (rc)
75                 goto free_kobj;
76
77         llite_root = debugfs_create_dir("llite", debugfs_lustre_root);
78         return 0;
79
80 free_kobj:
81         kobject_put(llite_kobj);
82         llite_kobj = NULL;
83
84         return rc;
85 }
86
87 void llite_tunables_unregister(void)
88 {
89         kobject_put(llite_kobj);
90         llite_kobj = NULL;
91 }
92
/* <debugfs>/lustre/llite mount point registration */
/*
 * Forward declarations of three file_operations tables; no initializer is
 * given at this point.
 * NOTE(review): the initialized definitions are presumably further down in
 * this file - confirm.
 */
static const struct file_operations ll_rw_extents_stats_fops;
static const struct file_operations ll_rw_extents_stats_pp_fops;
static const struct file_operations ll_rw_offset_stats_fops;
97
98 /**
99  * ll_stats_pid_write() - Determine if stats collection should be enabled
100  * @buf: Buffer containing the data written
101  * @len: Number of bytes in the buffer
102  *
103  * Several proc files begin collecting stats when a value is written, and stop
104  * collecting when either '0' or 'disable' is written. This function checks the
105  * written value to see if collection should be enabled or disabled.
106  *
107  * Return: If '0' or 'disable' is provided, 0 is returned. If the text
108  * equivalent of a number is written, that number is returned. Otherwise,
109  * 1 is returned. Non-zero return values indicate collection should be enabled.
110  */
111 static s64 ll_stats_pid_write(const char __user *buf, size_t len)
112 {
113         unsigned long long value = 1;
114         char kernbuf[16];
115         int rc;
116
117         rc = kstrtoull_from_user(buf, len, 0, &value);
118         if (rc < 0 && len < sizeof(kernbuf)) {
119                 if (copy_from_user(kernbuf, buf, len))
120                         return -EFAULT;
121                 kernbuf[len] = 0;
122
123                 if (kernbuf[len - 1] == '\n')
124                         kernbuf[len - 1] = 0;
125
126                 if (strncasecmp(kernbuf, "disable", 7) == 0)
127                         value = 0;
128         }
129
130         return value;
131 }
132
133 static ssize_t blocksize_show(struct kobject *kobj, struct attribute *attr,
134                               char *buf)
135 {
136         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
137                                               ll_kset.kobj);
138         struct obd_statfs osfs;
139         int rc;
140
141         rc = ll_statfs_internal(sbi, &osfs, OBD_STATFS_NODELAY);
142         if (rc)
143                 return rc;
144
145         return sprintf(buf, "%u\n", osfs.os_bsize);
146 }
147 LUSTRE_RO_ATTR(blocksize);
148
149 static ssize_t stat_blocksize_show(struct kobject *kobj, struct attribute *attr,
150                                    char *buf)
151 {
152         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
153                                               ll_kset.kobj);
154
155         return sprintf(buf, "%u\n", sbi->ll_stat_blksize);
156 }
157
158 static ssize_t stat_blocksize_store(struct kobject *kobj,
159                                     struct attribute *attr,
160                                     const char *buffer,
161                                     size_t count)
162 {
163         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
164                                               ll_kset.kobj);
165         unsigned int val;
166         int rc;
167
168         rc = kstrtouint(buffer, 10, &val);
169         if (rc)
170                 return rc;
171
172         if (val != 0 && (val < PAGE_SIZE || (val & (val - 1))) != 0)
173                 return -ERANGE;
174
175         sbi->ll_stat_blksize = val;
176
177         return count;
178 }
179 LUSTRE_RW_ATTR(stat_blocksize);
180
181 static ssize_t kbytestotal_show(struct kobject *kobj, struct attribute *attr,
182                                 char *buf)
183 {
184         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
185                                               ll_kset.kobj);
186         struct obd_statfs osfs;
187         u32 blk_size;
188         u64 result;
189         int rc;
190
191         rc = ll_statfs_internal(sbi, &osfs, OBD_STATFS_NODELAY);
192         if (rc)
193                 return rc;
194
195         blk_size = osfs.os_bsize >> 10;
196         result = osfs.os_blocks;
197
198         while (blk_size >>= 1)
199                 result <<= 1;
200
201         return sprintf(buf, "%llu\n", result);
202 }
203 LUSTRE_RO_ATTR(kbytestotal);
204
205 static ssize_t kbytesfree_show(struct kobject *kobj, struct attribute *attr,
206                                char *buf)
207 {
208         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
209                                               ll_kset.kobj);
210         struct obd_statfs osfs;
211         u32 blk_size;
212         u64 result;
213         int rc;
214
215         rc = ll_statfs_internal(sbi, &osfs, OBD_STATFS_NODELAY);
216         if (rc)
217                 return rc;
218
219         blk_size = osfs.os_bsize >> 10;
220         result = osfs.os_bfree;
221
222         while (blk_size >>= 1)
223                 result <<= 1;
224
225         return sprintf(buf, "%llu\n", result);
226 }
227 LUSTRE_RO_ATTR(kbytesfree);
228
229 static ssize_t kbytesavail_show(struct kobject *kobj, struct attribute *attr,
230                                 char *buf)
231 {
232         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
233                                               ll_kset.kobj);
234         struct obd_statfs osfs;
235         u32 blk_size;
236         u64 result;
237         int rc;
238
239         rc = ll_statfs_internal(sbi, &osfs, OBD_STATFS_NODELAY);
240         if (rc)
241                 return rc;
242
243         blk_size = osfs.os_bsize >> 10;
244         result = osfs.os_bavail;
245
246         while (blk_size >>= 1)
247                 result <<= 1;
248
249         return sprintf(buf, "%llu\n", result);
250 }
251 LUSTRE_RO_ATTR(kbytesavail);
252
253 static ssize_t filestotal_show(struct kobject *kobj, struct attribute *attr,
254                                char *buf)
255 {
256         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
257                                               ll_kset.kobj);
258         struct obd_statfs osfs;
259         int rc;
260
261         rc = ll_statfs_internal(sbi, &osfs, OBD_STATFS_NODELAY);
262         if (rc)
263                 return rc;
264
265         return sprintf(buf, "%llu\n", osfs.os_files);
266 }
267 LUSTRE_RO_ATTR(filestotal);
268
269 static ssize_t filesfree_show(struct kobject *kobj, struct attribute *attr,
270                               char *buf)
271 {
272         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
273                                               ll_kset.kobj);
274         struct obd_statfs osfs;
275         int rc;
276
277         rc = ll_statfs_internal(sbi, &osfs, OBD_STATFS_NODELAY);
278         if (rc)
279                 return rc;
280
281         return sprintf(buf, "%llu\n", osfs.os_ffree);
282 }
283 LUSTRE_RO_ATTR(filesfree);
284
285 static ssize_t client_type_show(struct kobject *kobj, struct attribute *attr,
286                                 char *buf)
287 {
288         return sprintf(buf, "local client\n");
289 }
290 LUSTRE_RO_ATTR(client_type);
291
/*
 * Attribute declarations for the foreign symlink tunables.
 * NOTE(review): the other attributes in this file pair LUSTRE_RW_ATTR(name)
 * with name_show()/name_store() handlers; the handlers for these four
 * attributes are not visible in this part of the file - confirm they exist.
 */
LUSTRE_RW_ATTR(foreign_symlink_enable);

LUSTRE_RW_ATTR(foreign_symlink_prefix);

LUSTRE_RW_ATTR(foreign_symlink_upcall);

LUSTRE_WO_ATTR(foreign_symlink_upcall_info);
299
300 static ssize_t fstype_show(struct kobject *kobj, struct attribute *attr,
301                            char *buf)
302 {
303         return sprintf(buf, "lustre\n");
304 }
305 LUSTRE_RO_ATTR(fstype);
306
307 static ssize_t uuid_show(struct kobject *kobj, struct attribute *attr,
308                          char *buf)
309 {
310         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
311                                               ll_kset.kobj);
312
313         return sprintf(buf, "%s\n", sbi->ll_sb_uuid.uuid);
314 }
315 LUSTRE_RO_ATTR(uuid);
316
317 static int ll_site_stats_seq_show(struct seq_file *m, void *v)
318 {
319         struct super_block *sb = m->private;
320
321         /*
322          * See description of statistical counters in struct cl_site, and
323          * struct lu_site.
324          */
325         return cl_site_stats_print(lu2cl_site(ll_s2sbi(sb)->ll_site), m);
326 }
327
328 LDEBUGFS_SEQ_FOPS_RO(ll_site_stats);
329
330 static ssize_t max_read_ahead_mb_show(struct kobject *kobj,
331                                       struct attribute *attr, char *buf)
332 {
333         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
334                                               ll_kset.kobj);
335
336         return scnprintf(buf, PAGE_SIZE, "%lu\n",
337                         PAGES_TO_MiB(sbi->ll_ra_info.ra_max_pages));
338 }
339
340 static ssize_t max_read_ahead_mb_store(struct kobject *kobj,
341                                        struct attribute *attr,
342                                        const char *buffer, size_t count)
343 {
344         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
345                                               ll_kset.kobj);
346         u64 ra_max_mb, pages_number;
347         int rc;
348
349         rc = sysfs_memparse(buffer, count, &ra_max_mb, "MiB");
350         if (rc)
351                 return rc;
352
353         pages_number = round_up(ra_max_mb, 1024 * 1024) >> PAGE_SHIFT;
354         CDEBUG(D_INFO, "%s: set max_read_ahead_mb=%llu (%llu pages)\n",
355                sbi->ll_fsname, PAGES_TO_MiB(pages_number), pages_number);
356         if (pages_number > cfs_totalram_pages() / 2) {
357                 /* 1/2 of RAM */
358                 CERROR("%s: cannot set max_read_ahead_mb=%llu > totalram/2=%luMB\n",
359                        sbi->ll_fsname, PAGES_TO_MiB(pages_number),
360                        PAGES_TO_MiB(cfs_totalram_pages() / 2));
361                 return -ERANGE;
362         }
363
364         spin_lock(&sbi->ll_lock);
365         sbi->ll_ra_info.ra_max_pages = pages_number;
366         spin_unlock(&sbi->ll_lock);
367
368         return count;
369 }
370 LUSTRE_RW_ATTR(max_read_ahead_mb);
371
372 static ssize_t max_read_ahead_per_file_mb_show(struct kobject *kobj,
373                                                struct attribute *attr,
374                                                char *buf)
375 {
376         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
377                                               ll_kset.kobj);
378
379         return scnprintf(buf, PAGE_SIZE, "%lu\n",
380                          PAGES_TO_MiB(sbi->ll_ra_info.ra_max_pages_per_file));
381 }
382
383 static ssize_t max_read_ahead_per_file_mb_store(struct kobject *kobj,
384                                                 struct attribute *attr,
385                                                 const char *buffer,
386                                                 size_t count)
387 {
388         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
389                                               ll_kset.kobj);
390         u64 ra_max_file_mb, pages_number;
391         int rc;
392
393         rc = sysfs_memparse(buffer, count, &ra_max_file_mb, "MiB");
394         if (rc)
395                 return rc;
396
397         pages_number = round_up(ra_max_file_mb, 1024 * 1024) >> PAGE_SHIFT;
398         if (pages_number > sbi->ll_ra_info.ra_max_pages) {
399                 CERROR("%s: cannot set max_read_ahead_per_file_mb=%llu > max_read_ahead_mb=%lu\n",
400                        sbi->ll_fsname, PAGES_TO_MiB(pages_number),
401                        PAGES_TO_MiB(sbi->ll_ra_info.ra_max_pages));
402                 return -ERANGE;
403         }
404
405         spin_lock(&sbi->ll_lock);
406         sbi->ll_ra_info.ra_max_pages_per_file = pages_number;
407         spin_unlock(&sbi->ll_lock);
408
409         return count;
410 }
411 LUSTRE_RW_ATTR(max_read_ahead_per_file_mb);
412
413 static ssize_t max_read_ahead_whole_mb_show(struct kobject *kobj,
414                                             struct attribute *attr, char *buf)
415 {
416         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
417                                               ll_kset.kobj);
418
419         return scnprintf(buf, PAGE_SIZE, "%lu\n",
420                          PAGES_TO_MiB(sbi->ll_ra_info.ra_max_read_ahead_whole_pages));
421 }
422
423 static ssize_t max_read_ahead_whole_mb_store(struct kobject *kobj,
424                                              struct attribute *attr,
425                                              const char *buffer, size_t count)
426 {
427         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
428                                               ll_kset.kobj);
429         u64 ra_max_whole_mb, pages_number;
430         int rc;
431
432         rc = sysfs_memparse(buffer, count, &ra_max_whole_mb, "MiB");
433         if (rc)
434                 return rc;
435
436         pages_number = round_up(ra_max_whole_mb, 1024 * 1024) >> PAGE_SHIFT;
437         /* Cap this at the current max readahead window size, the readahead
438          * algorithm does this anyway so it's pointless to set it larger.
439          */
440         if (pages_number > sbi->ll_ra_info.ra_max_pages_per_file) {
441                 CERROR("%s: cannot set max_read_ahead_whole_mb=%llu > max_read_ahead_per_file_mb=%lu\n",
442                        sbi->ll_fsname, PAGES_TO_MiB(pages_number),
443                        PAGES_TO_MiB(sbi->ll_ra_info.ra_max_pages_per_file));
444
445                 return -ERANGE;
446         }
447
448         spin_lock(&sbi->ll_lock);
449         sbi->ll_ra_info.ra_max_read_ahead_whole_pages = pages_number;
450         spin_unlock(&sbi->ll_lock);
451
452         return count;
453 }
454 LUSTRE_RW_ATTR(max_read_ahead_whole_mb);
455
456 static int ll_max_cached_mb_seq_show(struct seq_file *m, void *v)
457 {
458         struct super_block     *sb    = m->private;
459         struct ll_sb_info      *sbi   = ll_s2sbi(sb);
460         struct cl_client_cache *cache = sbi->ll_cache;
461         struct ll_ra_info *ra = &sbi->ll_ra_info;
462         long max_cached_mb;
463         long unused_mb;
464
465         mutex_lock(&cache->ccc_max_cache_mb_lock);
466         max_cached_mb = PAGES_TO_MiB(cache->ccc_lru_max);
467         unused_mb = PAGES_TO_MiB(atomic_long_read(&cache->ccc_lru_left));
468         mutex_unlock(&cache->ccc_max_cache_mb_lock);
469
470         seq_printf(m, "users: %d\n"
471                       "max_cached_mb: %ld\n"
472                       "used_mb: %ld\n"
473                       "unused_mb: %ld\n"
474                       "reclaim_count: %u\n"
475                       "max_read_ahead_mb: %lu\n"
476                       "used_read_ahead_mb: %d\n",
477                    refcount_read(&cache->ccc_users),
478                    max_cached_mb,
479                    max_cached_mb - unused_mb,
480                    unused_mb,
481                    cache->ccc_lru_shrinkers,
482                    PAGES_TO_MiB(ra->ra_max_pages),
483                    PAGES_TO_MiB(atomic_read(&ra->ra_cur_pages)));
484         return 0;
485 }
486
487 static ssize_t ll_max_cached_mb_seq_write(struct file *file,
488                                           const char __user *buffer,
489                                           size_t count, loff_t *off)
490 {
491         struct seq_file *m = file->private_data;
492         struct super_block *sb = m->private;
493         struct ll_sb_info *sbi = ll_s2sbi(sb);
494         struct cl_client_cache *cache = sbi->ll_cache;
495         struct lu_env *env;
496         long diff = 0;
497         long nrpages = 0;
498         __u16 refcheck;
499         u64 value;
500         u64 pages_number;
501         int rc;
502         char kernbuf[128], *ptr;
503         bool percent = false;
504
505         ENTRY;
506         if (count >= sizeof(kernbuf))
507                 RETURN(-EINVAL);
508
509         if (copy_from_user(kernbuf, buffer, count))
510                 RETURN(-EFAULT);
511
512         if (count > 0 && kernbuf[count - 1] == '%') {
513                 percent = true;
514                 /* strip off the % */
515                 kernbuf[count - 1] = '\0';
516         } else {
517                 kernbuf[count] = '\0';
518         }
519
520         ptr = lprocfs_find_named_value(kernbuf, "max_cached_mb:", &count);
521         if (percent)
522                 rc = sysfs_memparse(ptr, count, &value, "B");
523         else
524                 rc = sysfs_memparse(ptr, count, &value, "MiB");
525         if (rc)
526                 RETURN(rc);
527
528         if (percent) {
529                 pages_number = cfs_totalram_pages() * value / 100;
530         } else {
531                 pages_number = value >> PAGE_SHIFT;
532         }
533
534         if (pages_number < 0 || pages_number > cfs_totalram_pages()) {
535                 CERROR("%s: can't set max cache more than %lu MB\n",
536                        sbi->ll_fsname,
537                        PAGES_TO_MiB(cfs_totalram_pages()));
538                 RETURN(-ERANGE);
539         }
540         /* Allow enough cache so clients can make well-formed RPCs */
541         pages_number = max_t(long, pages_number, PTLRPC_MAX_BRW_PAGES);
542
543         mutex_lock(&cache->ccc_max_cache_mb_lock);
544         diff = pages_number - cache->ccc_lru_max;
545
546         /* easy - add more LRU slots. */
547         if (diff >= 0) {
548                 atomic_long_add(diff, &cache->ccc_lru_left);
549                 GOTO(out, rc = 0);
550         }
551
552         env = cl_env_get(&refcheck);
553         if (IS_ERR(env))
554                 GOTO(out_unlock, rc = PTR_ERR(env));
555
556         diff = -diff;
557         while (diff > 0) {
558                 long tmp;
559
560                 /* reduce LRU budget from free slots. */
561                 do {
562                         long lru_left_old, lru_left_new, lru_left_ret;
563
564                         lru_left_old = atomic_long_read(&cache->ccc_lru_left);
565                         if (lru_left_old == 0)
566                                 break;
567
568                         lru_left_new = lru_left_old > diff ?
569                                         lru_left_old - diff : 0;
570                         lru_left_ret =
571                                 atomic_long_cmpxchg(&cache->ccc_lru_left,
572                                                     lru_left_old,
573                                                     lru_left_new);
574                         if (likely(lru_left_old == lru_left_ret)) {
575                                 diff -= lru_left_old - lru_left_new;
576                                 nrpages += lru_left_old - lru_left_new;
577                                 break;
578                         }
579                 } while (1);
580
581                 if (diff <= 0)
582                         break;
583
584                 if (sbi->ll_dt_exp == NULL) { /* being initialized */
585                         rc = -ENODEV;
586                         break;
587                 }
588
589                 /* Request extra free slots to avoid them all being used
590                  * by other processes before this can continue shrinking.
591                  */
592                 tmp = diff + min_t(long, diff, MiB_TO_PAGES(1024));
593                 /* difficult - have to ask OSCs to drop LRU slots. */
594                 rc = obd_set_info_async(env, sbi->ll_dt_exp,
595                                 sizeof(KEY_CACHE_LRU_SHRINK),
596                                 KEY_CACHE_LRU_SHRINK,
597                                 sizeof(tmp), &tmp, NULL);
598                 if (rc < 0)
599                         break;
600         }
601         cl_env_put(env, &refcheck);
602
603 out:
604         if (rc >= 0) {
605                 cache->ccc_lru_max = pages_number;
606                 rc = count;
607         } else {
608                 atomic_long_add(nrpages, &cache->ccc_lru_left);
609         }
610 out_unlock:
611         mutex_unlock(&cache->ccc_max_cache_mb_lock);
612         return rc;
613 }
614 LDEBUGFS_SEQ_FOPS(ll_max_cached_mb);
615
616 static ssize_t checksums_show(struct kobject *kobj, struct attribute *attr,
617                               char *buf)
618 {
619         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
620                                               ll_kset.kobj);
621
622         return scnprintf(buf, PAGE_SIZE, "%u\n",
623                          test_bit(LL_SBI_CHECKSUM, sbi->ll_flags));
624 }
625
626 static ssize_t checksums_store(struct kobject *kobj, struct attribute *attr,
627                                const char *buffer, size_t count)
628 {
629         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
630                                               ll_kset.kobj);
631         bool val;
632         int tmp;
633         int rc;
634
635         if (!sbi->ll_dt_exp)
636                 /* Not set up yet */
637                 return -EAGAIN;
638
639         rc = kstrtobool(buffer, &val);
640         if (rc)
641                 return rc;
642         if (val)
643                 set_bit(LL_SBI_CHECKSUM, sbi->ll_flags);
644         else
645                 clear_bit(LL_SBI_CHECKSUM, sbi->ll_flags);
646         tmp = val;
647
648         rc = obd_set_info_async(NULL, sbi->ll_dt_exp, sizeof(KEY_CHECKSUM),
649                                 KEY_CHECKSUM, sizeof(tmp), &tmp, NULL);
650         if (rc)
651                 CWARN("Failed to set OSC checksum flags: %d\n", rc);
652
653         return count;
654 }
655 LUSTRE_RW_ATTR(checksums);
656
657 LUSTRE_ATTR(checksum_pages, 0644, checksums_show, checksums_store);
658
659 static ssize_t ll_rd_track_id(struct kobject *kobj, char *buf,
660                               enum stats_track_type type)
661 {
662         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
663                                               ll_kset.kobj);
664
665         if (sbi->ll_stats_track_type == type)
666                 return sprintf(buf, "%d\n", sbi->ll_stats_track_id);
667         else if (sbi->ll_stats_track_type == STATS_TRACK_ALL)
668                 return sprintf(buf, "0 (all)\n");
669
670         return sprintf(buf, "untracked\n");
671 }
672
673 static ssize_t ll_wr_track_id(struct kobject *kobj, const char *buffer,
674                               size_t count, enum stats_track_type type)
675 {
676         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
677                                               ll_kset.kobj);
678         unsigned long pid;
679         int rc;
680
681         rc = kstrtoul(buffer, 10, &pid);
682         if (rc)
683                 return rc;
684
685         sbi->ll_stats_track_id = pid;
686         if (pid == 0)
687                 sbi->ll_stats_track_type = STATS_TRACK_ALL;
688         else
689                 sbi->ll_stats_track_type = type;
690         lprocfs_stats_clear(sbi->ll_stats);
691         return count;
692 }
693
694 static ssize_t stats_track_pid_show(struct kobject *kobj,
695                                     struct attribute *attr,
696                                     char *buf)
697 {
698         return ll_rd_track_id(kobj, buf, STATS_TRACK_PID);
699 }
700
701 static ssize_t stats_track_pid_store(struct kobject *kobj,
702                                      struct attribute *attr,
703                                      const char *buffer,
704                                      size_t count)
705 {
706         return ll_wr_track_id(kobj, buffer, count, STATS_TRACK_PID);
707 }
708 LUSTRE_RW_ATTR(stats_track_pid);
709
710 static ssize_t stats_track_ppid_show(struct kobject *kobj,
711                                      struct attribute *attr,
712                                      char *buf)
713 {
714         return ll_rd_track_id(kobj, buf, STATS_TRACK_PPID);
715 }
716
717 static ssize_t stats_track_ppid_store(struct kobject *kobj,
718                                       struct attribute *attr,
719                                       const char *buffer,
720                                       size_t count)
721 {
722         return ll_wr_track_id(kobj, buffer, count, STATS_TRACK_PPID);
723 }
724 LUSTRE_RW_ATTR(stats_track_ppid);
725
726 static ssize_t stats_track_gid_show(struct kobject *kobj,
727                                     struct attribute *attr,
728                                     char *buf)
729 {
730         return ll_rd_track_id(kobj, buf, STATS_TRACK_GID);
731 }
732
733 static ssize_t stats_track_gid_store(struct kobject *kobj,
734                                      struct attribute *attr,
735                                      const char *buffer,
736                                      size_t count)
737 {
738         return ll_wr_track_id(kobj, buffer, count, STATS_TRACK_GID);
739 }
740 LUSTRE_RW_ATTR(stats_track_gid);
741
742 static ssize_t statahead_running_max_show(struct kobject *kobj,
743                                           struct attribute *attr,
744                                           char *buf)
745 {
746         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
747                                               ll_kset.kobj);
748
749         return scnprintf(buf, PAGE_SIZE, "%u\n", sbi->ll_sa_running_max);
750 }
751
752 static ssize_t statahead_running_max_store(struct kobject *kobj,
753                                            struct attribute *attr,
754                                            const char *buffer,
755                                            size_t count)
756 {
757         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
758                                               ll_kset.kobj);
759         unsigned long val;
760         int rc;
761
762         rc = kstrtoul(buffer, 0, &val);
763         if (rc)
764                 return rc;
765
766         if (val <= LL_SA_RUNNING_MAX) {
767                 sbi->ll_sa_running_max = val;
768                 return count;
769         }
770
771         CERROR("Bad statahead_running_max value %lu. Valid values "
772                "are in the range [0, %d]\n", val, LL_SA_RUNNING_MAX);
773
774         return -ERANGE;
775 }
776 LUSTRE_RW_ATTR(statahead_running_max);
777
778 static ssize_t statahead_batch_max_show(struct kobject *kobj,
779                                         struct attribute *attr,
780                                         char *buf)
781 {
782         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
783                                               ll_kset.kobj);
784
785         return snprintf(buf, 16, "%u\n", sbi->ll_sa_batch_max);
786 }
787
788 static ssize_t statahead_batch_max_store(struct kobject *kobj,
789                                          struct attribute *attr,
790                                          const char *buffer,
791                                          size_t count)
792 {
793         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
794                                               ll_kset.kobj);
795         unsigned long val;
796         int rc;
797
798         rc = kstrtoul(buffer, 0, &val);
799         if (rc)
800                 return rc;
801
802         if (val > LL_SA_BATCH_MAX) {
803                 CWARN("%s: statahead_batch_max value %lu limited to maximum %d\n",
804                       sbi->ll_fsname, val, LL_SA_BATCH_MAX);
805                 val = LL_SA_BATCH_MAX;
806         }
807
808         sbi->ll_sa_batch_max = val;
809         return count;
810 }
811 LUSTRE_RW_ATTR(statahead_batch_max);
812
813 static ssize_t statahead_max_show(struct kobject *kobj,
814                                   struct attribute *attr,
815                                   char *buf)
816 {
817         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
818                                               ll_kset.kobj);
819
820         return sprintf(buf, "%u\n", sbi->ll_sa_max);
821 }
822
823 static ssize_t statahead_max_store(struct kobject *kobj,
824                                    struct attribute *attr,
825                                    const char *buffer,
826                                    size_t count)
827 {
828         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
829                                               ll_kset.kobj);
830         unsigned long val;
831         int rc;
832
833         rc = kstrtoul(buffer, 0, &val);
834         if (rc)
835                 return rc;
836
837         if (val > LL_SA_RPC_MAX) {
838                 CWARN("%s: statahead_max value %lu limited to maximum %d\n",
839                       sbi->ll_fsname, val, LL_SA_RPC_MAX);
840                 val = LL_SA_RPC_MAX;
841         }
842
843         sbi->ll_sa_max = val;
844         return count;
845 }
846 LUSTRE_RW_ATTR(statahead_max);
847
848 static ssize_t statahead_agl_show(struct kobject *kobj,
849                                   struct attribute *attr,
850                                   char *buf)
851 {
852         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
853                                               ll_kset.kobj);
854
855         return scnprintf(buf, PAGE_SIZE, "%u\n",
856                          test_bit(LL_SBI_AGL_ENABLED, sbi->ll_flags));
857 }
858
859 static ssize_t statahead_agl_store(struct kobject *kobj,
860                                    struct attribute *attr,
861                                    const char *buffer,
862                                    size_t count)
863 {
864         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
865                                               ll_kset.kobj);
866         bool val;
867         int rc;
868
869         rc = kstrtobool(buffer, &val);
870         if (rc)
871                 return rc;
872
873         if (val)
874                 set_bit(LL_SBI_AGL_ENABLED, sbi->ll_flags);
875         else
876                 clear_bit(LL_SBI_AGL_ENABLED, sbi->ll_flags);
877
878         return count;
879 }
880 LUSTRE_RW_ATTR(statahead_agl);
881
882 static int ll_statahead_stats_seq_show(struct seq_file *m, void *v)
883 {
884         struct super_block *sb = m->private;
885         struct ll_sb_info *sbi = ll_s2sbi(sb);
886
887         seq_printf(m, "statahead total: %u\n"
888                       "statahead wrong: %u\n"
889                       "agl total: %u\n"
890                       "hit_total: %u\n"
891                       "miss_total: %u\n",
892                    atomic_read(&sbi->ll_sa_total),
893                    atomic_read(&sbi->ll_sa_wrong),
894                    atomic_read(&sbi->ll_agl_total),
895                    atomic_read(&sbi->ll_sa_hit_total),
896                    atomic_read(&sbi->ll_sa_miss_total));
897         return 0;
898 }
899
900 static ssize_t ll_statahead_stats_seq_write(struct file *file,
901                                             const char __user *buffer,
902                                             size_t count, loff_t *off)
903 {
904         struct seq_file *m = file->private_data;
905         struct super_block *sb = m->private;
906         struct ll_sb_info *sbi = ll_s2sbi(sb);
907
908         atomic_set(&sbi->ll_sa_total, 0);
909         atomic_set(&sbi->ll_sa_wrong, 0);
910         atomic_set(&sbi->ll_agl_total, 0);
911         atomic_set(&sbi->ll_sa_hit_total, 0);
912         atomic_set(&sbi->ll_sa_miss_total, 0);
913
914         return count;
915 }
916 LDEBUGFS_SEQ_FOPS(ll_statahead_stats);
917
918 static ssize_t lazystatfs_show(struct kobject *kobj,
919                                struct attribute *attr,
920                                char *buf)
921 {
922         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
923                                               ll_kset.kobj);
924
925         return scnprintf(buf, PAGE_SIZE, "%u\n",
926                          test_bit(LL_SBI_LAZYSTATFS, sbi->ll_flags));
927 }
928
929 static ssize_t lazystatfs_store(struct kobject *kobj,
930                                 struct attribute *attr,
931                                 const char *buffer,
932                                 size_t count)
933 {
934         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
935                                               ll_kset.kobj);
936         bool val;
937         int rc;
938
939         rc = kstrtobool(buffer, &val);
940         if (rc)
941                 return rc;
942
943         if (val)
944                 set_bit(LL_SBI_LAZYSTATFS, sbi->ll_flags);
945         else
946                 clear_bit(LL_SBI_LAZYSTATFS, sbi->ll_flags);
947
948         return count;
949 }
950 LUSTRE_RW_ATTR(lazystatfs);
951
952 static ssize_t statfs_max_age_show(struct kobject *kobj, struct attribute *attr,
953                                    char *buf)
954 {
955         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
956                                               ll_kset.kobj);
957
958         return scnprintf(buf, PAGE_SIZE, "%u\n", sbi->ll_statfs_max_age);
959 }
960
961 static ssize_t statfs_max_age_store(struct kobject *kobj,
962                                     struct attribute *attr, const char *buffer,
963                                     size_t count)
964 {
965         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
966                                               ll_kset.kobj);
967         unsigned int val;
968         int rc;
969
970         rc = kstrtouint(buffer, 10, &val);
971         if (rc)
972                 return rc;
973         if (val > OBD_STATFS_CACHE_MAX_AGE)
974                 return -EINVAL;
975
976         sbi->ll_statfs_max_age = val;
977
978         return count;
979 }
980 LUSTRE_RW_ATTR(statfs_max_age);
981
982 static ssize_t max_easize_show(struct kobject *kobj,
983                                struct attribute *attr,
984                                char *buf)
985 {
986         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
987                                               ll_kset.kobj);
988         unsigned int ealen;
989         int rc;
990
991         rc = ll_get_max_mdsize(sbi, &ealen);
992         if (rc)
993                 return rc;
994
995         /* Limit xattr size returned to userspace based on kernel maximum */
996         return scnprintf(buf, PAGE_SIZE, "%u\n",
997                          ealen > XATTR_SIZE_MAX ? XATTR_SIZE_MAX : ealen);
998 }
999 LUSTRE_RO_ATTR(max_easize);
1000
1001 /**
1002  * Get default_easize.
1003  *
1004  * \see client_obd::cl_default_mds_easize
1005  *
1006  * \param[in] m         seq_file handle
1007  * \param[in] v         unused for single entry
1008  *
1009  * \retval 0            on success
1010  * \retval negative     negated errno on failure
1011  */
1012 static ssize_t default_easize_show(struct kobject *kobj,
1013                                    struct attribute *attr,
1014                                    char *buf)
1015 {
1016         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1017                                               ll_kset.kobj);
1018         unsigned int ealen;
1019         int rc;
1020
1021         rc = ll_get_default_mdsize(sbi, &ealen);
1022         if (rc)
1023                 return rc;
1024
1025         /* Limit xattr size returned to userspace based on kernel maximum */
1026         return scnprintf(buf, PAGE_SIZE, "%u\n",
1027                          ealen > XATTR_SIZE_MAX ? XATTR_SIZE_MAX : ealen);
1028 }
1029
1030 /**
1031  * Set default_easize.
1032  *
1033  * Range checking on the passed value is handled by
1034  * ll_set_default_mdsize().
1035  *
1036  * \see client_obd::cl_default_mds_easize
1037  *
1038  * \param[in] file      proc file
1039  * \param[in] buffer    string passed from user space
1040  * \param[in] count     \a buffer length
1041  * \param[in] off       unused for single entry
1042  *
1043  * \retval positive     \a count on success
1044  * \retval negative     negated errno on failure
1045  */
1046 static ssize_t default_easize_store(struct kobject *kobj,
1047                                     struct attribute *attr,
1048                                     const char *buffer,
1049                                     size_t count)
1050 {
1051         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1052                                               ll_kset.kobj);
1053         unsigned int val;
1054         int rc;
1055
1056         if (count == 0)
1057                 return 0;
1058
1059         rc = kstrtouint(buffer, 10, &val);
1060         if (rc)
1061                 return rc;
1062
1063         rc = ll_set_default_mdsize(sbi, val);
1064         if (rc)
1065                 return rc;
1066
1067         return count;
1068 }
1069 LUSTRE_RW_ATTR(default_easize);
1070
1071 LDEBUGFS_SEQ_FOPS_RO(ll_sbi_flags);
1072
1073 static ssize_t xattr_cache_show(struct kobject *kobj,
1074                                 struct attribute *attr,
1075                                 char *buf)
1076 {
1077         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1078                                               ll_kset.kobj);
1079
1080         return sprintf(buf, "%u\n", sbi->ll_xattr_cache_enabled);
1081 }
1082
1083 static ssize_t xattr_cache_store(struct kobject *kobj,
1084                                  struct attribute *attr,
1085                                  const char *buffer,
1086                                  size_t count)
1087 {
1088         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1089                                               ll_kset.kobj);
1090         bool val;
1091         int rc;
1092
1093         rc = kstrtobool(buffer, &val);
1094         if (rc)
1095                 return rc;
1096
1097         if (val && !test_bit(LL_SBI_XATTR_CACHE, sbi->ll_flags))
1098                 return -EOPNOTSUPP;
1099
1100         sbi->ll_xattr_cache_enabled = val;
1101         sbi->ll_xattr_cache_set = 1;
1102
1103         return count;
1104 }
1105 LUSTRE_RW_ATTR(xattr_cache);
1106
1107 static ssize_t tiny_write_show(struct kobject *kobj,
1108                                struct attribute *attr,
1109                                char *buf)
1110 {
1111         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1112                                               ll_kset.kobj);
1113
1114         return scnprintf(buf, PAGE_SIZE, "%u\n",
1115                          test_bit(LL_SBI_TINY_WRITE, sbi->ll_flags));
1116 }
1117
1118 static ssize_t tiny_write_store(struct kobject *kobj,
1119                                 struct attribute *attr,
1120                                 const char *buffer,
1121                                 size_t count)
1122 {
1123         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1124                                               ll_kset.kobj);
1125         bool val;
1126         int rc;
1127
1128         rc = kstrtobool(buffer, &val);
1129         if (rc)
1130                 return rc;
1131
1132         spin_lock(&sbi->ll_lock);
1133         if (val)
1134                 set_bit(LL_SBI_TINY_WRITE, sbi->ll_flags);
1135         else
1136                 clear_bit(LL_SBI_TINY_WRITE, sbi->ll_flags);
1137         spin_unlock(&sbi->ll_lock);
1138
1139         return count;
1140 }
1141 LUSTRE_RW_ATTR(tiny_write);
1142
1143 static ssize_t unaligned_dio_show(struct kobject *kobj,
1144                                   struct attribute *attr,
1145                                   char *buf)
1146 {
1147         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1148                                               ll_kset.kobj);
1149
1150         return scnprintf(buf, PAGE_SIZE, "%u\n",
1151                          test_bit(LL_SBI_UNALIGNED_DIO, sbi->ll_flags));
1152 }
1153
1154 static ssize_t unaligned_dio_store(struct kobject *kobj,
1155                                    struct attribute *attr,
1156                                    const char *buffer,
1157                                    size_t count)
1158 {
1159         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1160                                               ll_kset.kobj);
1161         bool val;
1162         int rc;
1163
1164         rc = kstrtobool(buffer, &val);
1165         if (rc)
1166                 return rc;
1167
1168         spin_lock(&sbi->ll_lock);
1169         if (val)
1170                 set_bit(LL_SBI_UNALIGNED_DIO, sbi->ll_flags);
1171         else
1172                 clear_bit(LL_SBI_UNALIGNED_DIO, sbi->ll_flags);
1173         spin_unlock(&sbi->ll_lock);
1174
1175         return count;
1176 }
1177 LUSTRE_RW_ATTR(unaligned_dio);
1178
1179 static ssize_t parallel_dio_show(struct kobject *kobj,
1180                                  struct attribute *attr,
1181                                  char *buf)
1182 {
1183         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1184                                               ll_kset.kobj);
1185
1186         return snprintf(buf, PAGE_SIZE, "%u\n",
1187                         test_bit(LL_SBI_PARALLEL_DIO, sbi->ll_flags));
1188 }
1189
1190 static ssize_t parallel_dio_store(struct kobject *kobj,
1191                                   struct attribute *attr,
1192                                   const char *buffer,
1193                                   size_t count)
1194 {
1195         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1196                                               ll_kset.kobj);
1197         bool val;
1198         int rc;
1199
1200         rc = kstrtobool(buffer, &val);
1201         if (rc)
1202                 return rc;
1203
1204         spin_lock(&sbi->ll_lock);
1205         if (val)
1206                 set_bit(LL_SBI_PARALLEL_DIO, sbi->ll_flags);
1207         else
1208                 clear_bit(LL_SBI_PARALLEL_DIO, sbi->ll_flags);
1209         spin_unlock(&sbi->ll_lock);
1210
1211         return count;
1212 }
1213 LUSTRE_RW_ATTR(parallel_dio);
1214
1215 static ssize_t max_read_ahead_async_active_show(struct kobject *kobj,
1216                                                struct attribute *attr,
1217                                                char *buf)
1218 {
1219         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1220                                               ll_kset.kobj);
1221
1222         return scnprintf(buf, PAGE_SIZE, "%u\n",
1223                          sbi->ll_ra_info.ra_async_max_active);
1224 }
1225
1226 static ssize_t max_read_ahead_async_active_store(struct kobject *kobj,
1227                                                  struct attribute *attr,
1228                                                  const char *buffer,
1229                                                  size_t count)
1230 {
1231         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1232                                               ll_kset.kobj);
1233         unsigned int val;
1234         int rc;
1235
1236         rc = kstrtouint(buffer, 10, &val);
1237         if (rc)
1238                 return rc;
1239
1240         /**
1241          * It doesn't make any sense to make it exceed what
1242          * workqueue could acutally support. This can easily
1243          * over subscripe the cores but Lustre internally
1244          * throttles to avoid those impacts.
1245          */
1246         if (val > WQ_UNBOUND_MAX_ACTIVE) {
1247                 CERROR("%s: cannot set max_read_ahead_async_active=%u larger than %u\n",
1248                        sbi->ll_fsname, val, WQ_UNBOUND_MAX_ACTIVE);
1249                 return -ERANGE;
1250         }
1251
1252         spin_lock(&sbi->ll_lock);
1253         sbi->ll_ra_info.ra_async_max_active = val;
1254         spin_unlock(&sbi->ll_lock);
1255
1256         return count;
1257 }
1258 LUSTRE_RW_ATTR(max_read_ahead_async_active);
1259
1260 static ssize_t read_ahead_async_file_threshold_mb_show(struct kobject *kobj,
1261                                                        struct attribute *attr,
1262                                                        char *buf)
1263 {
1264         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1265                                               ll_kset.kobj);
1266
1267         return scnprintf(buf, PAGE_SIZE, "%lu\n", PAGES_TO_MiB(
1268                          sbi->ll_ra_info.ra_async_pages_per_file_threshold));
1269 }
1270
1271 static ssize_t
1272 read_ahead_async_file_threshold_mb_store(struct kobject *kobj,
1273                                          struct attribute *attr,
1274                                          const char *buffer, size_t count)
1275 {
1276         unsigned long pages_number;
1277         unsigned long max_ra_per_file;
1278         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1279                                               ll_kset.kobj);
1280         int rc;
1281
1282         rc = kstrtoul(buffer, 10, &pages_number);
1283         if (rc)
1284                 return rc;
1285
1286         pages_number = MiB_TO_PAGES(pages_number);
1287         max_ra_per_file = sbi->ll_ra_info.ra_max_pages_per_file;
1288         if (pages_number < 0 || pages_number > max_ra_per_file) {
1289                 CERROR("%s: can't set read_ahead_async_file_threshold_mb=%lu > "
1290                        "max_read_readahead_per_file_mb=%lu\n", sbi->ll_fsname,
1291                        PAGES_TO_MiB(pages_number),
1292                        PAGES_TO_MiB(max_ra_per_file));
1293                 return -ERANGE;
1294         }
1295         sbi->ll_ra_info.ra_async_pages_per_file_threshold = pages_number;
1296
1297         return count;
1298 }
1299 LUSTRE_RW_ATTR(read_ahead_async_file_threshold_mb);
1300
1301 static ssize_t read_ahead_range_kb_show(struct kobject *kobj,
1302                                         struct attribute *attr,char *buf)
1303 {
1304         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1305                                               ll_kset.kobj);
1306
1307         return snprintf(buf, PAGE_SIZE, "%lu\n",
1308                         sbi->ll_ra_info.ra_range_pages << (PAGE_SHIFT - 10));
1309 }
1310
1311 static ssize_t
1312 read_ahead_range_kb_store(struct kobject *kobj,
1313                                struct attribute *attr,
1314                                const char *buffer, size_t count)
1315 {
1316         unsigned long pages_number;
1317         unsigned long max_ra_per_file;
1318         u64 val;
1319         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1320                                               ll_kset.kobj);
1321         int rc;
1322
1323         rc = sysfs_memparse(buffer, count, &val, "KiB");
1324         if (rc < 0)
1325                 return rc;
1326
1327         pages_number = val >> PAGE_SHIFT;
1328         /* Disable mmap range read */
1329         if (pages_number == 0)
1330                 goto out;
1331
1332         max_ra_per_file = sbi->ll_ra_info.ra_max_pages_per_file;
1333         if (pages_number > max_ra_per_file ||
1334             pages_number < RA_MIN_MMAP_RANGE_PAGES)
1335                 return -ERANGE;
1336
1337 out:
1338         spin_lock(&sbi->ll_lock);
1339         sbi->ll_ra_info.ra_range_pages = pages_number;
1340         spin_unlock(&sbi->ll_lock);
1341
1342         return count;
1343 }
1344 LUSTRE_RW_ATTR(read_ahead_range_kb);
1345
1346 static ssize_t fast_read_show(struct kobject *kobj,
1347                               struct attribute *attr,
1348                               char *buf)
1349 {
1350         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1351                                               ll_kset.kobj);
1352
1353         return scnprintf(buf, PAGE_SIZE, "%u\n",
1354                          test_bit(LL_SBI_FAST_READ, sbi->ll_flags));
1355 }
1356
1357 static ssize_t fast_read_store(struct kobject *kobj,
1358                                struct attribute *attr,
1359                                const char *buffer,
1360                                size_t count)
1361 {
1362         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1363                                               ll_kset.kobj);
1364         bool val;
1365         int rc;
1366
1367         rc = kstrtobool(buffer, &val);
1368         if (rc)
1369                 return rc;
1370
1371         spin_lock(&sbi->ll_lock);
1372         if (val)
1373                 set_bit(LL_SBI_FAST_READ, sbi->ll_flags);
1374         else
1375                 clear_bit(LL_SBI_FAST_READ, sbi->ll_flags);
1376         spin_unlock(&sbi->ll_lock);
1377
1378         return count;
1379 }
1380 LUSTRE_RW_ATTR(fast_read);
1381
1382 static ssize_t file_heat_show(struct kobject *kobj,
1383                               struct attribute *attr,
1384                               char *buf)
1385 {
1386         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1387                                               ll_kset.kobj);
1388
1389         return scnprintf(buf, PAGE_SIZE, "%u\n",
1390                          test_bit(LL_SBI_FILE_HEAT, sbi->ll_flags));
1391 }
1392
1393 static ssize_t file_heat_store(struct kobject *kobj,
1394                                struct attribute *attr,
1395                                const char *buffer,
1396                                size_t count)
1397 {
1398         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1399                                               ll_kset.kobj);
1400         bool val;
1401         int rc;
1402
1403         rc = kstrtobool(buffer, &val);
1404         if (rc)
1405                 return rc;
1406
1407         spin_lock(&sbi->ll_lock);
1408         if (val)
1409                 set_bit(LL_SBI_FILE_HEAT, sbi->ll_flags);
1410         else
1411                 clear_bit(LL_SBI_FILE_HEAT, sbi->ll_flags);
1412         spin_unlock(&sbi->ll_lock);
1413
1414         return count;
1415 }
1416 LUSTRE_RW_ATTR(file_heat);
1417
1418 static ssize_t heat_decay_percentage_show(struct kobject *kobj,
1419                                           struct attribute *attr,
1420                                           char *buf)
1421 {
1422         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1423                                               ll_kset.kobj);
1424
1425         return scnprintf(buf, PAGE_SIZE, "%u\n",
1426                          (sbi->ll_heat_decay_weight * 100 + 128) / 256);
1427 }
1428
1429 static ssize_t heat_decay_percentage_store(struct kobject *kobj,
1430                                            struct attribute *attr,
1431                                            const char *buffer,
1432                                            size_t count)
1433 {
1434         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1435                                               ll_kset.kobj);
1436         unsigned long val;
1437         int rc;
1438
1439         rc = kstrtoul(buffer, 10, &val);
1440         if (rc)
1441                 return rc;
1442
1443         if (val < 0 || val > 100)
1444                 return -ERANGE;
1445
1446         sbi->ll_heat_decay_weight = (val * 256 + 50) / 100;
1447
1448         return count;
1449 }
1450 LUSTRE_RW_ATTR(heat_decay_percentage);
1451
1452 static ssize_t heat_period_second_show(struct kobject *kobj,
1453                                        struct attribute *attr,
1454                                        char *buf)
1455 {
1456         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1457                                               ll_kset.kobj);
1458
1459         return scnprintf(buf, PAGE_SIZE, "%u\n", sbi->ll_heat_period_second);
1460 }
1461
1462 static ssize_t heat_period_second_store(struct kobject *kobj,
1463                                         struct attribute *attr,
1464                                         const char *buffer,
1465                                         size_t count)
1466 {
1467         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1468                                               ll_kset.kobj);
1469         unsigned long val;
1470         int rc;
1471
1472         rc = kstrtoul(buffer, 10, &val);
1473         if (rc)
1474                 return rc;
1475
1476         if (val <= 0)
1477                 return -ERANGE;
1478
1479         sbi->ll_heat_period_second = val;
1480
1481         return count;
1482 }
1483 LUSTRE_RW_ATTR(heat_period_second);
1484
1485 static ssize_t opencache_threshold_count_show(struct kobject *kobj,
1486                                               struct attribute *attr,
1487                                               char *buf)
1488 {
1489         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1490                                               ll_kset.kobj);
1491
1492         if (sbi->ll_oc_thrsh_count)
1493                 return snprintf(buf, PAGE_SIZE, "%u\n",
1494                                 sbi->ll_oc_thrsh_count);
1495         else
1496                 return snprintf(buf, PAGE_SIZE, "off\n");
1497 }
1498
1499 static ssize_t opencache_threshold_count_store(struct kobject *kobj,
1500                                                struct attribute *attr,
1501                                                const char *buffer,
1502                                                size_t count)
1503 {
1504         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1505                                               ll_kset.kobj);
1506         unsigned int val;
1507         int rc;
1508
1509         rc = kstrtouint(buffer, 10, &val);
1510         if (rc) {
1511                 bool enable;
1512                 /* also accept "off" to disable and "on" to always cache */
1513                 rc = kstrtobool(buffer, &enable);
1514                 if (rc)
1515                         return rc;
1516                 val = enable;
1517         }
1518         sbi->ll_oc_thrsh_count = val;
1519
1520         return count;
1521 }
1522 LUSTRE_RW_ATTR(opencache_threshold_count);
1523
1524 static ssize_t opencache_threshold_ms_show(struct kobject *kobj,
1525                                            struct attribute *attr,
1526                                            char *buf)
1527 {
1528         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1529                                               ll_kset.kobj);
1530
1531         return snprintf(buf, PAGE_SIZE, "%u\n", sbi->ll_oc_thrsh_ms);
1532 }
1533
1534 static ssize_t opencache_threshold_ms_store(struct kobject *kobj,
1535                                             struct attribute *attr,
1536                                             const char *buffer,
1537                                             size_t count)
1538 {
1539         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1540                                               ll_kset.kobj);
1541         unsigned int val;
1542         int rc;
1543
1544         rc = kstrtouint(buffer, 10, &val);
1545         if (rc)
1546                 return rc;
1547
1548         sbi->ll_oc_thrsh_ms = val;
1549
1550         return count;
1551 }
1552 LUSTRE_RW_ATTR(opencache_threshold_ms);
1553
1554 static ssize_t opencache_max_ms_show(struct kobject *kobj,
1555                                      struct attribute *attr,
1556                                      char *buf)
1557 {
1558         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1559                                               ll_kset.kobj);
1560
1561         return snprintf(buf, PAGE_SIZE, "%u\n", sbi->ll_oc_max_ms);
1562 }
1563
1564 static ssize_t opencache_max_ms_store(struct kobject *kobj,
1565                                       struct attribute *attr,
1566                                       const char *buffer,
1567                                       size_t count)
1568 {
1569         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1570                                               ll_kset.kobj);
1571         unsigned int val;
1572         int rc;
1573
1574         rc = kstrtouint(buffer, 10, &val);
1575         if (rc)
1576                 return rc;
1577
1578         sbi->ll_oc_max_ms = val;
1579
1580         return count;
1581 }
1582 LUSTRE_RW_ATTR(opencache_max_ms);
1583
1584 static ssize_t inode_cache_show(struct kobject *kobj,
1585                                 struct attribute *attr,
1586                                 char *buf)
1587 {
1588         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1589                                               ll_kset.kobj);
1590
1591         return snprintf(buf, PAGE_SIZE, "%u\n", sbi->ll_inode_cache_enabled);
1592 }
1593
1594 static ssize_t inode_cache_store(struct kobject *kobj,
1595                                  struct attribute *attr,
1596                                  const char *buffer,
1597                                  size_t count)
1598 {
1599         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1600                                               ll_kset.kobj);
1601         bool val;
1602         int rc;
1603
1604         rc = kstrtobool(buffer, &val);
1605         if (rc)
1606                 return rc;
1607
1608         sbi->ll_inode_cache_enabled = val;
1609
1610         return count;
1611 }
1612 LUSTRE_RW_ATTR(inode_cache);
1613
1614 static int ll_unstable_stats_seq_show(struct seq_file *m, void *v)
1615 {
1616         struct super_block      *sb    = m->private;
1617         struct ll_sb_info       *sbi   = ll_s2sbi(sb);
1618         struct cl_client_cache  *cache = sbi->ll_cache;
1619         long pages;
1620         int mb;
1621
1622         pages = atomic_long_read(&cache->ccc_unstable_nr);
1623         mb    = (pages * PAGE_SIZE) >> 20;
1624
1625         seq_printf(m, "unstable_check:     %8d\n"
1626                       "unstable_pages: %12ld\n"
1627                       "unstable_mb:        %8d\n",
1628                    cache->ccc_unstable_check, pages, mb);
1629         return 0;
1630 }
1631
1632 static ssize_t ll_unstable_stats_seq_write(struct file *file,
1633                                            const char __user *buffer,
1634                                            size_t count, loff_t *unused)
1635 {
1636         struct seq_file *seq = file->private_data;
1637         struct ll_sb_info *sbi = ll_s2sbi((struct super_block *)seq->private);
1638         char kernbuf[128];
1639         bool val;
1640         int rc;
1641
1642         if (count == 0)
1643                 return 0;
1644         if (count >= sizeof(kernbuf))
1645                 return -EINVAL;
1646
1647         if (copy_from_user(kernbuf, buffer, count))
1648                 return -EFAULT;
1649         kernbuf[count] = 0;
1650
1651         buffer += lprocfs_find_named_value(kernbuf, "unstable_check:", &count) -
1652                   kernbuf;
1653         rc = kstrtobool_from_user(buffer, count, &val);
1654         if (rc < 0)
1655                 return rc;
1656
1657         /* borrow lru lock to set the value */
1658         spin_lock(&sbi->ll_cache->ccc_lru_lock);
1659         sbi->ll_cache->ccc_unstable_check = val;
1660         spin_unlock(&sbi->ll_cache->ccc_lru_lock);
1661
1662         return count;
1663 }
1664
1665 LDEBUGFS_SEQ_FOPS(ll_unstable_stats);
1666
1667 static int ll_root_squash_seq_show(struct seq_file *m, void *v)
1668 {
1669         struct super_block *sb = m->private;
1670         struct ll_sb_info *sbi = ll_s2sbi(sb);
1671         struct root_squash_info *squash = &sbi->ll_squash;
1672
1673         seq_printf(m, "%u:%u\n", squash->rsi_uid, squash->rsi_gid);
1674         return 0;
1675 }
1676
1677 static ssize_t ll_root_squash_seq_write(struct file *file,
1678                                         const char __user *buffer,
1679                                         size_t count, loff_t *off)
1680 {
1681         struct seq_file *m = file->private_data;
1682         struct super_block *sb = m->private;
1683         struct ll_sb_info *sbi = ll_s2sbi(sb);
1684         struct root_squash_info *squash = &sbi->ll_squash;
1685
1686         return lprocfs_wr_root_squash(buffer, count, squash, sbi->ll_fsname);
1687 }
1688
1689 LDEBUGFS_SEQ_FOPS(ll_root_squash);
1690
1691 static int ll_nosquash_nids_seq_show(struct seq_file *m, void *v)
1692 {
1693         struct super_block *sb = m->private;
1694         struct ll_sb_info *sbi = ll_s2sbi(sb);
1695         struct root_squash_info *squash = &sbi->ll_squash;
1696         int len;
1697
1698         spin_lock(&squash->rsi_lock);
1699         if (!list_empty(&squash->rsi_nosquash_nids)) {
1700                 len = cfs_print_nidlist(m->buf + m->count, m->size - m->count,
1701                                         &squash->rsi_nosquash_nids);
1702                 m->count += len;
1703                 seq_putc(m, '\n');
1704         } else {
1705                 seq_puts(m, "NONE\n");
1706         }
1707         spin_unlock(&squash->rsi_lock);
1708
1709         return 0;
1710 }
1711
1712 static ssize_t ll_nosquash_nids_seq_write(struct file *file,
1713                                           const char __user *buffer,
1714                                           size_t count, loff_t *off)
1715 {
1716         struct seq_file *m = file->private_data;
1717         struct super_block *sb = m->private;
1718         struct ll_sb_info *sbi = ll_s2sbi(sb);
1719         struct root_squash_info *squash = &sbi->ll_squash;
1720         int rc;
1721
1722         rc = lprocfs_wr_nosquash_nids(buffer, count, squash, sbi->ll_fsname);
1723         if (rc < 0)
1724                 return rc;
1725
1726         ll_compute_rootsquash_state(sbi);
1727
1728         return rc;
1729 }
1730
1731 LDEBUGFS_SEQ_FOPS(ll_nosquash_nids);
1732
1733 #if defined(CONFIG_LL_ENCRYPTION)
1734 static ssize_t enable_filename_encryption_show(struct kobject *kobj,
1735                                                struct attribute *attr,
1736                                                char *buffer)
1737 {
1738         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1739                                               ll_kset.kobj);
1740         struct lustre_sb_info *lsi = sbi->lsi;
1741
1742         return snprintf(buffer, PAGE_SIZE,  "%u\n",
1743                         lsi->lsi_flags & LSI_FILENAME_ENC ? 1 : 0);
1744 }
1745
1746 static ssize_t enable_filename_encryption_store(struct kobject *kobj,
1747                                                 struct attribute *attr,
1748                                                 const char *buffer,
1749                                                 size_t count)
1750 {
1751         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1752                                               ll_kset.kobj);
1753         struct lustre_sb_info *lsi = sbi->lsi;
1754         bool val;
1755         int rc;
1756
1757         rc = kstrtobool(buffer, &val);
1758         if (rc)
1759                 return rc;
1760
1761         if (val) {
1762                 if (!ll_sbi_has_name_encrypt(sbi)) {
1763                         /* server does not support name encryption,
1764                          * so force it to NULL on client
1765                          */
1766                         CDEBUG(D_SEC, "%s: server does not support name encryption\n",
1767                                sbi->ll_fsname);
1768                         lsi->lsi_flags &= ~LSI_FILENAME_ENC;
1769                         return -EOPNOTSUPP;
1770                 }
1771
1772                 lsi->lsi_flags |= LSI_FILENAME_ENC;
1773         } else {
1774                 lsi->lsi_flags &= ~LSI_FILENAME_ENC;
1775         }
1776
1777         return count;
1778 }
1779
1780 LUSTRE_RW_ATTR(enable_filename_encryption);
1781 #endif /* CONFIG_LL_ENCRYPTION */
1782
1783 #if defined(CONFIG_LL_ENCRYPTION) || defined(HAVE_LUSTRE_CRYPTO)
1784 static ssize_t filename_enc_use_old_base64_show(struct kobject *kobj,
1785                                                 struct attribute *attr,
1786                                                 char *buffer)
1787 {
1788         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1789                                               ll_kset.kobj);
1790         struct lustre_sb_info *lsi = sbi->lsi;
1791
1792         return snprintf(buffer, PAGE_SIZE, "%u\n",
1793                         lsi->lsi_flags & LSI_FILENAME_ENC_B64_OLD_CLI ? 1 : 0);
1794 }
1795
1796 static ssize_t filename_enc_use_old_base64_store(struct kobject *kobj,
1797                                                  struct attribute *attr,
1798                                                  const char *buffer,
1799                                                  size_t count)
1800 {
1801         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1802                                               ll_kset.kobj);
1803         struct lustre_sb_info *lsi = sbi->lsi;
1804         bool val;
1805         int rc;
1806
1807         rc = kstrtobool(buffer, &val);
1808         if (rc)
1809                 return rc;
1810
1811         if (val) {
1812                 if (!ll_sbi_has_name_encrypt(sbi)) {
1813                         /* server does not support name encryption,
1814                          * so force it to NULL on client
1815                          */
1816                         CDEBUG(D_SEC,
1817                                "%s: server does not support name encryption\n",
1818                                sbi->ll_fsname);
1819                         lsi->lsi_flags &= ~LSI_FILENAME_ENC_B64_OLD_CLI;
1820                         return -EOPNOTSUPP;
1821                 }
1822
1823                 lsi->lsi_flags |= LSI_FILENAME_ENC_B64_OLD_CLI;
1824         } else {
1825                 lsi->lsi_flags &= ~LSI_FILENAME_ENC_B64_OLD_CLI;
1826         }
1827
1828         return count;
1829 }
1830
1831 LUSTRE_RW_ATTR(filename_enc_use_old_base64);
1832 #endif /* CONFIG_LL_ENCRYPTION || HAVE_LUSTRE_CRYPTO */
1833
1834 static int ll_pcc_seq_show(struct seq_file *m, void *v)
1835 {
1836         struct super_block *sb = m->private;
1837         struct ll_sb_info *sbi = ll_s2sbi(sb);
1838
1839         return pcc_super_dump(&sbi->ll_pcc_super, m);
1840 }
1841
1842 static ssize_t ll_pcc_seq_write(struct file *file, const char __user *buffer,
1843                                 size_t count, loff_t *off)
1844 {
1845         struct seq_file *m = file->private_data;
1846         struct super_block *sb = m->private;
1847         struct ll_sb_info *sbi = ll_s2sbi(sb);
1848         int rc;
1849         char *kernbuf;
1850
1851         if (count >= LPROCFS_WR_PCC_MAX_CMD)
1852                 return -EINVAL;
1853
1854         if (!(exp_connect_flags2(sbi->ll_md_exp) & OBD_CONNECT2_PCC))
1855                 return -EOPNOTSUPP;
1856
1857         OBD_ALLOC(kernbuf, count + 1);
1858         if (kernbuf == NULL)
1859                 return -ENOMEM;
1860
1861         if (copy_from_user(kernbuf, buffer, count))
1862                 GOTO(out_free_kernbuff, rc = -EFAULT);
1863
1864         rc = pcc_cmd_handle(kernbuf, count, &sbi->ll_pcc_super);
1865 out_free_kernbuff:
1866         OBD_FREE(kernbuf, count + 1);
1867         return rc ? rc : count;
1868 }
1869 LDEBUGFS_SEQ_FOPS(ll_pcc);
1870
/*
 * Per-mount debugfs files, each backed by a seq_file fops.  The table is
 * passed to ldebugfs_add_vars() by ll_debugfs_register_super() and is
 * terminated by a NULL entry.
 */
struct ldebugfs_vars lprocfs_llite_obd_vars[] = {
	{ .name =	"site",
	  .fops =	&ll_site_stats_fops			},
	{ .name =	"max_cached_mb",
	  .fops =	&ll_max_cached_mb_fops			},
	{ .name =	"statahead_stats",
	  .fops =	&ll_statahead_stats_fops		},
	{ .name =	"unstable_stats",
	  .fops =	&ll_unstable_stats_fops			},
	{ .name =	"sbi_flags",
	  .fops =	&ll_sbi_flags_fops			},
	{ .name =	"root_squash",
	  .fops =	&ll_root_squash_fops			},
	{ .name =	"nosquash_nids",
	  .fops =	&ll_nosquash_nids_fops			},
	{ .name =	"pcc",
	  .fops =	&ll_pcc_fops,				},
	{ NULL }
};
1890
1891 #define MAX_STRING_SIZE 128
1892
/*
 * sysfs attributes of a mount's kobject; NULL-terminated.  The encryption
 * entries are only present when the matching build options are defined.
 * Wrapped into llite_groups below, which sbi_ktype uses as default groups.
 */
static struct attribute *llite_attrs[] = {
	&lustre_attr_blocksize.attr,
	&lustre_attr_stat_blocksize.attr,
	&lustre_attr_kbytestotal.attr,
	&lustre_attr_kbytesfree.attr,
	&lustre_attr_kbytesavail.attr,
	&lustre_attr_filestotal.attr,
	&lustre_attr_filesfree.attr,
	&lustre_attr_client_type.attr,
	&lustre_attr_foreign_symlink_enable.attr,
	&lustre_attr_foreign_symlink_prefix.attr,
	&lustre_attr_foreign_symlink_upcall.attr,
	&lustre_attr_foreign_symlink_upcall_info.attr,
	&lustre_attr_fstype.attr,
	&lustre_attr_uuid.attr,
	&lustre_attr_checksums.attr,
	&lustre_attr_checksum_pages.attr,
	&lustre_attr_max_read_ahead_mb.attr,
	&lustre_attr_max_read_ahead_per_file_mb.attr,
	&lustre_attr_max_read_ahead_whole_mb.attr,
	&lustre_attr_max_read_ahead_async_active.attr,
	&lustre_attr_read_ahead_async_file_threshold_mb.attr,
	&lustre_attr_read_ahead_range_kb.attr,
	&lustre_attr_stats_track_pid.attr,
	&lustre_attr_stats_track_ppid.attr,
	&lustre_attr_stats_track_gid.attr,
	&lustre_attr_statahead_running_max.attr,
	&lustre_attr_statahead_batch_max.attr,
	&lustre_attr_statahead_max.attr,
	&lustre_attr_statahead_agl.attr,
	&lustre_attr_lazystatfs.attr,
	&lustre_attr_statfs_max_age.attr,
	&lustre_attr_max_easize.attr,
	&lustre_attr_default_easize.attr,
	&lustre_attr_xattr_cache.attr,
	&lustre_attr_fast_read.attr,
	&lustre_attr_tiny_write.attr,
	&lustre_attr_parallel_dio.attr,
	&lustre_attr_unaligned_dio.attr,
	&lustre_attr_file_heat.attr,
	&lustre_attr_heat_decay_percentage.attr,
	&lustre_attr_heat_period_second.attr,
	&lustre_attr_opencache_threshold_count.attr,
	&lustre_attr_opencache_threshold_ms.attr,
	&lustre_attr_opencache_max_ms.attr,
	&lustre_attr_inode_cache.attr,
#ifdef CONFIG_LL_ENCRYPTION
	&lustre_attr_enable_filename_encryption.attr,
#endif
#if defined(CONFIG_LL_ENCRYPTION) || defined(HAVE_LUSTRE_CRYPTO)
	&lustre_attr_filename_enc_use_old_base64.attr,
#endif
	NULL,
};

KOBJ_ATTRIBUTE_GROUPS(llite); /* creates llite_groups */
1949
1950 static void sbi_kobj_release(struct kobject *kobj)
1951 {
1952         struct ll_sb_info *sbi = container_of(kobj, struct ll_sb_info,
1953                                               ll_kset.kobj);
1954         complete(&sbi->ll_kobj_unregister);
1955 }
1956
/*
 * kobject type of the per-mount kset kobject: exposes the llite attribute
 * groups and signals completion through sbi_kobj_release() on release.
 */
static struct kobj_type sbi_ktype = {
	.default_groups = KOBJ_ATTR_GROUPS(llite),
	.sysfs_ops      = &lustre_sysfs_ops,
	.release        = sbi_kobj_release,
};
1962
/*
 * Description of every llite operation counter: the counter index
 * (lfo_opcode), its lprocfs counter configuration flags (lfo_config) and the
 * name it is registered under (lfo_opname).  ll_debugfs_register_super()
 * walks this table and calls lprocfs_counter_init() for each entry.
 */
static const struct llite_file_opcode {
	__u32				lfo_opcode;
	enum lprocfs_counter_config	lfo_config;
	const char			*lfo_opname;
} llite_opcode_table[LPROC_LL_FILE_OPCODES] = {
	/* file operation */
	{ LPROC_LL_READ_BYTES,	LPROCFS_TYPE_BYTES_FULL, "read_bytes" },
	{ LPROC_LL_WRITE_BYTES,	LPROCFS_TYPE_BYTES_FULL, "write_bytes" },
	{ LPROC_LL_READ,	LPROCFS_TYPE_LATENCY,	"read" },
	{ LPROC_LL_WRITE,	LPROCFS_TYPE_LATENCY,	"write" },
	{ LPROC_LL_IOCTL,	LPROCFS_TYPE_REQS,	"ioctl" },
	{ LPROC_LL_OPEN,	LPROCFS_TYPE_LATENCY,	"open" },
	{ LPROC_LL_RELEASE,	LPROCFS_TYPE_LATENCY,	"close" },
	{ LPROC_LL_MMAP,	LPROCFS_TYPE_LATENCY,	"mmap" },
	{ LPROC_LL_FAULT,	LPROCFS_TYPE_LATENCY,	"page_fault" },
	{ LPROC_LL_MKWRITE,	LPROCFS_TYPE_LATENCY,	"page_mkwrite" },
	{ LPROC_LL_LLSEEK,	LPROCFS_TYPE_LATENCY,	"seek" },
	{ LPROC_LL_FSYNC,	LPROCFS_TYPE_LATENCY,	"fsync" },
	{ LPROC_LL_READDIR,	LPROCFS_TYPE_LATENCY,	"readdir" },
	{ LPROC_LL_INODE_OCOUNT, LPROCFS_TYPE_REQS | LPROCFS_CNTR_AVGMINMAX |
				LPROCFS_CNTR_STDDEV,	"opencount" },
	{ LPROC_LL_INODE_OPCLTM,LPROCFS_TYPE_LATENCY,	"openclosetime" },
	/* inode operation */
	{ LPROC_LL_SETATTR,	LPROCFS_TYPE_LATENCY,	"setattr" },
	{ LPROC_LL_TRUNC,	LPROCFS_TYPE_LATENCY,	"truncate" },
	{ LPROC_LL_FLOCK,	LPROCFS_TYPE_LATENCY,	"flock" },
	{ LPROC_LL_GETATTR,	LPROCFS_TYPE_LATENCY,	"getattr" },
	{ LPROC_LL_FALLOCATE,	LPROCFS_TYPE_LATENCY,	"fallocate"},
	/* dir inode operation */
	{ LPROC_LL_CREATE,	LPROCFS_TYPE_LATENCY,	"create" },
	{ LPROC_LL_LINK,	LPROCFS_TYPE_LATENCY,	"link" },
	{ LPROC_LL_UNLINK,	LPROCFS_TYPE_LATENCY,	"unlink" },
	{ LPROC_LL_SYMLINK,	LPROCFS_TYPE_LATENCY,	"symlink" },
	{ LPROC_LL_MKDIR,	LPROCFS_TYPE_LATENCY,	"mkdir" },
	{ LPROC_LL_RMDIR,	LPROCFS_TYPE_LATENCY,	"rmdir" },
	{ LPROC_LL_MKNOD,	LPROCFS_TYPE_LATENCY,	"mknod" },
	{ LPROC_LL_RENAME,	LPROCFS_TYPE_LATENCY,	"rename" },
	/* special inode operation */
	{ LPROC_LL_STATFS,	LPROCFS_TYPE_LATENCY,	"statfs" },
	{ LPROC_LL_SETXATTR,	LPROCFS_TYPE_LATENCY,	"setxattr" },
	{ LPROC_LL_GETXATTR,	LPROCFS_TYPE_LATENCY,	"getxattr" },
	{ LPROC_LL_GETXATTR_HITS, LPROCFS_TYPE_REQS,	"getxattr_hits" },
	{ LPROC_LL_LISTXATTR,	LPROCFS_TYPE_LATENCY,	"listxattr" },
	{ LPROC_LL_REMOVEXATTR,	LPROCFS_TYPE_LATENCY,	"removexattr" },
	{ LPROC_LL_INODE_PERM,	LPROCFS_TYPE_LATENCY,	"inode_permission" },
};
2009
2010 void ll_stats_ops_tally(struct ll_sb_info *sbi, int op, long count)
2011 {
2012         if (!sbi->ll_stats)
2013                 return;
2014
2015         if (sbi->ll_stats_track_type == STATS_TRACK_ALL)
2016                 lprocfs_counter_add(sbi->ll_stats, op, count);
2017         else if (sbi->ll_stats_track_type == STATS_TRACK_PID &&
2018                  sbi->ll_stats_track_id == current->pid)
2019                 lprocfs_counter_add(sbi->ll_stats, op, count);
2020         else if (sbi->ll_stats_track_type == STATS_TRACK_PPID &&
2021                  sbi->ll_stats_track_id == current->real_parent->pid)
2022                 lprocfs_counter_add(sbi->ll_stats, op, count);
2023         else if (sbi->ll_stats_track_type == STATS_TRACK_GID &&
2024                  sbi->ll_stats_track_id ==
2025                         from_kgid(&init_user_ns, current_gid()))
2026                 lprocfs_counter_add(sbi->ll_stats, op, count);
2027 }
2028 EXPORT_SYMBOL(ll_stats_ops_tally);
2029
/*
 * Names of the read-ahead statistics counters, indexed by RA_STAT_* value.
 * ll_debugfs_register_super() sizes the read-ahead stats with
 * ARRAY_SIZE(ra_stat_string) and registers one counter per entry.
 */
static const char *const ra_stat_string[] = {
	[RA_STAT_HIT]			= "hits",
	[RA_STAT_MISS]			= "misses",
	[RA_STAT_DISTANT_READPAGE]	= "readpage_not_consecutive",
	[RA_STAT_MISS_IN_WINDOW]	= "miss_inside_window",
	[RA_STAT_FAILED_GRAB_PAGE]	= "failed_grab_cache_page",
	[RA_STAT_FAILED_MATCH]		= "failed_lock_match",
	[RA_STAT_DISCARDED]		= "read_but_discarded",
	[RA_STAT_ZERO_LEN]		= "zero_length_file",
	[RA_STAT_ZERO_WINDOW]		= "zero_size_window",
	[RA_STAT_EOF]			= "readahead_to_eof",
	[RA_STAT_MAX_IN_FLIGHT]		= "hit_max_readahead_issue",
	[RA_STAT_WRONG_GRAB_PAGE]	= "wrong_page_from_grab_cache_page",
	[RA_STAT_FAILED_REACH_END]	= "failed_to_reach_end",
	[RA_STAT_ASYNC]			= "async_readahead",
	[RA_STAT_FAILED_FAST_READ]	= "failed_to_fast_read",
	[RA_STAT_MMAP_RANGE_READ]	= "mmap_range_read",
	[RA_STAT_READAHEAD_PAGES]	= "readahead_pages"
};
2049
/**
 * Register the debugfs directory, statistics and sysfs kset of a mount.
 *
 * Creates the per-mount debugfs directory under llite_root with its files,
 * allocates and initializes the operation and read-ahead statistics, then
 * registers the mount's kset under llite_kobj.
 *
 * \param[in] sb	super block of the mount
 * \param[in] name	name of the debugfs directory and of the kobject
 *
 * \retval 0		on success
 * \retval negative	errno on allocation or kobject registration failure
 */
int ll_debugfs_register_super(struct super_block *sb, const char *name)
{
	struct lustre_sb_info *lsi = s2lsi(sb);
	struct ll_sb_info *sbi = ll_s2sbi(sb);
	int err, id;

	ENTRY;
	LASSERT(sbi);

	/* without a usable debugfs root, skip the debugfs files and the
	 * statistics and go straight to the sysfs registration
	 */
	if (IS_ERR_OR_NULL(llite_root))
		goto out_ll_kset;

	sbi->ll_debugfs_entry = debugfs_create_dir(name, llite_root);
	ldebugfs_add_vars(sbi->ll_debugfs_entry, lprocfs_llite_obd_vars, sb);

	/* the files below get sbi (not sb) as their private data */
	debugfs_create_file("dump_page_cache", 0444, sbi->ll_debugfs_entry, sbi,
			    &vvp_dump_pgcache_file_ops);

	debugfs_create_file("extents_stats", 0644, sbi->ll_debugfs_entry, sbi,
				 &ll_rw_extents_stats_fops);

	debugfs_create_file("extents_stats_per_process", 0644,
			    sbi->ll_debugfs_entry, sbi,
			    &ll_rw_extents_stats_pp_fops);

	debugfs_create_file("offset_stats", 0644, sbi->ll_debugfs_entry, sbi,
			    &ll_rw_offset_stats_fops);

	/* File operations stats */
	sbi->ll_stats = lprocfs_stats_alloc(LPROC_LL_FILE_OPCODES,
					    LPROCFS_STATS_FLAG_NONE);
	if (sbi->ll_stats == NULL)
		GOTO(out_debugfs, err = -ENOMEM);

	/* do counter init */
	for (id = 0; id < LPROC_LL_FILE_OPCODES; id++)
		lprocfs_counter_init(sbi->ll_stats,
				     llite_opcode_table[id].lfo_opcode,
				     llite_opcode_table[id].lfo_config,
				     llite_opcode_table[id].lfo_opname);

	debugfs_create_file("stats", 0644, sbi->ll_debugfs_entry,
			    sbi->ll_stats, &ldebugfs_stats_seq_fops);

	sbi->ll_ra_stats = lprocfs_stats_alloc(ARRAY_SIZE(ra_stat_string),
					       LPROCFS_STATS_FLAG_NONE);
	if (sbi->ll_ra_stats == NULL)
		GOTO(out_stats, err = -ENOMEM);

	/* only the readahead_pages counter also tracks avg/min/max */
	for (id = 0; id < ARRAY_SIZE(ra_stat_string); id++) {
		if (id == RA_STAT_READAHEAD_PAGES)
			lprocfs_counter_init(sbi->ll_ra_stats, id,
					     LPROCFS_TYPE_PAGES |
					     LPROCFS_CNTR_AVGMINMAX,
					     ra_stat_string[id]);
		else
			lprocfs_counter_init(sbi->ll_ra_stats, id,
					     LPROCFS_TYPE_PAGES,
					     ra_stat_string[id]);
	}

	debugfs_create_file("read_ahead_stats", 0644, sbi->ll_debugfs_entry,
			    sbi->ll_ra_stats, &ldebugfs_stats_seq_fops);

out_ll_kset:
	/* Yes we also register sysfs mount kset here as well */
	sbi->ll_kset.kobj.parent = llite_kobj;
	sbi->ll_kset.kobj.ktype = &sbi_ktype;
	/* completed by sbi_kobj_release() when the kobject is released */
	init_completion(&sbi->ll_kobj_unregister);
	err = kobject_set_name(&sbi->ll_kset.kobj, "%s", name);
	if (err)
		GOTO(out_ra_stats, err);

	err = kset_register(&sbi->ll_kset);
	if (err)
		GOTO(out_ra_stats, err);

	/* extra reference held through lsi; dropped by the kobject_put() in
	 * ll_debugfs_unregister_super()
	 */
	lsi->lsi_kobj = kobject_get(&sbi->ll_kset.kobj);

	RETURN(0);
	/* NOTE(review): the unwind below is also reached when the debugfs
	 * section above was skipped, i.e. with nothing allocated by this
	 * function; presumably lprocfs_stats_free() and
	 * debugfs_remove_recursive() tolerate that -- confirm
	 */
out_ra_stats:
	lprocfs_stats_free(&sbi->ll_ra_stats);
out_stats:
	lprocfs_stats_free(&sbi->ll_stats);
out_debugfs:
	debugfs_remove_recursive(sbi->ll_debugfs_entry);

	RETURN(err);
}
2139
/**
 * Undo ll_debugfs_register_super() for a mount.
 *
 * Removes the debugfs directory, the sysfs links named after the data and
 * metadata OBD types, drops the kobject reference held in lsi, unregisters
 * the kset and waits for the kobject release before freeing the statistics.
 *
 * \param[in] sb	super block of the mount
 */
void ll_debugfs_unregister_super(struct super_block *sb)
{
	struct lustre_sb_info *lsi = s2lsi(sb);
	struct ll_sb_info *sbi = ll_s2sbi(sb);

	debugfs_remove_recursive(sbi->ll_debugfs_entry);

	/* the links are not created in this part of the file --
	 * NOTE(review): confirm where they are added
	 */
	if (sbi->ll_dt_obd)
		sysfs_remove_link(&sbi->ll_kset.kobj,
				  sbi->ll_dt_obd->obd_type->typ_name);

	if (sbi->ll_md_obd)
		sysfs_remove_link(&sbi->ll_kset.kobj,
				  sbi->ll_md_obd->obd_type->typ_name);

	/* drop the reference taken with kobject_get() at registration */
	kobject_put(lsi->lsi_kobj);

	kset_unregister(&sbi->ll_kset);
	/* sbi_kobj_release() completes this once the kobject is released */
	wait_for_completion(&sbi->ll_kobj_unregister);

	lprocfs_stats_free(&sbi->ll_ra_stats);
	lprocfs_stats_free(&sbi->ll_stats);
}
2163 #undef MAX_STRING_SIZE
2164
2165 static void ll_display_extents_info(struct ll_rw_extents_info *rw_extents,
2166                                     struct seq_file *seq, int which)
2167 {
2168         unsigned long read_tot = 0, write_tot = 0, read_cum, write_cum;
2169         unsigned long start, end, r, w;
2170         char *unitp = "KMGTPEZY";
2171         int i, units = 10;
2172         struct per_process_info *pp_info;
2173
2174         pp_info = &rw_extents->pp_extents[which];
2175         read_cum = 0;
2176         write_cum = 0;
2177         start = 0;
2178
2179         for (i = 0; i < LL_HIST_MAX; i++) {
2180                 read_tot += pp_info->pp_r_hist.oh_buckets[i];
2181                 write_tot += pp_info->pp_w_hist.oh_buckets[i];
2182         }
2183
2184         for (i = 0; i < LL_HIST_MAX; i++) {
2185                 r = pp_info->pp_r_hist.oh_buckets[i];
2186                 w = pp_info->pp_w_hist.oh_buckets[i];
2187                 read_cum += r;
2188                 write_cum += w;
2189                 end = 1 << (i + LL_HIST_START - units);
2190                 seq_printf(seq, "%4lu%c - %4lu%c%c: %14lu %4u %4u  | "
2191                            "%14lu %4u %4u\n", start, *unitp, end, *unitp,
2192                            (i == LL_HIST_MAX - 1) ? '+' : ' ',
2193                            r, pct(r, read_tot), pct(read_cum, read_tot),
2194                            w, pct(w, write_tot), pct(write_cum, write_tot));
2195                 start = end;
2196                 if (start == (1 << 10)) {
2197                         start = 1;
2198                         units += 10;
2199                         unitp++;
2200                 }
2201                 if (read_cum == read_tot && write_cum == write_tot)
2202                         break;
2203         }
2204 }
2205
2206 static int ll_rw_extents_stats_pp_seq_show(struct seq_file *seq, void *v)
2207 {
2208         struct ll_sb_info *sbi = seq->private;
2209         struct ll_rw_extents_info *rw_extents = sbi->ll_rw_extents_info;
2210         int k;
2211
2212         if (!sbi->ll_rw_stats_on || !rw_extents) {
2213                 seq_puts(seq, "disabled\n write anything to this file to activate, then '0' or 'disable' to deactivate\n");
2214                 return 0;
2215         }
2216
2217         spin_lock(&sbi->ll_pp_extent_lock);
2218         lprocfs_stats_header(seq, ktime_get_real(), rw_extents->pp_init, 25,
2219                              ":", true, "");
2220         seq_printf(seq, "%15s %19s       | %20s\n", " ", "read", "write");
2221         seq_printf(seq, "%13s   %14s %4s %4s  | %14s %4s %4s\n",
2222                    "extents", "calls", "%", "cum%", "calls", "%", "cum%");
2223
2224         for (k = 0; k < LL_PROCESS_HIST_MAX; k++) {
2225                 if (rw_extents->pp_extents[k].pid != 0) {
2226                         seq_printf(seq, "\nPID: %d\n",
2227                                    rw_extents->pp_extents[k].pid);
2228                         ll_display_extents_info(rw_extents, seq, k);
2229                 }
2230         }
2231         spin_unlock(&sbi->ll_pp_extent_lock);
2232         return 0;
2233 }
2234
2235 static int alloc_rw_stats_info(struct ll_sb_info *sbi)
2236 {
2237         struct ll_rw_extents_info *rw_extents;
2238         struct ll_rw_process_info *offset;
2239         struct ll_rw_process_info *process;
2240         int i, rc = 0;
2241
2242         OBD_ALLOC(rw_extents, sizeof(*rw_extents));
2243         if (!rw_extents)
2244                 return -ENOMEM;
2245
2246         for (i = 0; i <= LL_PROCESS_HIST_MAX; i++) {
2247                 spin_lock_init(&rw_extents->pp_extents[i].pp_r_hist.oh_lock);
2248                 spin_lock_init(&rw_extents->pp_extents[i].pp_w_hist.oh_lock);
2249         }
2250         rw_extents->pp_init = ktime_get_real();
2251
2252         spin_lock(&sbi->ll_pp_extent_lock);
2253         if (!sbi->ll_rw_extents_info)
2254                 sbi->ll_rw_extents_info = rw_extents;
2255         spin_unlock(&sbi->ll_pp_extent_lock);
2256         /* another writer allocated the struct before we got the lock */
2257         if (sbi->ll_rw_extents_info != rw_extents)
2258                 OBD_FREE(rw_extents, sizeof(*rw_extents));
2259
2260         OBD_ALLOC(process, sizeof(*process) * LL_PROCESS_HIST_MAX);
2261         if (!process)
2262                 GOTO(out, rc = -ENOMEM);
2263         OBD_ALLOC(offset, sizeof(*offset) * LL_OFFSET_HIST_MAX);
2264         if (!offset)
2265                 GOTO(out_free, rc = -ENOMEM);
2266
2267         spin_lock(&sbi->ll_process_lock);
2268         if (!sbi->ll_rw_process_info)
2269                 sbi->ll_rw_process_info = process;
2270         if (!sbi->ll_rw_offset_info)
2271                 sbi->ll_rw_offset_info = offset;
2272         spin_unlock(&sbi->ll_process_lock);
2273         sbi->ll_process_stats_init = ktime_get_real();
2274
2275         /* another writer allocated the structs before we got the lock */
2276         if (sbi->ll_rw_offset_info != offset)
2277                 OBD_FREE(offset, sizeof(*offset) * LL_OFFSET_HIST_MAX);
2278         if (sbi->ll_rw_process_info != process) {
2279 out_free:
2280                 OBD_FREE(process, sizeof(*process) * LL_PROCESS_HIST_MAX);
2281         }
2282
2283 out:
2284         return rc;
2285 }
2286
2287 void ll_free_rw_stats_info(struct ll_sb_info *sbi)
2288 {
2289         if (sbi->ll_rw_extents_info) {
2290                 OBD_FREE(sbi->ll_rw_extents_info,
2291                          sizeof(*sbi->ll_rw_extents_info));
2292                 sbi->ll_rw_extents_info = NULL;
2293         }
2294         if (sbi->ll_rw_offset_info) {
2295                 OBD_FREE(sbi->ll_rw_offset_info,
2296                          sizeof(*sbi->ll_rw_offset_info) * LL_OFFSET_HIST_MAX);
2297                 sbi->ll_rw_offset_info = NULL;
2298         }
2299         if (sbi->ll_rw_process_info) {
2300                 OBD_FREE(sbi->ll_rw_process_info,
2301                         sizeof(*sbi->ll_rw_process_info) * LL_PROCESS_HIST_MAX);
2302                 sbi->ll_rw_process_info = NULL;
2303         }
2304 }
2305
2306 static ssize_t ll_rw_extents_stats_pp_seq_write(struct file *file,
2307                                                 const char __user *buf,
2308                                                 size_t len, loff_t *off)
2309 {
2310         struct seq_file *seq = file->private_data;
2311         struct ll_sb_info *sbi = seq->private;
2312         struct ll_rw_extents_info *rw_extents;
2313         int i;
2314         __s64 value;
2315
2316         if (len == 0)
2317                 return -EINVAL;
2318
2319         value = ll_stats_pid_write(buf, len);
2320
2321         if (value == 0) {
2322                 sbi->ll_rw_stats_on = 0;
2323         } else {
2324                 if (!sbi->ll_rw_extents_info) {
2325                         int rc = alloc_rw_stats_info(sbi);
2326
2327                         if (rc)
2328                                 return rc;
2329                 }
2330                 sbi->ll_rw_stats_on = 1;
2331         }
2332
2333
2334         spin_lock(&sbi->ll_pp_extent_lock);
2335         rw_extents = sbi->ll_rw_extents_info;
2336         if (rw_extents) {
2337                 rw_extents->pp_init = ktime_get_real();
2338                 for (i = 0; i < LL_PROCESS_HIST_MAX; i++) {
2339                         rw_extents->pp_extents[i].pid = 0;
2340                         lprocfs_oh_clear(&rw_extents->pp_extents[i].pp_r_hist);
2341                         lprocfs_oh_clear(&rw_extents->pp_extents[i].pp_w_hist);
2342                 }
2343         }
2344         spin_unlock(&sbi->ll_pp_extent_lock);
2345
2346         return len;
2347 }
2348
2349 LDEBUGFS_SEQ_FOPS(ll_rw_extents_stats_pp);
2350
2351 static int ll_rw_extents_stats_seq_show(struct seq_file *seq, void *v)
2352 {
2353         struct ll_sb_info *sbi = seq->private;
2354         struct ll_rw_extents_info *rw_extents = sbi->ll_rw_extents_info;
2355
2356         if (!sbi->ll_rw_stats_on || !rw_extents) {
2357                 seq_puts(seq, "disabled\n write anything to this file to activate, then '0' or 'disable' to deactivate\n");
2358                 return 0;
2359         }
2360
2361         spin_lock(&sbi->ll_lock);
2362         lprocfs_stats_header(seq, ktime_get_real(), rw_extents->pp_init, 25,
2363                              ":", true, "");
2364
2365         seq_printf(seq, "%15s %19s       | %20s\n", " ", "read", "write");
2366         seq_printf(seq, "%13s   %14s %4s %4s  | %14s %4s %4s\n",
2367                    "extents", "calls", "%", "cum%",
2368                    "calls", "%", "cum%");
2369
2370         ll_display_extents_info(rw_extents, seq, LL_PROCESS_HIST_MAX);
2371         spin_unlock(&sbi->ll_lock);
2372
2373         return 0;
2374 }
2375
2376 static ssize_t ll_rw_extents_stats_seq_write(struct file *file,
2377                                              const char __user *buf,
2378                                              size_t len, loff_t *off)
2379 {
2380         struct seq_file *seq = file->private_data;
2381         struct ll_sb_info *sbi = seq->private;
2382         struct ll_rw_extents_info *rw_extents;
2383         int i;
2384         __s64 value;
2385
2386         if (len == 0)
2387                 return -EINVAL;
2388
2389         value = ll_stats_pid_write(buf, len);
2390
2391         if (value == 0) {
2392                 sbi->ll_rw_stats_on = 0;
2393         } else {
2394                 if (!sbi->ll_rw_extents_info) {
2395                         int rc = alloc_rw_stats_info(sbi);
2396
2397                         if (rc)
2398                                 return rc;
2399                 }
2400                 sbi->ll_rw_stats_on = 1;
2401         }
2402
2403         spin_lock(&sbi->ll_pp_extent_lock);
2404         rw_extents = sbi->ll_rw_extents_info;
2405         if (rw_extents) {
2406                 rw_extents->pp_init = ktime_get_real();
2407                 for (i = 0; i <= LL_PROCESS_HIST_MAX; i++) {
2408                         rw_extents->pp_extents[i].pid = 0;
2409                         lprocfs_oh_clear(&rw_extents->pp_extents[i].pp_r_hist);
2410                         lprocfs_oh_clear(&rw_extents->pp_extents[i].pp_w_hist);
2411                 }
2412         }
2413         spin_unlock(&sbi->ll_pp_extent_lock);
2414
2415         return len;
2416 }
2417
2418 LDEBUGFS_SEQ_FOPS(ll_rw_extents_stats);
2419
2420 void ll_rw_stats_tally(struct ll_sb_info *sbi, pid_t pid,
2421                        struct ll_file_data *file, loff_t pos,
2422                        size_t count, int rw)
2423 {
2424         int i, cur = -1;
2425         struct ll_rw_process_info *process;
2426         struct ll_rw_process_info *offset;
2427         int *off_count = &sbi->ll_rw_offset_entry_count;
2428         int *process_count = &sbi->ll_offset_process_count;
2429         struct ll_rw_extents_info *rw_extents;
2430
2431         if (!sbi->ll_rw_stats_on)
2432                 return;
2433
2434         spin_lock(&sbi->ll_pp_extent_lock);
2435         rw_extents = sbi->ll_rw_extents_info;
2436         if (!rw_extents) {
2437                 spin_unlock(&sbi->ll_pp_extent_lock);
2438                 return;
2439         }
2440
2441         /* Extent statistics */
2442         for (i = 0; i < LL_PROCESS_HIST_MAX; i++) {
2443                 if (rw_extents->pp_extents[i].pid == pid) {
2444                         cur = i;
2445                         break;
2446                 }
2447         }
2448
2449         if (cur == -1) {
2450                 /* new process */
2451                 sbi->ll_extent_process_count =
2452                         (sbi->ll_extent_process_count + 1) % LL_PROCESS_HIST_MAX;
2453                 cur = sbi->ll_extent_process_count;
2454                 rw_extents->pp_extents[cur].pid = pid;
2455                 lprocfs_oh_clear(&rw_extents->pp_extents[cur].pp_r_hist);
2456                 lprocfs_oh_clear(&rw_extents->pp_extents[cur].pp_w_hist);
2457         }
2458
2459         for (i = 0; (count >= 1 << (LL_HIST_START + i)) &&
2460              (i < (LL_HIST_MAX - 1)); i++);
2461         if (rw == 0) {
2462                 rw_extents->pp_extents[cur].pp_r_hist.oh_buckets[i]++;
2463                 rw_extents->pp_extents[LL_PROCESS_HIST_MAX].pp_r_hist.oh_buckets[i]++;
2464         } else {
2465                 rw_extents->pp_extents[cur].pp_w_hist.oh_buckets[i]++;
2466                 rw_extents->pp_extents[LL_PROCESS_HIST_MAX].pp_w_hist.oh_buckets[i]++;
2467         }
2468         spin_unlock(&sbi->ll_pp_extent_lock);
2469
2470         spin_lock(&sbi->ll_process_lock);
2471         process = sbi->ll_rw_process_info;
2472         offset = sbi->ll_rw_offset_info;
2473         if (!process || !offset)
2474                 goto out_unlock;
2475
2476         /* Offset statistics */
2477         for (i = 0; i < LL_PROCESS_HIST_MAX; i++) {
2478                 if (process[i].rw_pid == pid) {
2479                         if (process[i].rw_last_file != file) {
2480                                 process[i].rw_range_start = pos;
2481                                 process[i].rw_last_file_pos = pos + count;
2482                                 process[i].rw_smallest_extent = count;
2483                                 process[i].rw_largest_extent = count;
2484                                 process[i].rw_offset = 0;
2485                                 process[i].rw_last_file = file;
2486                                 goto out_unlock;
2487                         }
2488                         if (process[i].rw_last_file_pos != pos) {
2489                                 *off_count =
2490                                     (*off_count + 1) % LL_OFFSET_HIST_MAX;
2491                                 offset[*off_count].rw_op = process[i].rw_op;
2492                                 offset[*off_count].rw_pid = pid;
2493                                 offset[*off_count].rw_range_start =
2494                                         process[i].rw_range_start;
2495                                 offset[*off_count].rw_range_end =
2496                                         process[i].rw_last_file_pos;
2497                                 offset[*off_count].rw_smallest_extent =
2498                                         process[i].rw_smallest_extent;
2499                                 offset[*off_count].rw_largest_extent =
2500                                         process[i].rw_largest_extent;
2501                                 offset[*off_count].rw_offset =
2502                                         process[i].rw_offset;
2503                                 process[i].rw_op = rw;
2504                                 process[i].rw_range_start = pos;
2505                                 process[i].rw_smallest_extent = count;
2506                                 process[i].rw_largest_extent = count;
2507                                 process[i].rw_offset = pos -
2508                                         process[i].rw_last_file_pos;
2509                         }
2510                         if (process[i].rw_smallest_extent > count)
2511                                 process[i].rw_smallest_extent = count;
2512                         if (process[i].rw_largest_extent < count)
2513                                 process[i].rw_largest_extent = count;
2514                         process[i].rw_last_file_pos = pos + count;
2515                         goto out_unlock;
2516                 }
2517         }
2518         *process_count = (*process_count + 1) % LL_PROCESS_HIST_MAX;
2519         process[*process_count].rw_pid = pid;
2520         process[*process_count].rw_op = rw;
2521         process[*process_count].rw_range_start = pos;
2522         process[*process_count].rw_last_file_pos = pos + count;
2523         process[*process_count].rw_smallest_extent = count;
2524         process[*process_count].rw_largest_extent = count;
2525         process[*process_count].rw_offset = 0;
2526         process[*process_count].rw_last_file = file;
2527
2528 out_unlock:
2529         spin_unlock(&sbi->ll_process_lock);
2530 }
2531
2532 static int ll_rw_offset_stats_seq_show(struct seq_file *seq, void *v)
2533 {
2534         struct ll_sb_info *sbi = seq->private;
2535         struct ll_rw_process_info *offset;
2536         struct ll_rw_process_info *process;
2537         int i;
2538
2539         if (!sbi->ll_rw_stats_on) {
2540                 seq_puts(seq, "disabled\n write anything to this file to activate, then '0' or 'disable' to deactivate\n");
2541                 return 0;
2542         }
2543
2544         spin_lock(&sbi->ll_process_lock);
2545         lprocfs_stats_header(seq, ktime_get_real(), sbi->ll_process_stats_init,
2546                              25, ":", true, "");
2547         seq_printf(seq, "%3s %10s %14s %14s %17s %17s %14s\n",
2548                    "R/W", "PID", "RANGE START", "RANGE END",
2549                    "SMALLEST EXTENT", "LARGEST EXTENT", "OFFSET");
2550
2551         /* We stored the discontiguous offsets here; print them first */
2552         offset = sbi->ll_rw_offset_info;
2553         for (i = 0; offset && i < LL_OFFSET_HIST_MAX; i++) {
2554                 if (offset[i].rw_pid != 0)
2555                         seq_printf(seq,
2556                                   "%3c %10d %14llu %14llu %17lu %17lu %14lld\n",
2557                                    offset[i].rw_op == READ ? 'R' : 'W',
2558                                    offset[i].rw_pid,
2559                                    offset[i].rw_range_start,
2560                                    offset[i].rw_range_end,
2561                                    (unsigned long)offset[i].rw_smallest_extent,
2562                                    (unsigned long)offset[i].rw_largest_extent,
2563                                    offset[i].rw_offset);
2564         }
2565
2566         /* Then print the current offsets for each process */
2567         process = sbi->ll_rw_process_info;
2568         for (i = 0; process && i < LL_PROCESS_HIST_MAX; i++) {
2569                 if (process[i].rw_pid != 0)
2570                         seq_printf(seq,
2571                                   "%3c %10d %14llu %14llu %17lu %17lu %14lld\n",
2572                                    process[i].rw_op == READ ? 'R' : 'W',
2573                                    process[i].rw_pid,
2574                                    process[i].rw_range_start,
2575                                    process[i].rw_last_file_pos,
2576                                    (unsigned long)process[i].rw_smallest_extent,
2577                                    (unsigned long)process[i].rw_largest_extent,
2578                                    process[i].rw_offset);
2579         }
2580         spin_unlock(&sbi->ll_process_lock);
2581
2582         return 0;
2583 }
2584
2585 static ssize_t ll_rw_offset_stats_seq_write(struct file *file,
2586                                             const char __user *buf,
2587                                             size_t len, loff_t *off)
2588 {
2589         struct seq_file *seq = file->private_data;
2590         struct ll_sb_info *sbi = seq->private;
2591         __s64 value;
2592
2593         if (len == 0)
2594                 return -EINVAL;
2595
2596         value = ll_stats_pid_write(buf, len);
2597
2598         if (value == 0) {
2599                 sbi->ll_rw_stats_on = 0;
2600         } else {
2601                 if (!sbi->ll_rw_process_info || !sbi->ll_rw_offset_info) {
2602                         int rc = alloc_rw_stats_info(sbi);
2603
2604                         if (rc)
2605                                 return rc;
2606                 }
2607                 sbi->ll_rw_stats_on = 1;
2608         }
2609
2610         spin_lock(&sbi->ll_process_lock);
2611         sbi->ll_offset_process_count = 0;
2612         sbi->ll_rw_offset_entry_count = 0;
2613         sbi->ll_process_stats_init = ktime_get_real();
2614         if (sbi->ll_rw_process_info)
2615                 memset(sbi->ll_rw_process_info, 0,
2616                        sizeof(struct ll_rw_process_info) * LL_PROCESS_HIST_MAX);
2617         if (sbi->ll_rw_offset_info)
2618                 memset(sbi->ll_rw_offset_info, 0,
2619                        sizeof(struct ll_rw_process_info) * LL_OFFSET_HIST_MAX);
2620         spin_unlock(&sbi->ll_process_lock);
2621
2622         return len;
2623 }
2624
/*
 * NOTE(review): presumably instantiates the debugfs file operations for
 * "ll_rw_offset_stats" from ll_rw_offset_stats_seq_show() and
 * ll_rw_offset_stats_seq_write(); confirm against the LDEBUGFS_SEQ_FOPS
 * definition.
 */
2625 LDEBUGFS_SEQ_FOPS(ll_rw_offset_stats);