1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
4 * Copyright (C) 2001, 2002 Cluster File Systems, Inc.
6 * This file is part of Lustre, http://www.lustre.org.
8 * Lustre is free software; you can redistribute it and/or
9 * modify it under the terms of version 2 of the GNU General Public
10 * License as published by the Free Software Foundation.
12 * Lustre is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Lustre; if not, write to the Free Software
19 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
27 #include <linux/config.h>
28 #include <linux/autoconf.h>
29 #include <linux/slab.h>
30 #include <linux/highmem.h>
31 #include <linux/buffer_head.h>
33 #include <libcfs/kp30.h>
34 #include <linux/lustre_compat25.h>
36 /* global variables */
37 extern int obd_memmax;
38 extern atomic_t obd_memory;
40 extern unsigned int obd_fail_loc;
41 extern unsigned int obd_timeout;
42 extern unsigned int ldlm_timeout;
43 extern char obd_lustre_upcall[128];
44 extern unsigned int obd_sync_filter;
45 extern unsigned int obd_dump_on_timeout;
46 extern wait_queue_head_t obd_race_waitq;
48 #define OBD_FAIL_MDS 0x100
49 #define OBD_FAIL_MDS_HANDLE_UNPACK 0x101
50 #define OBD_FAIL_MDS_GETATTR_NET 0x102
51 #define OBD_FAIL_MDS_GETATTR_PACK 0x103
52 #define OBD_FAIL_MDS_READPAGE_NET 0x104
53 #define OBD_FAIL_MDS_READPAGE_PACK 0x105
54 #define OBD_FAIL_MDS_SENDPAGE 0x106
55 #define OBD_FAIL_MDS_REINT_NET 0x107
56 #define OBD_FAIL_MDS_REINT_UNPACK 0x108
57 #define OBD_FAIL_MDS_REINT_SETATTR 0x109
58 #define OBD_FAIL_MDS_REINT_SETATTR_WRITE 0x10a
59 #define OBD_FAIL_MDS_REINT_CREATE 0x10b
60 #define OBD_FAIL_MDS_REINT_CREATE_WRITE 0x10c
61 #define OBD_FAIL_MDS_REINT_UNLINK 0x10d
62 #define OBD_FAIL_MDS_REINT_UNLINK_WRITE 0x10e
63 #define OBD_FAIL_MDS_REINT_LINK 0x10f
64 #define OBD_FAIL_MDS_REINT_LINK_WRITE 0x110
65 #define OBD_FAIL_MDS_REINT_RENAME 0x111
66 #define OBD_FAIL_MDS_REINT_RENAME_WRITE 0x112
67 #define OBD_FAIL_MDS_OPEN_NET 0x113
68 #define OBD_FAIL_MDS_OPEN_PACK 0x114
69 #define OBD_FAIL_MDS_CLOSE_NET 0x115
70 #define OBD_FAIL_MDS_CLOSE_PACK 0x116
71 #define OBD_FAIL_MDS_CONNECT_NET 0x117
72 #define OBD_FAIL_MDS_CONNECT_PACK 0x118
73 #define OBD_FAIL_MDS_REINT_NET_REP 0x119
74 #define OBD_FAIL_MDS_DISCONNECT_NET 0x11a
75 #define OBD_FAIL_MDS_GETSTATUS_NET 0x11b
76 #define OBD_FAIL_MDS_GETSTATUS_PACK 0x11c
77 #define OBD_FAIL_MDS_STATFS_PACK 0x11d
78 #define OBD_FAIL_MDS_STATFS_NET 0x11e
79 #define OBD_FAIL_MDS_GETATTR_LOCK_NET 0x11f
80 #define OBD_FAIL_MDS_PIN_NET 0x120
81 #define OBD_FAIL_MDS_UNPIN_NET 0x121
82 #define OBD_FAIL_MDS_ALL_REPLY_NET 0x122
83 #define OBD_FAIL_MDS_ALL_REQUEST_NET 0x123
84 #define OBD_FAIL_MDS_SYNC_NET 0x124
85 #define OBD_FAIL_MDS_SYNC_PACK 0x125
86 #define OBD_FAIL_MDS_DONE_WRITING_NET 0x126
87 #define OBD_FAIL_MDS_DONE_WRITING_PACK 0x127
88 #define OBD_FAIL_MDS_ALLOC_OBDO 0x128
89 #define OBD_FAIL_MDS_PAUSE_OPEN 0x129
90 #define OBD_FAIL_MDS_STATFS_LCW_SLEEP 0x12a
91 #define OBD_FAIL_MDS_OPEN_CREATE 0x12b
92 #define OBD_FAIL_MDS_ACCESS_CHECK_NET 0x12c
93 #define OBD_FAIL_MDS_ACCESS_CHECK_PACK 0x12d
95 #define OBD_FAIL_OST 0x200
96 #define OBD_FAIL_OST_CONNECT_NET 0x201
97 #define OBD_FAIL_OST_DISCONNECT_NET 0x202
98 #define OBD_FAIL_OST_GET_INFO_NET 0x203
99 #define OBD_FAIL_OST_CREATE_NET 0x204
100 #define OBD_FAIL_OST_DESTROY_NET 0x205
101 #define OBD_FAIL_OST_GETATTR_NET 0x206
102 #define OBD_FAIL_OST_SETATTR_NET 0x207
103 #define OBD_FAIL_OST_OPEN_NET 0x208
104 #define OBD_FAIL_OST_CLOSE_NET 0x209
105 #define OBD_FAIL_OST_BRW_NET 0x20a
106 #define OBD_FAIL_OST_PUNCH_NET 0x20b
107 #define OBD_FAIL_OST_STATFS_NET 0x20c
108 #define OBD_FAIL_OST_HANDLE_UNPACK 0x20d
109 #define OBD_FAIL_OST_BRW_WRITE_BULK 0x20e
110 #define OBD_FAIL_OST_BRW_READ_BULK 0x20f
111 #define OBD_FAIL_OST_SYNC_NET 0x210
112 #define OBD_FAIL_OST_ALL_REPLY_NET 0x211
113 #define OBD_FAIL_OST_ALL_REQUESTS_NET 0x212
114 #define OBD_FAIL_OST_LDLM_REPLY_NET 0x213
115 #define OBD_FAIL_OST_BRW_PAUSE_BULK 0x214
116 #define OBD_FAIL_OST_ENOSPC 0x215
117 #define OBD_FAIL_OST_EROFS 0x216
120 #define OBD_FAIL_LDLM 0x300
121 #define OBD_FAIL_LDLM_NAMESPACE_NEW 0x301
122 #define OBD_FAIL_LDLM_ENQUEUE 0x302
123 #define OBD_FAIL_LDLM_CONVERT 0x303
124 #define OBD_FAIL_LDLM_CANCEL 0x304
125 #define OBD_FAIL_LDLM_BL_CALLBACK 0x305
126 #define OBD_FAIL_LDLM_CP_CALLBACK 0x306
127 #define OBD_FAIL_LDLM_GL_CALLBACK 0x307
128 #define OBD_FAIL_LDLM_ENQUEUE_EXTENT_ERR 0x308
129 #define OBD_FAIL_LDLM_ENQUEUE_INTENT_ERR 0x309
130 #define OBD_FAIL_LDLM_CREATE_RESOURCE 0x30a
131 #define OBD_FAIL_LDLM_ENQUEUE_BLOCKED 0x30b
132 #define OBD_FAIL_LDLM_REPLY 0x30c
135 #define OBD_FAIL_OSC 0x400
136 #define OBD_FAIL_OSC_BRW_READ_BULK 0x401
137 #define OBD_FAIL_OSC_BRW_WRITE_BULK 0x402
138 #define OBD_FAIL_OSC_LOCK_BL_AST 0x403
139 #define OBD_FAIL_OSC_LOCK_CP_AST 0x404
140 #define OBD_FAIL_OSC_MATCH 0x405
142 #define OBD_FAIL_PTLRPC 0x500
143 #define OBD_FAIL_PTLRPC_ACK 0x501
144 #define OBD_FAIL_PTLRPC_RQBD 0x502
145 #define OBD_FAIL_PTLRPC_BULK_GET_NET 0x503
146 #define OBD_FAIL_PTLRPC_BULK_PUT_NET 0x504
148 #define OBD_FAIL_OBD_PING_NET 0x600
149 #define OBD_FAIL_OBD_LOG_CANCEL_NET 0x601
150 #define OBD_FAIL_OBD_LOGD_NET 0x602
152 #define OBD_FAIL_TGT_REPLY_NET 0x700
153 #define OBD_FAIL_TGT_CONN_RACE 0x701
155 #define OBD_FAIL_SVCSEC_ACCEPT_BEG 0x750
156 #define OBD_FAIL_SVCSEC_ACCEPT_END 0x751
157 #define OBD_FAIL_SVCSEC_WRAP_BEG 0x752
158 #define OBD_FAIL_SVCSEC_WRAP_END 0x753
159 #define OBD_FAIL_SVCGSS_ERR_NOTIFY 0x760
160 #define OBD_FAIL_SVCGSS_INIT_REQ 0x780
161 #define OBD_FAIL_SVCGSS_INIT_REP 0x781
163 #define OBD_FAIL_MDC_REVALIDATE_PAUSE 0x800
165 /* preparation for a more advanced failure testbed (not functional yet) */
166 #define OBD_FAIL_MASK_SYS 0x0000FF00
167 #define OBD_FAIL_MASK_LOC (0x000000FF | OBD_FAIL_MASK_SYS)
168 #define OBD_FAIL_ONCE 0x80000000
169 #define OBD_FAILED 0x40000000
170 #define OBD_FAIL_MDS_ALL_NET 0x01000000
171 #define OBD_FAIL_OST_ALL_NET 0x02000000
173 #define OBD_FAIL_CHECK(id) (((obd_fail_loc & OBD_FAIL_MASK_LOC) == \
174 ((id) & OBD_FAIL_MASK_LOC)) && \
175 ((obd_fail_loc & (OBD_FAILED | OBD_FAIL_ONCE))!= \
176 (OBD_FAILED | OBD_FAIL_ONCE)))
178 #define OBD_FAIL_CHECK_ONCE(id) \
180 if (OBD_FAIL_CHECK(id)) { \
181 CERROR("obd_fail_loc=%x\n", id); \
182 obd_fail_loc |= OBD_FAILED; \
183 if ((id) & OBD_FAIL_ONCE) \
184 obd_fail_loc |= OBD_FAIL_ONCE; \
190 #define OBD_FAIL_RETURN(id, ret) \
192 if (OBD_FAIL_CHECK_ONCE(id)) { \
197 #define OBD_FAIL_GOTO(id, label, ret) \
199 if (OBD_FAIL_CHECK_ONCE(id)) { \
200 GOTO(label, (ret)); \
204 #define OBD_FAIL_TIMEOUT(id, secs) \
206 if (OBD_FAIL_CHECK_ONCE(id)) { \
207 CERROR("obd_fail_timeout id %x sleeping for %d secs\n", \
209 set_current_state(TASK_UNINTERRUPTIBLE); \
210 schedule_timeout((secs) * HZ); \
211 set_current_state(TASK_RUNNING); \
212 CERROR("obd_fail_timeout id %x awake\n", (id)); \
219 * sleep_on() is known to be racy, using wait_event() interface instead as
220 * recommended. --umka
222 #define OBD_SLEEP_ON(wq) \
224 DEFINE_WAIT(__wait); \
225 prepare_to_wait(&wq, &__wait, TASK_INTERRUPTIBLE); \
227 finish_wait(&wq, &__wait); \
230 /* The idea here is to synchronise two threads to force a race. The
231 * first thread that calls this with a matching fail_loc is put to
232 * sleep. The next thread that calls with the same fail_loc wakes up
233 * the first and continues. */
234 #define OBD_RACE(id) \
236 if (OBD_FAIL_CHECK_ONCE(id)) { \
237 CERROR("obd_race id %x sleeping\n", (id)); \
238 OBD_SLEEP_ON(obd_race_waitq); \
239 CERROR("obd_fail_race id %x awake\n", (id)); \
240 } else if ((obd_fail_loc & OBD_FAIL_MASK_LOC) == \
241 ((id) & OBD_FAIL_MASK_LOC)) { \
242 wake_up(&obd_race_waitq); \
246 /* sigh. an expedient fix until OBD_RACE is fixed up */
247 #define OBD_RACE(foo) LBUG()
250 #define fixme() CDEBUG(D_OTHER, "FIXME\n");
253 # include <linux/types.h>
254 # include <linux/blkdev.h>
257 # if (LINUX_VERSION_CODE >= KERNEL_VERSION(2,5,0))
258 # define BDEVNAME_DECLARE_STORAGE(foo) char foo[BDEVNAME_SIZE]
259 # define ll_bdevname(SB, STORAGE) __bdevname(kdev_t_to_nr(SB->s_dev), STORAGE)
260 # define ll_lock_kernel lock_kernel()
261 # define ll_sbdev(SB) ((SB)->s_bdev)
262 # define ll_sbdev_type struct block_device *
263 # define ll_sbdev_sync fsync_bdev
265 # define BDEVNAME_DECLARE_STORAGE(foo) char __unused_##foo
266 # define ll_sbdev(SB) (kdev_t_to_nr((SB)->s_dev))
267 # define ll_sbdev_type kdev_t
268 # define ll_sbdev_sync fsync_dev
269 # define ll_bdevname(SB,STORAGE) ((void)__unused_##STORAGE,bdevname(ll_sbdev(SB)))
270 # define ll_lock_kernel
273 #ifdef HAVE_OLD_DEV_SET_RDONLY
274 void dev_set_rdonly(ll_sbdev_type dev, int no_write);
275 void dev_clear_rdonly(int no_write);
277 void dev_set_rdonly(ll_sbdev_type dev);
278 void dev_clear_rdonly(ll_sbdev_type dev);
280 int dev_check_rdonly(ll_sbdev_type dev);
281 #define ll_check_rdonly(dev) dev_check_rdonly(dev)
283 static inline void ll_set_rdonly(ll_sbdev_type dev)
285 CDEBUG(D_IOCTL | D_HA, "set dev %ld rdonly\n", (long)dev);
287 #ifdef HAVE_OLD_DEV_SET_RDONLY
288 dev_set_rdonly(dev, 2);
294 static inline void ll_clear_rdonly(ll_sbdev_type dev)
296 CDEBUG(D_IOCTL | D_HA, "unset dev %ld rdonly\n", (long)dev);
297 if (ll_check_rdonly(dev)) {
299 #ifdef HAVE_OLD_DEV_SET_RDONLY
302 dev_clear_rdonly(dev);
307 static inline void OBD_FAIL_WRITE(int id, struct super_block *sb)
309 if (OBD_FAIL_CHECK(id)) {
310 BDEVNAME_DECLARE_STORAGE(tmp);
311 CERROR("obd_fail_loc=%x, fail write operation on %s\n",
312 id, ll_bdevname(sb, tmp));
313 ll_set_rdonly(ll_sbdev(sb));
314 /* We set FAIL_ONCE because we never "un-fail" a device */
315 obd_fail_loc |= OBD_FAILED | OBD_FAIL_ONCE;
318 #else /* !__KERNEL__ */
319 # define LTIME_S(time) (time)
320 /* for obd_class.h */
322 # define ERR_PTR(a) ((void *)(a))
324 #endif /* __KERNEL__ */
326 extern atomic_t portal_kmemory;
328 #if defined (CONFIG_DEBUG_MEMORY) && defined(__KERNEL__)
330 #define MT_FLAGS_WRONG_SIZE (1 << 0)
331 #define MEM_LOC_LEN 128
334 struct hlist_node m_hash;
335 char m_loc[MEM_LOC_LEN];
341 void lvfs_memdbg_show(void);
342 void lvfs_memdbg_insert(struct mem_track *mt);
343 void lvfs_memdbg_remove(struct mem_track *mt);
344 struct mem_track *lvfs_memdbg_find(void *ptr);
346 int lvfs_memdbg_check_insert(struct mem_track *mt);
347 struct mem_track *lvfs_memdbg_check_remove(void *ptr);
349 static inline struct mem_track *
350 __new_mem_track(void *ptr, int size,
351 char *file, int line)
353 struct mem_track *mt;
355 mt = kmalloc(sizeof(*mt), GFP_KERNEL);
359 snprintf(mt->m_loc, sizeof(mt->m_loc) - 1,
360 "%s:%d", file, line);
369 __free_mem_track(struct mem_track *mt)
375 __get_mem_track(void *ptr, int size,
376 char *file, int line)
378 struct mem_track *mt;
380 mt = __new_mem_track(ptr, size, file, line);
382 CWARN("can't allocate new memory track\n");
386 if (!lvfs_memdbg_check_insert(mt))
387 __free_mem_track(mt);
393 __put_mem_track(void *ptr, int size,
394 char *file, int line)
396 struct mem_track *mt;
398 if (!(mt = lvfs_memdbg_check_remove(ptr))) {
399 CWARN("ptr 0x%p is not allocated. Attempt to free "
400 "not allocated memory at %s:%d\n", ptr,
404 if (mt->m_size != size) {
405 mt->m_flags |= MT_FLAGS_WRONG_SIZE;
406 CWARN("freeing memory chunk of different size "
407 "than allocated (%d != %d) at %s:%d\n",
408 mt->m_size, size, file, line);
410 __free_mem_track(mt);
416 #define get_mem_track(ptr, size, file, line) \
417 __get_mem_track((ptr), (size), (file), (line))
419 #define put_mem_track(ptr, size, file, line) \
420 __put_mem_track((ptr), (size), (file), (line))
422 #else /* !CONFIG_DEBUG_MEMORY */
424 #define get_mem_track(ptr, size, file, line) \
427 #define put_mem_track(ptr, size, file, line) \
429 #endif /* !CONFIG_DEBUG_MEMORY */
431 #define OBD_ALLOC_GFP(ptr, size, gfp_mask) \
433 (ptr) = kmalloc(size, (gfp_mask)); \
434 if ((ptr) == NULL) { \
435 CERROR("kmalloc of '" #ptr "' (%d bytes) failed at %s:%d\n", \
436 (int)(size), __FILE__, __LINE__); \
437 CERROR("%d total bytes allocated by Lustre, %d by Portals\n", \
438 atomic_read(&obd_memory), atomic_read(&portal_kmemory)); \
440 memset(ptr, 0, size); \
441 atomic_add(size, &obd_memory); \
442 if (atomic_read(&obd_memory) > obd_memmax) \
443 obd_memmax = atomic_read(&obd_memory); \
444 get_mem_track((ptr), (size), __FILE__, __LINE__); \
445 CDEBUG(D_MALLOC, "kmalloced '" #ptr "': %d at %p (tot %d)\n", \
446 (int)(size), (ptr), atomic_read(&obd_memory)); \
451 # define OBD_GFP_MASK GFP_NOFS
455 #define OBD_ALLOC(ptr, size) OBD_ALLOC_GFP(ptr, size, OBD_GFP_MASK)
457 #define OBD_ALLOC(ptr, size) (ptr = malloc(size))
460 #define OBD_ALLOC_WAIT(ptr, size) OBD_ALLOC_GFP(ptr, size, GFP_KERNEL)
463 # define OBD_VMALLOC(ptr, size) OBD_ALLOC(ptr, size)
465 # define OBD_VMALLOC(ptr, size) \
467 (ptr) = vmalloc(size); \
468 if ((ptr) == NULL) { \
469 CERROR("vmalloc of '" #ptr "' (%d bytes) failed at %s:%d\n", \
470 (int)(size), __FILE__, __LINE__); \
471 CERROR("%d total bytes allocated by Lustre, %d by Portals\n", \
472 atomic_read(&obd_memory), atomic_read(&portal_kmemory)); \
474 memset(ptr, 0, size); \
475 atomic_add(size, &obd_memory); \
476 if (atomic_read(&obd_memory) > obd_memmax) \
477 obd_memmax = atomic_read(&obd_memory); \
478 get_mem_track((ptr), (size), __FILE__, __LINE__); \
479 CDEBUG(D_MALLOC, "vmalloced '" #ptr "': %d at %p (tot %d)\n", \
480 (int)(size), ptr, atomic_read(&obd_memory)); \
485 #ifdef CONFIG_DEBUG_SLAB
486 #define POISON(ptr, c, s) do {} while (0)
488 #define POISON(ptr, c, s) memset(ptr, c, s)
492 #define POISON_PAGE(page, val) do { memset(kmap(page), val, PAGE_SIZE); \
493 kunmap(page); } while (0)
495 #define POISON_PAGE(page, val) do { } while (0)
499 #define OBD_FREE(ptr, size) \
502 put_mem_track((ptr), (size), __FILE__, __LINE__); \
503 atomic_sub(size, &obd_memory); \
504 CDEBUG(D_MALLOC, "kfreed '" #ptr "': %d at %p (tot %d).\n", \
505 (int)(size), ptr, atomic_read(&obd_memory)); \
506 POISON(ptr, 0x5a, size); \
508 (ptr) = (void *)0xdeadbeef; \
511 #define OBD_FREE(ptr, size) ((void)(size), free((ptr)))
515 # define OBD_VFREE(ptr, size) OBD_FREE(ptr, size)
517 # define OBD_VFREE(ptr, size) \
520 put_mem_track((ptr), (size), __FILE__, __LINE__); \
521 atomic_sub(size, &obd_memory); \
522 CDEBUG(D_MALLOC, "vfreed '" #ptr "': %d at %p (tot %d).\n", \
523 (int)(size), ptr, atomic_read(&obd_memory)); \
524 POISON(ptr, 0x5a, size); \
526 (ptr) = (void *)0xdeadbeef; \
531 * we memset() the slab object to 0 when allocation succeeds, so DO NOT HAVE A
532 * CTOR THAT DOES ANYTHING. Its work will be cleared here. We'd love to assert
533 * on that, but slab.c keeps kmem_cache_s all to itself.
535 #define OBD_SLAB_ALLOC(ptr, slab, type, size) \
537 LASSERT(!in_interrupt()); \
538 (ptr) = kmem_cache_alloc(slab, (type)); \
539 if ((ptr) == NULL) { \
540 CERROR("slab-alloc of '"#ptr"' (%d bytes) failed at %s:%d\n", \
541 (int)(size), __FILE__, __LINE__); \
542 CERROR("%d total bytes allocated by Lustre, %d by Portals\n", \
543 atomic_read(&obd_memory), atomic_read(&portal_kmemory)); \
545 memset(ptr, 0, size); \
546 atomic_add(size, &obd_memory); \
547 if (atomic_read(&obd_memory) > obd_memmax) \
548 obd_memmax = atomic_read(&obd_memory); \
549 get_mem_track((ptr), (size), __FILE__, __LINE__); \
550 CDEBUG(D_MALLOC, "slab-alloced '"#ptr"': %d at %p (tot %d)\n", \
551 (int)(size), ptr, atomic_read(&obd_memory)); \
555 #define OBD_SLAB_FREE(ptr, slab, size) \
558 CDEBUG(D_MALLOC, "slab-freed '" #ptr "': %d at %p (tot %d).\n", \
559 (int)(size), ptr, atomic_read(&obd_memory)); \
560 put_mem_track((ptr), (size), __FILE__, __LINE__); \
561 atomic_sub(size, &obd_memory); \
562 POISON(ptr, 0x5a, size); \
563 kmem_cache_free(slab, ptr); \
564 (ptr) = (void *)0xdeadbeef; \