1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
4 * Copyright (C) 2001, 2002 Cluster File Systems, Inc.
6 * This file is part of Lustre, http://www.lustre.org.
8 * Lustre is free software; you can redistribute it and/or
9 * modify it under the terms of version 2 of the GNU General Public
10 * License as published by the Free Software Foundation.
12 * Lustre is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Lustre; if not, write to the Free Software
19 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
27 #include <linux/config.h>
28 #include <linux/autoconf.h>
29 #include <linux/slab.h>
30 #include <linux/highmem.h>
31 #include <linux/buffer_head.h>
33 #include <libcfs/kp30.h>
34 #include <linux/lustre_compat25.h>
36 /* global variables */
37 extern int obd_memmax;
38 extern atomic_t obd_memory;
40 extern unsigned int obd_fail_loc;
41 extern unsigned int obd_timeout;
42 extern unsigned int ldlm_timeout;
43 extern char obd_lustre_upcall[128];
44 extern unsigned int obd_sync_filter;
45 extern unsigned int obd_dump_on_timeout;
46 extern wait_queue_head_t obd_race_waitq;
/*
 * Failure-injection site ids for the MDS group (0x1xx).
 *
 * OBD_FAIL_CHECK() compares the low 16 bits of one of these ids with the low
 * 16 bits of obd_fail_loc.  The code paths that test each id live outside
 * this header.
 */
#define OBD_FAIL_MDS                        0x100
#define OBD_FAIL_MDS_HANDLE_UNPACK          0x101
#define OBD_FAIL_MDS_GETATTR_NET            0x102
#define OBD_FAIL_MDS_GETATTR_PACK           0x103
#define OBD_FAIL_MDS_READPAGE_NET           0x104
#define OBD_FAIL_MDS_READPAGE_PACK          0x105
#define OBD_FAIL_MDS_SENDPAGE               0x106
#define OBD_FAIL_MDS_REINT_NET              0x107
#define OBD_FAIL_MDS_REINT_UNPACK           0x108
#define OBD_FAIL_MDS_REINT_SETATTR          0x109
#define OBD_FAIL_MDS_REINT_SETATTR_WRITE    0x10a
#define OBD_FAIL_MDS_REINT_CREATE           0x10b
#define OBD_FAIL_MDS_REINT_CREATE_WRITE     0x10c
#define OBD_FAIL_MDS_REINT_UNLINK           0x10d
#define OBD_FAIL_MDS_REINT_UNLINK_WRITE     0x10e
#define OBD_FAIL_MDS_REINT_LINK             0x10f
#define OBD_FAIL_MDS_REINT_LINK_WRITE       0x110
#define OBD_FAIL_MDS_REINT_RENAME           0x111
#define OBD_FAIL_MDS_REINT_RENAME_WRITE     0x112
#define OBD_FAIL_MDS_OPEN_NET               0x113
#define OBD_FAIL_MDS_OPEN_PACK              0x114
#define OBD_FAIL_MDS_CLOSE_NET              0x115
#define OBD_FAIL_MDS_CLOSE_PACK             0x116
#define OBD_FAIL_MDS_CONNECT_NET            0x117
#define OBD_FAIL_MDS_CONNECT_PACK           0x118
#define OBD_FAIL_MDS_REINT_NET_REP          0x119
#define OBD_FAIL_MDS_DISCONNECT_NET         0x11a
#define OBD_FAIL_MDS_GETSTATUS_NET          0x11b
#define OBD_FAIL_MDS_GETSTATUS_PACK         0x11c
#define OBD_FAIL_MDS_STATFS_PACK            0x11d
#define OBD_FAIL_MDS_STATFS_NET             0x11e
#define OBD_FAIL_MDS_GETATTR_LOCK_NET       0x11f
#define OBD_FAIL_MDS_PIN_NET                0x120
#define OBD_FAIL_MDS_UNPIN_NET              0x121
#define OBD_FAIL_MDS_ALL_REPLY_NET          0x122
#define OBD_FAIL_MDS_ALL_REQUEST_NET        0x123
#define OBD_FAIL_MDS_SYNC_NET               0x124
#define OBD_FAIL_MDS_SYNC_PACK              0x125
#define OBD_FAIL_MDS_DONE_WRITING_NET       0x126
#define OBD_FAIL_MDS_DONE_WRITING_PACK      0x127
#define OBD_FAIL_MDS_ALLOC_OBDO             0x128
#define OBD_FAIL_MDS_PAUSE_OPEN             0x129
#define OBD_FAIL_MDS_STATFS_LCW_SLEEP       0x12a
#define OBD_FAIL_MDS_OPEN_CREATE            0x12b
/*
 * Failure-injection site ids for the OST group (0x2xx); matched against
 * obd_fail_loc by OBD_FAIL_CHECK().
 */
#define OBD_FAIL_OST                        0x200
#define OBD_FAIL_OST_CONNECT_NET            0x201
#define OBD_FAIL_OST_DISCONNECT_NET         0x202
#define OBD_FAIL_OST_GET_INFO_NET           0x203
#define OBD_FAIL_OST_CREATE_NET             0x204
#define OBD_FAIL_OST_DESTROY_NET            0x205
#define OBD_FAIL_OST_GETATTR_NET            0x206
#define OBD_FAIL_OST_SETATTR_NET            0x207
#define OBD_FAIL_OST_OPEN_NET               0x208
#define OBD_FAIL_OST_CLOSE_NET              0x209
#define OBD_FAIL_OST_BRW_NET                0x20a
#define OBD_FAIL_OST_PUNCH_NET              0x20b
#define OBD_FAIL_OST_STATFS_NET             0x20c
#define OBD_FAIL_OST_HANDLE_UNPACK          0x20d
#define OBD_FAIL_OST_BRW_WRITE_BULK         0x20e
#define OBD_FAIL_OST_BRW_READ_BULK          0x20f
#define OBD_FAIL_OST_SYNC_NET               0x210
#define OBD_FAIL_OST_ALL_REPLY_NET          0x211
#define OBD_FAIL_OST_ALL_REQUESTS_NET       0x212
#define OBD_FAIL_OST_LDLM_REPLY_NET         0x213
#define OBD_FAIL_OST_BRW_PAUSE_BULK         0x214
#define OBD_FAIL_OST_ENOSPC                 0x215
#define OBD_FAIL_OST_EROFS                  0x216
/*
 * Failure-injection site ids for the LDLM group (0x3xx); matched against
 * obd_fail_loc by OBD_FAIL_CHECK().
 */
#define OBD_FAIL_LDLM                       0x300
#define OBD_FAIL_LDLM_NAMESPACE_NEW         0x301
#define OBD_FAIL_LDLM_ENQUEUE               0x302
#define OBD_FAIL_LDLM_CONVERT               0x303
#define OBD_FAIL_LDLM_CANCEL                0x304
#define OBD_FAIL_LDLM_BL_CALLBACK           0x305
#define OBD_FAIL_LDLM_CP_CALLBACK           0x306
#define OBD_FAIL_LDLM_GL_CALLBACK           0x307
#define OBD_FAIL_LDLM_ENQUEUE_EXTENT_ERR    0x308
#define OBD_FAIL_LDLM_ENQUEUE_INTENT_ERR    0x309
#define OBD_FAIL_LDLM_CREATE_RESOURCE       0x30a
#define OBD_FAIL_LDLM_ENQUEUE_BLOCKED       0x30b
#define OBD_FAIL_LDLM_REPLY                 0x30c
/*
 * Failure-injection site ids for the OSC group (0x4xx); matched against
 * obd_fail_loc by OBD_FAIL_CHECK().
 */
#define OBD_FAIL_OSC                        0x400
#define OBD_FAIL_OSC_BRW_READ_BULK          0x401
#define OBD_FAIL_OSC_BRW_WRITE_BULK         0x402
#define OBD_FAIL_OSC_LOCK_BL_AST            0x403
#define OBD_FAIL_OSC_LOCK_CP_AST            0x404
#define OBD_FAIL_OSC_MATCH                  0x405
/*
 * Failure-injection site ids for the PTLRPC group (0x5xx); matched against
 * obd_fail_loc by OBD_FAIL_CHECK().
 */
#define OBD_FAIL_PTLRPC                     0x500
#define OBD_FAIL_PTLRPC_ACK                 0x501
#define OBD_FAIL_PTLRPC_RQBD                0x502
#define OBD_FAIL_PTLRPC_BULK_GET_NET        0x503
#define OBD_FAIL_PTLRPC_BULK_PUT_NET        0x504
/*
 * Failure-injection site ids in the 0x6xx group; matched against
 * obd_fail_loc by OBD_FAIL_CHECK().  Unlike the other groups there is no
 * separate base name: the first id already uses 0x600.
 */
#define OBD_FAIL_OBD_PING_NET               0x600
#define OBD_FAIL_OBD_LOG_CANCEL_NET         0x601
#define OBD_FAIL_OBD_LOGD_NET               0x602
/*
 * Failure-injection site ids in the 0x70x range; matched against
 * obd_fail_loc by OBD_FAIL_CHECK().
 */
#define OBD_FAIL_TGT_REPLY_NET              0x700
#define OBD_FAIL_TGT_CONN_RACE              0x701
/*
 * Failure-injection site ids for the SVCSEC / SVCGSS names.  They share the
 * 0x7xx system byte with the OBD_FAIL_TGT_* ids but start at 0x750, so the
 * low bytes do not collide.
 */
#define OBD_FAIL_SVCSEC_ACCEPT_BEG          0x750
#define OBD_FAIL_SVCSEC_ACCEPT_END          0x751
#define OBD_FAIL_SVCSEC_WRAP_BEG            0x752
#define OBD_FAIL_SVCSEC_WRAP_END            0x753
#define OBD_FAIL_SVCGSS_ERR_NOTIFY          0x760
#define OBD_FAIL_SVCGSS_INIT_REQ            0x780
#define OBD_FAIL_SVCGSS_INIT_REP            0x781
/* Only failure-injection site id in the 0x8xx group. */
#define OBD_FAIL_MDC_REVALIDATE_PAUSE       0x800
/* preparation for a more advanced failure testbed (not functional yet) */
#define OBD_FAIL_MASK_SYS    0x0000FF00   /* subsystem byte of a site id */
#define OBD_FAIL_MASK_LOC    (0x000000FF | OBD_FAIL_MASK_SYS) /* full site id */
#define OBD_FAIL_ONCE        0x80000000   /* flag bit above the site id */
#define OBD_FAILED           0x40000000   /* flag bit above the site id */
#define OBD_FAIL_MDS_ALL_NET 0x01000000
#define OBD_FAIL_OST_ALL_NET 0x02000000

/*
 * OBD_FAIL_CHECK(id) - should the failure site "id" fire right now?
 *
 * Non-zero when both hold:
 *   - the low 16 bits (OBD_FAIL_MASK_LOC) of obd_fail_loc equal those of id;
 *   - obd_fail_loc does not have OBD_FAILED and OBD_FAIL_ONCE both set.
 *
 * Flag bits carried in id itself are ignored by the comparison.  The macro
 * only reads obd_fail_loc; it never modifies it.
 */
#define OBD_FAIL_CHECK(id)   (((obd_fail_loc & OBD_FAIL_MASK_LOC) ==           \
                              ((id) & OBD_FAIL_MASK_LOC)) &&                   \
                              ((obd_fail_loc & (OBD_FAILED | OBD_FAIL_ONCE))!= \
                                (OBD_FAILED | OBD_FAIL_ONCE)))
176 #define OBD_FAIL_CHECK_ONCE(id) \
178 if (OBD_FAIL_CHECK(id)) { \
179 CERROR("obd_fail_loc=%x\n", id); \
180 obd_fail_loc |= OBD_FAILED; \
181 if ((id) & OBD_FAIL_ONCE) \
182 obd_fail_loc |= OBD_FAIL_ONCE; \
188 #define OBD_FAIL_RETURN(id, ret) \
190 if (OBD_FAIL_CHECK_ONCE(id)) { \
195 #define OBD_FAIL_GOTO(id, label, ret) \
197 if (OBD_FAIL_CHECK_ONCE(id)) { \
198 GOTO(label, (ret)); \
202 #define OBD_FAIL_TIMEOUT(id, secs) \
204 if (OBD_FAIL_CHECK_ONCE(id)) { \
205 CERROR("obd_fail_timeout id %x sleeping for %d secs\n", \
207 set_current_state(TASK_UNINTERRUPTIBLE); \
208 schedule_timeout((secs) * HZ); \
209 set_current_state(TASK_RUNNING); \
210 CERROR("obd_fail_timeout id %x awake\n", (id)); \
217 * sleep_on() is known to be racy, using wait_event() interface instead as
218 * recommended. --umka
220 #define OBD_SLEEP_ON(wq) \
222 DEFINE_WAIT(__wait); \
223 prepare_to_wait(&wq, &__wait, TASK_INTERRUPTIBLE); \
225 finish_wait(&wq, &__wait); \
228 /* The idea here is to synchronise two threads to force a race. The
229 * first thread that calls this with a matching fail_loc is put to
230 * sleep. The next thread that calls with the same fail_loc wakes up
231 * the first and continues. */
232 #define OBD_RACE(id) \
234 if (OBD_FAIL_CHECK_ONCE(id)) { \
235 CERROR("obd_race id %x sleeping\n", (id)); \
236 OBD_SLEEP_ON(obd_race_waitq); \
237 CERROR("obd_fail_race id %x awake\n", (id)); \
238 } else if ((obd_fail_loc & OBD_FAIL_MASK_LOC) == \
239 ((id) & OBD_FAIL_MASK_LOC)) { \
240 wake_up(&obd_race_waitq); \
/*
 * sigh. an expedient fix until OBD_RACE is fixed up
 *
 * This variant ignores its argument and expands to LBUG().
 */
#define OBD_RACE(foo) LBUG()
/*
 * Emit a "FIXME" marker through CDEBUG at D_OTHER.
 * NOTE(review): the expansion already ends in ';', so "fixme();" yields an
 * extra empty statement; kept as-is because callers may rely on either form.
 */
#define fixme() CDEBUG(D_OTHER, "FIXME\n");
251 # include <linux/types.h>
252 # include <linux/blkdev.h>
255 # if (LINUX_VERSION_CODE >= KERNEL_VERSION(2,5,0))
256 # define BDEVNAME_DECLARE_STORAGE(foo) char foo[BDEVNAME_SIZE]
257 # define ll_bdevname(SB, STORAGE) __bdevname(kdev_t_to_nr(SB->s_dev), STORAGE)
258 # define ll_lock_kernel lock_kernel()
259 # define ll_sbdev(SB) ((SB)->s_bdev)
260 # define ll_sbdev_type struct block_device *
261 # define ll_sbdev_sync fsync_bdev
263 # define BDEVNAME_DECLARE_STORAGE(foo) char __unused_##foo
264 # define ll_sbdev(SB) (kdev_t_to_nr((SB)->s_dev))
265 # define ll_sbdev_type kdev_t
266 # define ll_sbdev_sync fsync_dev
267 # define ll_bdevname(SB,STORAGE) ((void)__unused_##STORAGE,bdevname(ll_sbdev(SB)))
268 # define ll_lock_kernel
271 #ifdef HAVE_OLD_DEV_SET_RDONLY
272 void dev_set_rdonly(ll_sbdev_type dev, int no_write);
273 void dev_clear_rdonly(int no_write);
275 void dev_set_rdonly(ll_sbdev_type dev);
276 void dev_clear_rdonly(ll_sbdev_type dev);
278 int dev_check_rdonly(ll_sbdev_type dev);
279 #define ll_check_rdonly(dev) dev_check_rdonly(dev)
281 static inline void ll_set_rdonly(ll_sbdev_type dev)
283 CDEBUG(D_IOCTL | D_HA, "set dev %ld rdonly\n", (long)dev);
285 #ifdef HAVE_OLD_DEV_SET_RDONLY
286 dev_set_rdonly(dev, 2);
292 static inline void ll_clear_rdonly(ll_sbdev_type dev)
294 CDEBUG(D_IOCTL | D_HA, "unset dev %ld rdonly\n", (long)dev);
295 if (ll_check_rdonly(dev)) {
297 #ifdef HAVE_OLD_DEV_SET_RDONLY
300 dev_clear_rdonly(dev);
305 static inline void OBD_FAIL_WRITE(int id, struct super_block *sb)
307 if (OBD_FAIL_CHECK(id)) {
308 BDEVNAME_DECLARE_STORAGE(tmp);
309 CERROR("obd_fail_loc=%x, fail write operation on %s\n",
310 id, ll_bdevname(sb, tmp));
311 ll_set_rdonly(ll_sbdev(sb));
312 /* We set FAIL_ONCE because we never "un-fail" a device */
313 obd_fail_loc |= OBD_FAILED | OBD_FAIL_ONCE;
316 #else /* !__KERNEL__ */
/* In this branch a time value is used directly; the macro is the identity. */
# define LTIME_S(time) (time)
/* for obd_class.h */
/* Plain cast of the argument to void *; no encoding is applied. */
# define ERR_PTR(a) ((void *)(a))
322 #endif /* __KERNEL__ */
324 extern atomic_t portal_kmemory;
326 #if defined (CONFIG_DEBUG_MEMORY) && defined(__KERNEL__)
/* OR-ed into mem_track.m_flags when a chunk is freed with a different size. */
#define MT_FLAGS_WRONG_SIZE (1 << 0)
/* Capacity of mem_track.m_loc, which stores a "file:line" string. */
#define MEM_LOC_LEN 128
332 struct hlist_node m_hash;
333 char m_loc[MEM_LOC_LEN];
/*
 * Memory-tracking table interface; implemented outside this header.
 * NOTE(review): exact semantics of show/insert/remove/find are not visible
 * here -- confirm against the implementation.
 */
void lvfs_memdbg_show(void);
void lvfs_memdbg_insert(struct mem_track *mt);
void lvfs_memdbg_remove(struct mem_track *mt);
struct mem_track *lvfs_memdbg_find(void *ptr);

/*
 * Checked variants used by the inline helpers in this header:
 *  - a zero return from lvfs_memdbg_check_insert() makes the caller free mt;
 *  - a NULL return from lvfs_memdbg_check_remove() is reported by the caller
 *    as an attempt to free memory that was never allocated.
 */
int lvfs_memdbg_check_insert(struct mem_track *mt);
struct mem_track *lvfs_memdbg_check_remove(void *ptr);
347 static inline struct mem_track *
348 __new_mem_track(void *ptr, int size,
349 char *file, int line)
351 struct mem_track *mt;
353 mt = kmalloc(sizeof(*mt), GFP_KERNEL);
357 snprintf(mt->m_loc, sizeof(mt->m_loc) - 1,
358 "%s:%d", file, line);
367 __free_mem_track(struct mem_track *mt)
373 __get_mem_track(void *ptr, int size,
374 char *file, int line)
376 struct mem_track *mt;
378 mt = __new_mem_track(ptr, size, file, line);
380 CWARN("can't allocate new memory track\n");
384 if (!lvfs_memdbg_check_insert(mt))
385 __free_mem_track(mt);
391 __put_mem_track(void *ptr, int size,
392 char *file, int line)
394 struct mem_track *mt;
396 if (!(mt = lvfs_memdbg_check_remove(ptr))) {
397 CWARN("ptr 0x%p is not allocated. Attempt to free "
398 "not allocated memory at %s:%d\n", ptr,
402 if (mt->m_size != size) {
403 mt->m_flags |= MT_FLAGS_WRONG_SIZE;
404 CWARN("freeing memory chunk of different size "
405 "than allocated (%d != %d) at %s:%d\n",
406 mt->m_size, size, file, line);
408 __free_mem_track(mt);
/*
 * Tracking-enabled forms of the hooks that the allocation and free macros
 * invoke with __FILE__/__LINE__.  Each argument is parenthesised before being
 * handed to the inline helper.
 */
#define get_mem_track(ptr, size, file, line)                                  \
        __get_mem_track((ptr), (size), (file), (line))

#define put_mem_track(ptr, size, file, line)                                  \
        __put_mem_track((ptr), (size), (file), (line))
420 #else /* !CONFIG_DEBUG_MEMORY */
422 #define get_mem_track(ptr, size, file, line) \
425 #define put_mem_track(ptr, size, file, line) \
427 #endif /* !CONFIG_DEBUG_MEMORY */
429 #define OBD_ALLOC_GFP(ptr, size, gfp_mask) \
431 (ptr) = kmalloc(size, (gfp_mask)); \
432 if ((ptr) == NULL) { \
433 CERROR("kmalloc of '" #ptr "' (%d bytes) failed at %s:%d\n", \
434 (int)(size), __FILE__, __LINE__); \
435 CERROR("%d total bytes allocated by Lustre, %d by Portals\n", \
436 atomic_read(&obd_memory), atomic_read(&portal_kmemory)); \
438 memset(ptr, 0, size); \
439 atomic_add(size, &obd_memory); \
440 if (atomic_read(&obd_memory) > obd_memmax) \
441 obd_memmax = atomic_read(&obd_memory); \
442 get_mem_track((ptr), (size), __FILE__, __LINE__); \
443 CDEBUG(D_MALLOC, "kmalloced '" #ptr "': %d at %p (tot %d)\n", \
444 (int)(size), (ptr), atomic_read(&obd_memory)); \
/* Allocation flags that OBD_ALLOC() passes to OBD_ALLOC_GFP(). */
# define OBD_GFP_MASK GFP_NOFS
/* kmalloc-backed form: OBD_ALLOC_GFP() with the default OBD_GFP_MASK. */
#define OBD_ALLOC(ptr, size) OBD_ALLOC_GFP(ptr, size, OBD_GFP_MASK)
/*
 * C-library form of OBD_ALLOC().  Uses calloc() so the memory comes back
 * zero-filled, matching the kmalloc-backed form, which memset()s the block
 * to 0 after allocating.  Evaluates to the assigned pointer (NULL on failure).
 */
#define OBD_ALLOC(ptr, size) ((ptr) = calloc(1, (size)))
/* Same as OBD_ALLOC_GFP() but always with GFP_KERNEL. */
#define OBD_ALLOC_WAIT(ptr, size) OBD_ALLOC_GFP(ptr, size, GFP_KERNEL)
/* Variant in which OBD_VMALLOC() is simply an alias for OBD_ALLOC(). */
# define OBD_VMALLOC(ptr, size) OBD_ALLOC(ptr, size)
463 # define OBD_VMALLOC(ptr, size) \
465 (ptr) = vmalloc(size); \
466 if ((ptr) == NULL) { \
467 CERROR("vmalloc of '" #ptr "' (%d bytes) failed at %s:%d\n", \
468 (int)(size), __FILE__, __LINE__); \
469 CERROR("%d total bytes allocated by Lustre, %d by Portals\n", \
470 atomic_read(&obd_memory), atomic_read(&portal_kmemory)); \
472 memset(ptr, 0, size); \
473 atomic_add(size, &obd_memory); \
474 if (atomic_read(&obd_memory) > obd_memmax) \
475 obd_memmax = atomic_read(&obd_memory); \
476 get_mem_track((ptr), (size), __FILE__, __LINE__); \
477 CDEBUG(D_MALLOC, "vmalloced '" #ptr "': %d at %p (tot %d)\n", \
478 (int)(size), ptr, atomic_read(&obd_memory)); \
/*
 * POISON(ptr, c, s) - overwrite s bytes at ptr with the byte c; used by the
 * free macros just before releasing memory.  Compiled out when
 * CONFIG_DEBUG_SLAB is defined.
 */
#ifdef CONFIG_DEBUG_SLAB
#define POISON(ptr, c, s) do {} while (0)
#else
#define POISON(ptr, c, s) memset(ptr, c, s)
#endif
/*
 * Fill one whole page with the byte val: map it with kmap(), memset()
 * PAGE_SIZE bytes, then kunmap() it again.
 */
#define POISON_PAGE(page, val) do { memset(kmap(page), val, PAGE_SIZE);   \
                                    kunmap(page); } while (0)
/* Disabled form: expands to an empty statement and evaluates no argument. */
#define POISON_PAGE(page, val) do { } while (0)
497 #define OBD_FREE(ptr, size) \
500 put_mem_track((ptr), (size), __FILE__, __LINE__); \
501 atomic_sub(size, &obd_memory); \
502 CDEBUG(D_MALLOC, "kfreed '" #ptr "': %d at %p (tot %d).\n", \
503 (int)(size), ptr, atomic_read(&obd_memory)); \
504 POISON(ptr, 0x5a, size); \
506 (ptr) = (void *)0xdeadbeef; \
/*
 * C-library form of OBD_FREE(): size is evaluated and discarded, then ptr is
 * passed to free().  Unlike the kernel form, ptr is not overwritten afterwards.
 */
#define OBD_FREE(ptr, size) ((void)(size), free((ptr)))
/* Variant in which OBD_VFREE() is simply an alias for OBD_FREE(). */
# define OBD_VFREE(ptr, size) OBD_FREE(ptr, size)
515 # define OBD_VFREE(ptr, size) \
518 put_mem_track((ptr), (size), __FILE__, __LINE__); \
519 atomic_sub(size, &obd_memory); \
520 CDEBUG(D_MALLOC, "vfreed '" #ptr "': %d at %p (tot %d).\n", \
521 (int)(size), ptr, atomic_read(&obd_memory)); \
522 POISON(ptr, 0x5a, size); \
524 (ptr) = (void *)0xdeadbeef; \
529 * we memset() the slab object to 0 when allocation succeeds, so DO NOT HAVE A
530 * CTOR THAT DOES ANYTHING. Its work will be cleared here. We'd love to assert
531 * on that, but slab.c keeps kmem_cache_s all to itself.
533 #define OBD_SLAB_ALLOC(ptr, slab, type, size) \
535 LASSERT(!in_interrupt()); \
536 (ptr) = kmem_cache_alloc(slab, (type)); \
537 if ((ptr) == NULL) { \
538 CERROR("slab-alloc of '"#ptr"' (%d bytes) failed at %s:%d\n", \
539 (int)(size), __FILE__, __LINE__); \
540 CERROR("%d total bytes allocated by Lustre, %d by Portals\n", \
541 atomic_read(&obd_memory), atomic_read(&portal_kmemory)); \
543 memset(ptr, 0, size); \
544 atomic_add(size, &obd_memory); \
545 if (atomic_read(&obd_memory) > obd_memmax) \
546 obd_memmax = atomic_read(&obd_memory); \
547 get_mem_track((ptr), (size), __FILE__, __LINE__); \
548 CDEBUG(D_MALLOC, "slab-alloced '"#ptr"': %d at %p (tot %d)\n", \
549 (int)(size), ptr, atomic_read(&obd_memory)); \
553 #define OBD_SLAB_FREE(ptr, slab, size) \
556 CDEBUG(D_MALLOC, "slab-freed '" #ptr "': %d at %p (tot %d).\n", \
557 (int)(size), ptr, atomic_read(&obd_memory)); \
558 put_mem_track((ptr), (size), __FILE__, __LINE__); \
559 atomic_sub(size, &obd_memory); \
560 POISON(ptr, 0x5a, size); \
561 kmem_cache_free(slab, ptr); \
562 (ptr) = (void *)0xdeadbeef; \