Whamcloud - gitweb
- fixes for dentry problems from Phil and myself
[fs/lustre-release.git] / lustre / ldlm / ldlm_lockd.c
1
2
3 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
4  * vim:expandtab:shiftwidth=8:tabstop=8:
5  *
6  * Copyright (C) 2002 Cluster File Systems, Inc.
7  *   Author: Peter Braam <braam@clusterfs.com>
8  *   Author: Phil Schwan <phil@clusterfs.com>
9  *
10  *   This file is part of Lustre, http://www.lustre.org.
11  *
12  *   Lustre is free software; you can redistribute it and/or
13  *   modify it under the terms of version 2 of the GNU General Public
14  *   License as published by the Free Software Foundation.
15  *
16  *   Lustre is distributed in the hope that it will be useful,
17  *   but WITHOUT ANY WARRANTY; without even the implied warranty of
18  *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
19  *   GNU General Public License for more details.
20  *
21  *   You should have received a copy of the GNU General Public License
22  *   along with Lustre; if not, write to the Free Software
23  *   Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
24  */
25
26 #define EXPORT_SYMTAB
27 #define DEBUG_SUBSYSTEM S_LDLM
28
29 #include <linux/module.h>
30 #include <linux/slab.h>
31 #include <linux/lustre_dlm.h>
32 #include <linux/init.h>
33 #include <linux/obd_class.h>
34
35 extern kmem_cache_t *ldlm_resource_slab;
36 extern kmem_cache_t *ldlm_lock_slab;
37 extern struct list_head ldlm_namespace_list;
38 extern int (*mds_reint_p)(int offset, struct ptlrpc_request *req);
39 extern int (*mds_getattr_name_p)(int offset, struct ptlrpc_request *req);
40
41 inline unsigned long round_timeout(unsigned long timeout)
42 {
43         return ((timeout / HZ) + 1) * HZ;
44 }
45
46 static struct list_head waiting_locks_list;
47 static spinlock_t waiting_locks_spinlock;
48 static struct timer_list waiting_locks_timer;
49 static int ldlm_already_setup = 0;
50
51 static void waiting_locks_callback(unsigned long unused)
52 {
53         struct list_head *liter, *n;
54
55         spin_lock_bh(&waiting_locks_spinlock);
56         list_for_each_safe(liter, n, &waiting_locks_list) {
57                 struct ldlm_lock *l = list_entry(liter, struct ldlm_lock,
58                                                  l_pending_chain);
59                 if (l->l_callback_timeout > jiffies)
60                         break;
61                 LDLM_DEBUG(l, "timer expired, recovering exp %p on conn %p",
62                            l->l_export, l->l_export->exp_connection);
63                 recovd_conn_fail(l->l_export->exp_connection);
64         }
65         spin_unlock_bh(&waiting_locks_spinlock);
66 }
67
68 /*
69  * Indicate that we're waiting for a client to call us back cancelling a given
70  * lock.  We add it to the pending-callback chain, and schedule the lock-timeout
71  * timer to fire appropriately.  (We round up to the next second, to avoid
72  * floods of timer firings during periods of high lock contention and traffic).
73  */
74 static int ldlm_add_waiting_lock(struct ldlm_lock *lock)
75 {
76         unsigned long timeout_rounded;
77         ENTRY;
78
79         LASSERT(list_empty(&lock->l_pending_chain));
80
81         spin_lock_bh(&waiting_locks_spinlock);
82         lock->l_callback_timeout = jiffies + (obd_timeout * HZ);
83
84         timeout_rounded = round_timeout(lock->l_callback_timeout);
85
86         if (timeout_rounded < waiting_locks_timer.expires ||
87             !timer_pending(&waiting_locks_timer)) {
88                 mod_timer(&waiting_locks_timer, timeout_rounded);
89         }
90         list_add_tail(&lock->l_pending_chain, &waiting_locks_list); /* FIFO */
91         spin_unlock_bh(&waiting_locks_spinlock);
92         RETURN(1);
93 }
94
95 /*
96  * Remove a lock from the pending list, likely because it had its cancellation
97  * callback arrive without incident.  This adjusts the lock-timeout timer if
98  * needed.  Returns 0 if the lock wasn't pending after all, 1 if it was.
99  */
100 int ldlm_del_waiting_lock(struct ldlm_lock *lock)
101 {
102         struct list_head *list_next;
103
104         ENTRY;
105
106         spin_lock_bh(&waiting_locks_spinlock);
107
108         if (list_empty(&lock->l_pending_chain)) {
109                 spin_unlock_bh(&waiting_locks_spinlock);
110                 RETURN(0);
111         }
112
113         list_next = lock->l_pending_chain.next;
114         if (lock->l_pending_chain.prev == &waiting_locks_list) {
115                 /* Removing the head of the list, adjust timer. */
116                 if (list_next == &waiting_locks_list) {
117                         /* No more, just cancel. */
118                         del_timer(&waiting_locks_timer);
119                 } else {
120                         struct ldlm_lock *next;
121                         next = list_entry(list_next, struct ldlm_lock,
122                                           l_pending_chain);
123                         mod_timer(&waiting_locks_timer,
124                                   round_timeout(next->l_callback_timeout));
125                 }
126         }
127         list_del_init(&lock->l_pending_chain);
128         spin_unlock_bh(&waiting_locks_spinlock);
129         RETURN(1);
130 }
131
132 static int ldlm_server_blocking_ast(struct ldlm_lock *lock,
133                                     struct ldlm_lock_desc *desc,
134                                     void *data, __u32 data_len, int flag)
135 {
136         struct ldlm_request *body;
137         struct ptlrpc_request *req;
138         int rc = 0, size = sizeof(*body);
139         ENTRY;
140
141         if (flag == LDLM_CB_CANCELING) {
142                 /* Don't need to do anything here. */
143                 RETURN(0);
144         }
145
146         req = ptlrpc_prep_req(&lock->l_export->exp_ldlm_data.led_import,
147                               LDLM_BL_CALLBACK, 1, &size, NULL);
148         if (!req)
149                 RETURN(-ENOMEM);
150
151         body = lustre_msg_buf(req->rq_reqmsg, 0);
152         memcpy(&body->lock_handle1, &lock->l_remote_handle,
153                sizeof(body->lock_handle1));
154         memcpy(&body->lock_desc, desc, sizeof(*desc));
155
156         LDLM_DEBUG(lock, "server preparing blocking AST");
157         req->rq_replen = 0; /* no reply needed */
158
159         ldlm_add_waiting_lock(lock);
160         (void)ptl_send_rpc(req);
161
162         /* no commit, and no waiting for reply, so 2x decref now */
163         ptlrpc_req_finished(req);
164         ptlrpc_req_finished(req);
165
166         RETURN(rc);
167 }
168
169 static int ldlm_server_completion_ast(struct ldlm_lock *lock, int flags)
170 {
171         struct ldlm_request *body;
172         struct ptlrpc_request *req;
173         int rc = 0, size = sizeof(*body);
174         ENTRY;
175
176         if (lock == NULL) {
177                 LBUG();
178                 RETURN(-EINVAL);
179         }
180
181         req = ptlrpc_prep_req(&lock->l_export->exp_ldlm_data.led_import,
182                               LDLM_CP_CALLBACK, 1, &size, NULL);
183         if (!req)
184                 RETURN(-ENOMEM);
185
186         body = lustre_msg_buf(req->rq_reqmsg, 0);
187         memcpy(&body->lock_handle1, &lock->l_remote_handle,
188                sizeof(body->lock_handle1));
189         body->lock_flags = flags;
190         ldlm_lock2desc(lock, &body->lock_desc);
191
192         LDLM_DEBUG(lock, "server preparing completion AST");
193         req->rq_replen = 0; /* no reply needed */
194
195         (void)ptl_send_rpc(req);
196         /* no commit, and no waiting for reply, so 2x decref now */
197         ptlrpc_req_finished(req);
198         ptlrpc_req_finished(req);
199
200         RETURN(rc);
201 }
202
203 int ldlm_handle_enqueue(struct ptlrpc_request *req)
204 {
205         struct obd_device *obddev = req->rq_export->exp_obd;
206         struct ldlm_reply *dlm_rep;
207         struct ldlm_request *dlm_req;
208         int rc, size = sizeof(*dlm_rep), cookielen = 0;
209         __u32 flags;
210         ldlm_error_t err;
211         struct ldlm_lock *lock = NULL;
212         void *cookie = NULL;
213         ENTRY;
214
215         LDLM_DEBUG_NOLOCK("server-side enqueue handler START");
216
217         dlm_req = lustre_msg_buf(req->rq_reqmsg, 0);
218         flags = dlm_req->lock_flags;
219         if (dlm_req->lock_desc.l_resource.lr_type == LDLM_PLAIN &&
220             (flags & LDLM_FL_HAS_INTENT)) {
221                 /* In this case, the reply buffer is allocated deep in
222                  * local_lock_enqueue by the policy function. */
223                 cookie = req;
224                 cookielen = sizeof(*req);
225         } else {
226                 rc = lustre_pack_msg(1, &size, NULL, &req->rq_replen,
227                                      &req->rq_repmsg);
228                 if (rc) {
229                         CERROR("out of memory\n");
230                         RETURN(-ENOMEM);
231                 }
232                 if (dlm_req->lock_desc.l_resource.lr_type == LDLM_EXTENT) {
233                         cookie = &dlm_req->lock_desc.l_extent;
234                         cookielen = sizeof(struct ldlm_extent);
235                 }
236         }
237
238         /* XXX notice that this lock has no callback data: of course the
239            export would be exactly what we may want to use here... */
240         lock = ldlm_lock_create(obddev->obd_namespace,
241                                 &dlm_req->lock_handle2,
242                                 dlm_req->lock_desc.l_resource.lr_name,
243                                 dlm_req->lock_desc.l_resource.lr_type,
244                                 dlm_req->lock_desc.l_req_mode, NULL, 0);
245         if (!lock)
246                 GOTO(out, err = -ENOMEM);
247
248         memcpy(&lock->l_remote_handle, &dlm_req->lock_handle1,
249                sizeof(lock->l_remote_handle));
250         LDLM_DEBUG(lock, "server-side enqueue handler, new lock created");
251
252         err = ldlm_lock_enqueue(lock, cookie, cookielen, &flags,
253                                 ldlm_server_completion_ast,
254                                 ldlm_server_blocking_ast);
255         if (err != ELDLM_OK)
256                 GOTO(out, err);
257
258         dlm_rep = lustre_msg_buf(req->rq_repmsg, 0);
259         dlm_rep->lock_flags = flags;
260
261         ldlm_lock2handle(lock, &dlm_rep->lock_handle);
262         if (dlm_req->lock_desc.l_resource.lr_type == LDLM_EXTENT)
263                 memcpy(&dlm_rep->lock_extent, &lock->l_extent,
264                        sizeof(lock->l_extent));
265         if (dlm_rep->lock_flags & LDLM_FL_LOCK_CHANGED) {
266                 memcpy(dlm_rep->lock_resource_name, lock->l_resource->lr_name,
267                        sizeof(dlm_rep->lock_resource_name));
268                 dlm_rep->lock_mode = lock->l_req_mode;
269         }
270
271         lock->l_export = req->rq_export;
272         if (lock->l_export) {
273                 l_lock(&lock->l_resource->lr_namespace->ns_lock);
274                 list_add(&lock->l_export_chain,
275                          &lock->l_export->exp_ldlm_data.led_held_locks);
276                 l_unlock(&lock->l_resource->lr_namespace->ns_lock);
277         }
278
279         EXIT;
280  out:
281         if (lock)
282                 LDLM_DEBUG(lock, "server-side enqueue handler, sending reply"
283                            "(err=%d)", err);
284         req->rq_status = err;
285
286         if (ptlrpc_reply(req->rq_svc, req))
287                 LBUG();
288
289         if (lock) {
290                 if (!err)
291                         ldlm_reprocess_all(lock->l_resource);
292                 LDLM_LOCK_PUT(lock);
293         }
294         LDLM_DEBUG_NOLOCK("server-side enqueue handler END (lock %p)", lock);
295
296         return 0;
297 }
298
299 int ldlm_handle_convert(struct ptlrpc_request *req)
300 {
301         struct ldlm_request *dlm_req;
302         struct ldlm_reply *dlm_rep;
303         struct ldlm_lock *lock;
304         int rc, size = sizeof(*dlm_rep);
305         ENTRY;
306
307         rc = lustre_pack_msg(1, &size, NULL, &req->rq_replen, &req->rq_repmsg);
308         if (rc) {
309                 CERROR("out of memory\n");
310                 RETURN(-ENOMEM);
311         }
312         dlm_req = lustre_msg_buf(req->rq_reqmsg, 0);
313         dlm_rep = lustre_msg_buf(req->rq_repmsg, 0);
314         dlm_rep->lock_flags = dlm_req->lock_flags;
315
316         lock = ldlm_handle2lock(&dlm_req->lock_handle1);
317         if (!lock) {
318                 req->rq_status = EINVAL;
319         } else {
320                 LDLM_DEBUG(lock, "server-side convert handler START");
321                 ldlm_lock_convert(lock, dlm_req->lock_desc.l_req_mode,
322                                   &dlm_rep->lock_flags);
323                 if (ldlm_del_waiting_lock(lock))
324                         CDEBUG(D_DLMTRACE, "converted waiting lock %p\n", lock);
325                 req->rq_status = 0;
326         }
327         if (ptlrpc_reply(req->rq_svc, req) != 0)
328                 LBUG();
329
330         if (lock) {
331                 ldlm_reprocess_all(lock->l_resource);
332                 LDLM_DEBUG(lock, "server-side convert handler END");
333                 LDLM_LOCK_PUT(lock);
334         } else
335                 LDLM_DEBUG_NOLOCK("server-side convert handler END");
336
337         RETURN(0);
338 }
339
340 int ldlm_handle_cancel(struct ptlrpc_request *req)
341 {
342         struct ldlm_request *dlm_req;
343         struct ldlm_lock *lock;
344         int rc;
345         ENTRY;
346
347         rc = lustre_pack_msg(0, NULL, NULL, &req->rq_replen, &req->rq_repmsg);
348         if (rc) {
349                 CERROR("out of memory\n");
350                 RETURN(-ENOMEM);
351         }
352         dlm_req = lustre_msg_buf(req->rq_reqmsg, 0);
353         if (!dlm_req) {
354                 CERROR("bad request buffer for cancel\n");
355                 RETURN(-EINVAL);
356         }
357
358         lock = ldlm_handle2lock(&dlm_req->lock_handle1);
359         if (!lock) {
360                 CERROR("bad lock handle\n");
361                 LDLM_DEBUG_NOLOCK("server-side cancel handler stale lock (lock "
362                                   "%p)", (void *)(unsigned long)
363                                   dlm_req->lock_handle1.addr);
364                 req->rq_status = ESTALE;
365         } else {
366                 LDLM_DEBUG(lock, "server-side cancel handler START");
367                 ldlm_lock_cancel(lock);
368                 if (ldlm_del_waiting_lock(lock))
369                         CDEBUG(D_DLMTRACE, "cancelled waiting lock %p\n", lock);
370                 req->rq_status = 0;
371         }
372
373         if (ptlrpc_reply(req->rq_svc, req) != 0)
374                 LBUG();
375
376         if (lock) {
377                 ldlm_reprocess_all(lock->l_resource);
378                 LDLM_DEBUG(lock, "server-side cancel handler END");
379                 LDLM_LOCK_PUT(lock);
380         }
381
382         RETURN(0);
383 }
384
385 static int ldlm_handle_bl_callback(struct ptlrpc_request *req)
386 {
387         struct ldlm_request *dlm_req;
388         struct ldlm_lock *lock;
389         int do_ast;
390         ENTRY;
391
392         OBD_FAIL_RETURN(OBD_FAIL_OSC_LOCK_BL_AST, 0);
393
394         dlm_req = lustre_msg_buf(req->rq_reqmsg, 0);
395
396         lock = ldlm_handle2lock(&dlm_req->lock_handle1);
397         if (!lock) {
398                 CERROR("blocking callback on lock "LPX64" - lock disappeared\n",
399                        dlm_req->lock_handle1.addr);
400                 RETURN(0);
401         }
402
403         LDLM_DEBUG(lock, "client blocking AST callback handler START");
404
405         l_lock(&lock->l_resource->lr_namespace->ns_lock);
406         lock->l_flags |= LDLM_FL_CBPENDING;
407         do_ast = (!lock->l_readers && !lock->l_writers);
408         l_unlock(&lock->l_resource->lr_namespace->ns_lock);
409
410         if (do_ast) {
411                 LDLM_DEBUG(lock, "already unused, calling "
412                            "callback (%p)", lock->l_blocking_ast);
413                 if (lock->l_blocking_ast != NULL) {
414                         lock->l_blocking_ast(lock, &dlm_req->lock_desc,
415                                              lock->l_data, lock->l_data_len,
416                                              LDLM_CB_BLOCKING);
417                 }
418         } else
419                 LDLM_DEBUG(lock, "Lock still has references, will be"
420                            " cancelled later");
421
422         LDLM_DEBUG(lock, "client blocking callback handler END");
423         LDLM_LOCK_PUT(lock);
424         RETURN(0);
425 }
426
427 static int ldlm_handle_cp_callback(struct ptlrpc_request *req)
428 {
429         struct list_head ast_list = LIST_HEAD_INIT(ast_list);
430         struct ldlm_request *dlm_req;
431         struct ldlm_lock *lock;
432         ENTRY;
433
434         OBD_FAIL_RETURN(OBD_FAIL_OSC_LOCK_CP_AST, 0);
435
436         dlm_req = lustre_msg_buf(req->rq_reqmsg, 0);
437
438         lock = ldlm_handle2lock(&dlm_req->lock_handle1);
439         if (!lock) {
440                 CERROR("completion callback on lock "LPX64" - lock "
441                        "disappeared\n", dlm_req->lock_handle1.addr);
442                 RETURN(0);
443         }
444
445         LDLM_DEBUG(lock, "client completion callback handler START");
446
447         l_lock(&lock->l_resource->lr_namespace->ns_lock);
448
449         /* If we receive the completion AST before the actual enqueue returned,
450          * then we might need to switch lock modes, resources, or extents. */
451         if (dlm_req->lock_desc.l_granted_mode != lock->l_req_mode) {
452                 lock->l_req_mode = dlm_req->lock_desc.l_granted_mode;
453                 LDLM_DEBUG(lock, "completion AST, new lock mode");
454         }
455         if (lock->l_resource->lr_type == LDLM_EXTENT)
456                 memcpy(&lock->l_extent, &dlm_req->lock_desc.l_extent,
457                        sizeof(lock->l_extent));
458         ldlm_resource_unlink_lock(lock);
459         if (memcmp(dlm_req->lock_desc.l_resource.lr_name,
460                    lock->l_resource->lr_name,
461                    sizeof(__u64) * RES_NAME_SIZE) != 0) {
462                 ldlm_lock_change_resource(lock, dlm_req->lock_desc.l_resource.lr_name);
463                 LDLM_DEBUG(lock, "completion AST, new resource");
464         }
465         lock->l_resource->lr_tmp = &ast_list;
466         ldlm_grant_lock(lock);
467         lock->l_resource->lr_tmp = NULL;
468         l_unlock(&lock->l_resource->lr_namespace->ns_lock);
469         LDLM_DEBUG(lock, "callback handler finished, about to run_ast_work");
470         LDLM_LOCK_PUT(lock);
471
472         ldlm_run_ast_work(&ast_list);
473
474         LDLM_DEBUG_NOLOCK("client completion callback handler END (lock %p)",
475                           lock);
476         RETURN(0);
477 }
478
479 static int ldlm_callback_handler(struct ptlrpc_request *req)
480 {
481         int rc;
482         ENTRY;
483
484         rc = lustre_unpack_msg(req->rq_reqmsg, req->rq_reqlen);
485         if (rc) {
486                 CERROR("lustre_ldlm: Invalid request: %d\n", rc);
487                 RETURN(rc);
488         }
489
490         if (req->rq_export == NULL) {
491                 CERROR("lustre_dlm: operation %d with missing/invalid export\n",
492                        req->rq_reqmsg->opc);
493                 RETURN(-ENOTCONN);
494         }
495
496         switch (req->rq_reqmsg->opc) {
497         case LDLM_BL_CALLBACK:
498                 CDEBUG(D_INODE, "blocking ast\n");
499                 OBD_FAIL_RETURN(OBD_FAIL_LDLM_BL_CALLBACK, 0);
500                 rc = ldlm_handle_bl_callback(req);
501                 RETURN(rc);
502         case LDLM_CP_CALLBACK:
503                 CDEBUG(D_INODE, "completion ast\n");
504                 OBD_FAIL_RETURN(OBD_FAIL_LDLM_CP_CALLBACK, 0);
505                 rc = ldlm_handle_cp_callback(req);
506                 RETURN(rc);
507
508         default:
509                 CERROR("invalid opcode %d\n", req->rq_reqmsg->opc);
510                 RETURN(-EINVAL);
511         }
512
513         RETURN(0);
514 }
515
516
517 static int ldlm_cancel_handler(struct ptlrpc_request *req)
518 {
519         int rc;
520         ENTRY;
521
522         rc = lustre_unpack_msg(req->rq_reqmsg, req->rq_reqlen);
523         if (rc) {
524                 CERROR("lustre_ldlm: Invalid request: %d\n", rc);
525                 RETURN(rc);
526         }
527
528         if (req->rq_export == NULL) {
529                 CERROR("lustre_dlm: operation %d with missing/invalid export\n",
530                        req->rq_reqmsg->opc);
531                 RETURN(-ENOTCONN);
532         }
533
534         switch (req->rq_reqmsg->opc) {
535  
536         /* XXX FIXME move this back to mds/handler.c, bug 625069 */
537         case LDLM_CANCEL:
538                 CDEBUG(D_INODE, "cancel\n");
539                 OBD_FAIL_RETURN(OBD_FAIL_LDLM_CANCEL, 0);
540                 rc = ldlm_handle_cancel(req);
541                 if (rc)
542                         break;
543                 RETURN(0);
544
545         default:
546                 CERROR("invalid opcode %d\n", req->rq_reqmsg->opc);
547                 RETURN(-EINVAL);
548         }
549
550         RETURN(0);
551 }
552
553
554 static int ldlm_iocontrol(long cmd, struct lustre_handle *conn, int len,
555                           void *karg, void *uarg)
556 {
557         struct obd_device *obddev = class_conn2obd(conn);
558         struct ptlrpc_connection *connection;
559         int err = 0;
560         ENTRY;
561
562         if (_IOC_TYPE(cmd) != IOC_LDLM_TYPE || _IOC_NR(cmd) < IOC_LDLM_MIN_NR ||
563             _IOC_NR(cmd) > IOC_LDLM_MAX_NR) {
564                 CDEBUG(D_IOCTL, "invalid ioctl (type %ld, nr %ld, size %ld)\n",
565                        _IOC_TYPE(cmd), _IOC_NR(cmd), _IOC_SIZE(cmd));
566                 RETURN(-EINVAL);
567         }
568
569         OBD_ALLOC(obddev->u.ldlm.ldlm_client,
570                   sizeof(*obddev->u.ldlm.ldlm_client));
571         connection = ptlrpc_uuid_to_connection("ldlm");
572         if (!connection)
573                 CERROR("No LDLM UUID found: assuming ldlm is local.\n");
574
575         switch (cmd) {
576         case IOC_LDLM_TEST:
577                 err = ldlm_test(obddev, conn);
578                 CERROR("-- done err %d\n", err);
579                 GOTO(out, err);
580         case IOC_LDLM_DUMP:
581                 ldlm_dump_all_namespaces();
582                 GOTO(out, err);
583         default:
584                 GOTO(out, err = -EINVAL);
585         }
586
587  out:
588         if (connection)
589                 ptlrpc_put_connection(connection);
590         OBD_FREE(obddev->u.ldlm.ldlm_client,
591                  sizeof(*obddev->u.ldlm.ldlm_client));
592         return err;
593 }
594
595 #define LDLM_NUM_THREADS        4
596
597 static int ldlm_setup(struct obd_device *obddev, obd_count len, void *buf)
598 {
599         struct ldlm_obd *ldlm = &obddev->u.ldlm;
600         int rc, i;
601         ENTRY;
602
603         if (ldlm_already_setup)
604                 RETURN(-EALREADY);
605
606         MOD_INC_USE_COUNT;
607         /*
608         rc = ldlm_proc_setup(obddev);
609         if (rc != 0)
610                 GOTO(out_dec, rc);
611         */
612         ldlm->ldlm_cb_service =
613                 ptlrpc_init_svc(LDLM_NEVENTS, LDLM_NBUFS, LDLM_BUFSIZE,
614                                 LDLM_MAXREQSIZE, LDLM_CB_REQUEST_PORTAL,
615                                 LDLM_CB_REPLY_PORTAL, "self",
616                                 ldlm_callback_handler, "ldlm_cbd");
617
618         if (!ldlm->ldlm_cb_service)
619                 GOTO(out_dec, rc = -ENOMEM);
620
621         ldlm->ldlm_cancel_service =
622                 ptlrpc_init_svc(LDLM_NEVENTS, LDLM_NBUFS, LDLM_BUFSIZE,
623                                 LDLM_MAXREQSIZE, 
624                                 LDLM_CANCEL_REQUEST_PORTAL,
625                                 LDLM_CANCEL_REPLY_PORTAL, "self",
626                                 ldlm_cancel_handler, "ldlm_canceld");
627
628         if (!ldlm->ldlm_cancel_service)
629                 GOTO(out_dec, rc = -ENOMEM);
630
631         for (i = 0; i < LDLM_NUM_THREADS; i++) {
632                 char name[32];
633                 sprintf(name, "lustre_dlm_%02d", i);
634                 rc = ptlrpc_start_thread(obddev, ldlm->ldlm_cancel_service, name);
635                 if (rc) {
636                         CERROR("cannot start LDLM thread #%d: rc %d\n", i, rc);
637                         LBUG();
638                         GOTO(out_thread, rc);
639                 }
640         }
641
642         for (i = 0; i < LDLM_NUM_THREADS; i++) {
643                 char name[32];
644                 sprintf(name, "lustre_dlm_%02d", i);
645                 rc = ptlrpc_start_thread(obddev, ldlm->ldlm_cb_service, name);
646                 if (rc) {
647                         CERROR("cannot start LDLM thread #%d: rc %d\n", i, rc);
648                         LBUG();
649                         GOTO(out_thread, rc);
650                 }
651         }
652
653         INIT_LIST_HEAD(&waiting_locks_list);
654         spin_lock_init(&waiting_locks_spinlock);
655         waiting_locks_timer.function = waiting_locks_callback;
656         waiting_locks_timer.data = 0;
657         init_timer(&waiting_locks_timer);
658
659         ldlm_already_setup = 1;
660
661         RETURN(0);
662
663  out_thread:
664         ptlrpc_stop_all_threads(ldlm->ldlm_cancel_service);
665         ptlrpc_unregister_service(ldlm->ldlm_cancel_service);
666         ptlrpc_stop_all_threads(ldlm->ldlm_cb_service);
667         ptlrpc_unregister_service(ldlm->ldlm_cb_service);
668         /*
669  out_proc:
670
671          ldlm_proc_cleanup(obddev);
672         */
673  out_dec:
674         MOD_DEC_USE_COUNT;
675         return rc;
676 }
677
678 static int ldlm_cleanup(struct obd_device *obddev)
679 {
680         struct ldlm_obd *ldlm = &obddev->u.ldlm;
681         ENTRY;
682
683         if (!list_empty(&ldlm_namespace_list)) {
684                 CERROR("ldlm still has namespaces; clean these up first.\n");
685                 RETURN(-EBUSY);
686         }
687
688         ptlrpc_stop_all_threads(ldlm->ldlm_cb_service);
689         ptlrpc_unregister_service(ldlm->ldlm_cb_service);
690         ptlrpc_stop_all_threads(ldlm->ldlm_cancel_service);
691         ptlrpc_unregister_service(ldlm->ldlm_cancel_service);
692         /* ldlm_proc_cleanup(obddev); */
693
694         ldlm_already_setup = 0;
695         MOD_DEC_USE_COUNT;
696         RETURN(0);
697 }
698
699 static int ldlm_connect(struct lustre_handle *conn, struct obd_device *src,
700                         obd_uuid_t cluuid, struct recovd_obd *recovd,
701                         ptlrpc_recovery_cb_t recover)
702 {
703         return class_connect(conn, src, cluuid);
704 }
705
706 struct obd_ops ldlm_obd_ops = {
707         o_iocontrol:   ldlm_iocontrol,
708         o_setup:       ldlm_setup,
709         o_cleanup:     ldlm_cleanup,
710         o_connect:     ldlm_connect,
711         o_disconnect:  class_disconnect
712 };
713
714 static int __init ldlm_init(void)
715 {
716         int rc = class_register_type(&ldlm_obd_ops, 0, OBD_LDLM_DEVICENAME);
717         if (rc != 0)
718                 return rc;
719
720         ldlm_resource_slab = kmem_cache_create("ldlm_resources",
721                                                sizeof(struct ldlm_resource), 0,
722                                                SLAB_HWCACHE_ALIGN, NULL, NULL);
723         if (ldlm_resource_slab == NULL)
724                 return -ENOMEM;
725
726         ldlm_lock_slab = kmem_cache_create("ldlm_locks",
727                                            sizeof(struct ldlm_lock), 0,
728                                            SLAB_HWCACHE_ALIGN, NULL, NULL);
729         if (ldlm_lock_slab == NULL) {
730                 kmem_cache_destroy(ldlm_resource_slab);
731                 return -ENOMEM;
732         }
733
734         return 0;
735 }
736
737 static void __exit ldlm_exit(void)
738 {
739         class_unregister_type(OBD_LDLM_DEVICENAME);
740         if (kmem_cache_destroy(ldlm_resource_slab) != 0)
741                 CERROR("couldn't free ldlm resource slab\n");
742         if (kmem_cache_destroy(ldlm_lock_slab) != 0)
743                 CERROR("couldn't free ldlm lock slab\n");
744 }
745
746 EXPORT_SYMBOL(ldlm_completion_ast);
747 EXPORT_SYMBOL(ldlm_handle_enqueue);
748 EXPORT_SYMBOL(ldlm_handle_cancel);
749 EXPORT_SYMBOL(ldlm_handle_convert);
750 EXPORT_SYMBOL(ldlm_register_intent);
751 EXPORT_SYMBOL(ldlm_unregister_intent);
752 EXPORT_SYMBOL(ldlm_lockname);
753 EXPORT_SYMBOL(ldlm_typename);
754 EXPORT_SYMBOL(ldlm_handle2lock);
755 EXPORT_SYMBOL(ldlm_lock2handle);
756 EXPORT_SYMBOL(ldlm_lock_put);
757 EXPORT_SYMBOL(ldlm_lock_match);
758 EXPORT_SYMBOL(ldlm_lock_addref);
759 EXPORT_SYMBOL(ldlm_lock_decref);
760 EXPORT_SYMBOL(ldlm_lock_change_resource);
761 EXPORT_SYMBOL(ldlm_lock_set_data);
762 EXPORT_SYMBOL(ldlm_cli_convert);
763 EXPORT_SYMBOL(ldlm_cli_enqueue);
764 EXPORT_SYMBOL(ldlm_cli_cancel);
765 EXPORT_SYMBOL(ldlm_cli_cancel_unused);
766 EXPORT_SYMBOL(ldlm_match_or_enqueue);
767 EXPORT_SYMBOL(ldlm_it2str);
768 EXPORT_SYMBOL(ldlm_test);
769 EXPORT_SYMBOL(ldlm_regression_start);
770 EXPORT_SYMBOL(ldlm_regression_stop);
771 EXPORT_SYMBOL(ldlm_lock_dump);
772 EXPORT_SYMBOL(ldlm_namespace_new);
773 EXPORT_SYMBOL(ldlm_namespace_cleanup);
774 EXPORT_SYMBOL(ldlm_namespace_free);
775 EXPORT_SYMBOL(ldlm_namespace_dump);
776 EXPORT_SYMBOL(ldlm_cancel_locks_for_export);
777 EXPORT_SYMBOL(l_lock);
778 EXPORT_SYMBOL(l_unlock);
779
780 MODULE_AUTHOR("Cluster File Systems, Inc. <info@clusterfs.com>");
781 MODULE_DESCRIPTION("Lustre Lock Management Module v0.1");
782 MODULE_LICENSE("GPL");
783
784 module_init(ldlm_init);
785 module_exit(ldlm_exit);