1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
4 * Copyright (C) 2002, 2003 Cluster File Systems, Inc.
6 * This file is part of Lustre, http://www.lustre.org.
8 * Lustre is free software; you can redistribute it and/or
9 * modify it under the terms of version 2 of the GNU General Public
10 * License as published by the Free Software Foundation.
12 * Lustre is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 * GNU General Public License for more details.
17 * You should have received a copy of the GNU General Public License
18 * along with Lustre; if not, write to the Free Software
 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */
27 #include <linux/version.h>
28 #if (LINUX_VERSION_CODE < KERNEL_VERSION(2,5,0))
29 #include <linux/tqueue.h>
31 #include <linux/workqueue.h>
35 #include <libcfs/kp30.h>
36 // #include <linux/obd.h>
37 #include <portals/p30.h>
38 #include <linux/lustre_idl.h>
39 #include <linux/lustre_ha.h>
40 #include <linux/lustre_import.h>
41 #include <linux/lprocfs_status.h>
42 #include <linux/lustre_compat25.h>
/* MD flags we _always_ use: the two option bits below are OR-ed together
 * into a single mask. */
#define PTLRPC_MD_OPTIONS  (PTL_MD_EVENT_START_DISABLE | \
                            PTL_MD_LUSTRE_COMPLETION_SEMANTICS)
/* Define some large-ish maxima for bulk I/O.
 * CAVEAT EMPTOR, with multinet (i.e. gateways forwarding between networks)
 * these limits are system wide and not interface-local. */
#define PTLRPC_MAX_BRW_SIZE     (1 << 20)  /* compared against PAGES * PAGE_SIZE */
#define PTLRPC_MAX_BRW_PAGES    512        /* must stay a power of two */
54 /* ...reduce to fit... */
57 /* include a cray header here if relevant
58 * NB liblustre SIZE/PAGES is affected too, but it merges contiguous
59 * chunks, so FTTB, it always used contiguous MDs */
61 # include <portals/lib-types.h>
64 #if (defined(PTL_MTU) && (PTL_MTU < PTLRPC_MAX_BRW_SIZE))
65 # undef PTLRPC_MAX_BRW_SIZE
66 # define PTLRPC_MAX_BRW_SIZE PTL_MTU
68 #if (defined(PTL_MD_MAX_IOV) && (PTL_MD_MAX_IOV < PTLRPC_MAX_BRW_PAGES ))
69 # undef PTLRPC_MAX_BRW_PAGES
70 # define PTLRPC_MAX_BRW_PAGES PTL_MD_MAX_IOV
73 /* ...and make consistent... */
75 #if (PTLRPC_MAX_BRW_SIZE > PTLRPC_MAX_BRW_PAGES * PAGE_SIZE)
76 # undef PTLRPC_MAX_BRW_SIZE
77 # define PTLRPC_MAX_BRW_SIZE (PTLRPC_MAX_BRW_PAGES * PAGE_SIZE)
79 # undef PTLRPC_MAX_BRW_PAGES
80 # define PTLRPC_MAX_BRW_PAGES (PTLRPC_MAX_BRW_SIZE / PAGE_SIZE)
83 #if ((PTLRPC_MAX_BRW_PAGES & (PTLRPC_MAX_BRW_PAGES - 1)) != 0)
84 #error "PTLRPC_MAX_BRW_PAGES isn't a power of two"
/* Size over which to OBD_VMALLOC() rather than OBD_ALLOC() service request
 * buffers */
#define SVC_BUF_VMALLOC_THRESHOLD (2 * PAGE_SIZE)
/* The following constants determine how memory is used to buffer incoming
 * service requests.
 *
 * ?_NBUFS              # buffers to allocate when growing the pool
 * ?_BUFSIZE            # bytes in a single request buffer
 * ?_MAXREQSIZE         # maximum request service will receive
 *
 * When fewer than ?_NBUFS/2 buffers are posted for receive, another chunk
 * of ?_NBUFS is added to the pool.
 *
 * Messages larger than ?_MAXREQSIZE are dropped.  Request buffers are
 * considered full when less than ?_MAXREQSIZE is left in them.
 */

#define LDLM_NUM_THREADS min(smp_num_cpus * smp_num_cpus * 8, 64)
#define LDLM_NBUFS       64
#define LDLM_BUFSIZE     (8 * 1024)
#define LDLM_MAXREQSIZE  (5 * 1024)

#define MDT_MAX_THREADS 32UL
#define MDT_NUM_THREADS max(min_t(unsigned long, num_physpages / 8192, \
                                  MDT_MAX_THREADS), 2UL)
#define MDS_NBUFS       (64 * smp_num_cpus)
#define MDS_BUFSIZE     (8 * 1024)
/* Assume file name length = FNAME_MAX = 256 (true for extN).
 *        path name length = PATH_MAX = 4096
 *        LOV MD size max  = EA_MAX = 4000
 * symlink:  FNAME_MAX + PATH_MAX  <- largest
 * link:     FNAME_MAX + PATH_MAX  (mds_rec_link < mds_rec_create)
 * rename:   FNAME_MAX + FNAME_MAX
 * open:     FNAME_MAX + EA_MAX
 *
 * MDS_MAXREQSIZE ~= 4736 bytes =
 * lustre_msg + ldlm_request + mds_body + mds_rec_create + FNAME_MAX + PATH_MAX
 *
 * Realistic size is about 512 bytes (20 character name + 128 char symlink),
 * except in the open case where there are a large number of OSTs in a LOV.
 */
#define MDS_MAXREQSIZE  (5 * 1024)

#define OST_MAX_THREADS 36UL
#define OST_NUM_THREADS max(min_t(unsigned long, num_physpages / 8192, \
                                  OST_MAX_THREADS), 2UL)
#define OST_NBUFS       (64 * smp_num_cpus)
#define OST_BUFSIZE     (8 * 1024)
/* OST_MAXREQSIZE ~= 1640 bytes =
 * lustre_msg + obdo + 16 * obd_ioobj + 64 * niobuf_remote
 *
 * - single object with 16 pages is 512 bytes
 * - OST_MAXREQSIZE must be at least 1 page of cookies plus some spillover
 */
#define OST_MAXREQSIZE  (5 * 1024)

#define PTLBD_NUM_THREADS        4
#define PTLBD_NBUFS             64
#define PTLBD_BUFSIZE           (32 * 1024)
#define PTLBD_MAXREQSIZE        1024
/* Members of struct ptlrpc_peer (the type ptlrpc_peernid2str() and
 * ptlrpc_id2str() take): peer_id carries the nid, peer_ni supplies the
 * interface number used when formatting it.
 * NOTE(review): the struct opener and closing brace are not visible in
 * this view -- confirm against the complete header. */
150 ptl_process_id_t peer_id;
151 struct ptlrpc_ni *peer_ni;
/* A connection record: list linkage, the peer it refers to and the remote
 * UUID (the one DEBUG_REQ prints via imp_connection->c_remote_uuid).
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
154 struct ptlrpc_connection {
155 struct list_head c_link;
156 struct ptlrpc_peer c_peer;
157 struct obd_uuid c_remote_uuid;
/* Client-side portal pair: where requests are sent and where replies are
 * expected.  DEBUG_REQ reads cli_request_portal through imp_client.
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
161 struct ptlrpc_client {
162 __u32 cli_request_portal;
163 __u32 cli_reply_portal;
/* state flags of requests */
/* XXX only ones left are those used by the bulk descs as well! */
#define PTL_RPC_FL_INTR      (1 << 0)  /* reply wait was interrupted by user */
#define PTL_RPC_FL_TIMEOUT   (1 << 7)  /* request timed out waiting for reply */

#define REQ_MAX_ACK_LOCKS 8
/* Compile-time switch: when non-zero the macros below track, one bit per
 * message buffer index, which buffers have been byte-swapped and assert on
 * misuse; when zero they expand to nothing. */
#define SWAB_PARANOIA 1

#if SWAB_PARANOIA
/* unpacking: assert idx not unpacked already, then record it.
 * The mask is 32 bits wide, so the bit is built from 1U: shifting a signed
 * 1 into bit 31 would be undefined behaviour. */
#define LASSERT_REQSWAB(rq, idx)                                        \
do {                                                                    \
        LASSERT((idx) < sizeof((rq)->rq_req_swab_mask) * 8);            \
        LASSERT(((rq)->rq_req_swab_mask & (1U << (idx))) == 0);         \
        (rq)->rq_req_swab_mask |= (1U << (idx));                        \
} while (0)

#define LASSERT_REPSWAB(rq, idx)                                        \
do {                                                                    \
        LASSERT((idx) < sizeof((rq)->rq_rep_swab_mask) * 8);            \
        LASSERT(((rq)->rq_rep_swab_mask & (1U << (idx))) == 0);         \
        (rq)->rq_rep_swab_mask |= (1U << (idx));                        \
} while (0)

/* just looking: assert idx already unpacked */
#define LASSERT_REQSWABBED(rq, idx)                                     \
LASSERT((idx) < sizeof((rq)->rq_req_swab_mask) * 8 &&                   \
        ((rq)->rq_req_swab_mask & (1U << (idx))) != 0)

#define LASSERT_REPSWABBED(rq, idx)                                     \
LASSERT((idx) < sizeof((rq)->rq_rep_swab_mask) * 8 &&                   \
        ((rq)->rq_rep_swab_mask & (1U << (idx))) != 0)
#else
#define LASSERT_REQSWAB(rq, idx)
#define LASSERT_REPSWAB(rq, idx)
#define LASSERT_REQSWABBED(rq, idx)
#define LASSERT_REPSWABBED(rq, idx)
#endif
/* Per-request scratch storage for asynchronous completion handlers; it is
 * embedded in struct ptlrpc_request as rq_async_args.
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
206 union ptlrpc_async_args {
207 /* Scratchpad for passing args to completion interpreter. Users
208 * cast to the struct of their choosing, and LASSERT that this is
209 * big enough. For _tons_ of context, OBD_ALLOC a struct and store
210 * a pointer to it here. The pointer_arg ensures this struct is at
211 * least big enough for that. */
212 void *pointer_arg[9];
/* A group of requests with a shared completion callback.
 * set_interpreter_func is the callback type; it receives the set, an
 * opaque pointer and an int (presumably set_arg and a status -- confirm
 * against the caller).
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
216 struct ptlrpc_request_set;
217 typedef int (*set_interpreter_func)(struct ptlrpc_request_set *, void *, int);
219 struct ptlrpc_request_set {
220 int set_remaining; /* # uncompleted requests */
/* woken by ptlrpc_wake_client_req() for any request that belongs to a set */
221 wait_queue_head_t set_waitq;
222 wait_queue_head_t *set_wakeup_ptr;
223 struct list_head set_requests;
224 set_interpreter_func set_interpret; /* completion callback */
225 void *set_arg; /* completion context */
226 /* locked so that any old caller can communicate requests to
227 * the set holder who can then fold them into the lock-free set */
228 spinlock_t set_new_req_lock;
229 struct list_head set_new_requests;
232 struct ptlrpc_bulk_desc;
/*
 * ptlrpc callback & work item stuff
 */
/* Callback descriptor: a function taking the network event, plus one
 * opaque argument stored alongside it.  Embedded in requests, reply
 * states, bulk descriptors and request buffer descriptors.
 * NOTE(review): the closing brace is not visible in this view. */
237 struct ptlrpc_cb_id {
238 void (*cbid_fn)(ptl_event_t *ev); /* specific callback fn */
239 void *cbid_arg; /* additional arg */
/* Server-side state kept for a reply: list linkage, status bits, the reply
 * buffers and up to RS_MAX_LOCKS lock handles/modes held until the client
 * ACKs.  struct ptlrpc_request points at one through rq_reply_state.
 * NOTE(review): the closing brace, and possibly further members or
 * preprocessor guards, are not visible in this view. */
243 struct ptlrpc_svcsec;
245 #define RS_MAX_LOCKS 4
248 struct ptlrpc_reply_state {
249 struct ptlrpc_cb_id rs_cb_id;
250 struct list_head rs_list;
251 struct list_head rs_exp_list;
252 struct list_head rs_obd_list;
254 struct list_head rs_debug_list;
256 /* updates to following flag serialised by srv_request_lock */
257 unsigned int rs_difficult:1; /* ACK/commit stuff */
258 unsigned int rs_scheduled:1; /* being handled? */
259 unsigned int rs_scheduled_ever:1; /* any schedule attempts? */
260 unsigned int rs_handled:1; /* been handled yet? */
261 unsigned int rs_on_net:1; /* reply_out_callback pending? */
263 struct ptlrpc_svcsec *rs_svcsec;
264 char *rs_buf; /* backend buffer */
265 int rs_buf_len; /* backend buffer length */
266 char *rs_repbuf; /* will be sent on wire */
267 int rs_repbuf_len; /* max on-wire data length */
268 int rs_repdata_len; /* actual on-wire data length */
269 struct lustre_msg *rs_msg; /* lustre msg pointer */
270 int rs_msg_len; /* length of lustre msg */
274 struct obd_export *rs_export;
275 struct ptlrpc_srv_ni *rs_srv_ni;
276 ptl_handle_md_t rs_md_h;
278 /* locks awaiting client reply ACK */
280 struct lustre_handle rs_locks[RS_MAX_LOCKS];
281 ldlm_mode_t rs_modes[RS_MAX_LOCKS];
282 struct llog_create_locks *rs_llog_locks;
/* One RPC request, used on both client and server (see the per-section
 * comments below).
 * NOTE(review): this view is incomplete.  Other code in this header reads
 * rq_lock, rq_phase, rq_xid, rq_status, rq_reqlen and rq_replen from this
 * struct, none of which appear below, and the closing brace is missing as
 * well -- confirm against the complete header before relying on layout. */
285 struct ptlrpc_request {
286 int rq_type; /* one of PTL_RPC_MSG_* */
287 struct list_head rq_list;
290 /* client-side flags */
/* rq_receiving_reply and rq_replied are read under rq_lock by the inline
 * accessors in this header */
291 unsigned int rq_intr:1, rq_replied:1, rq_err:1,
292 rq_timedout:1, rq_resend:1, rq_restart:1, rq_replay:1,
293 rq_no_resend:1, rq_waiting:1, rq_receiving_reply:1,
294 rq_no_delay:1, rq_net_err:1, rq_req_wrapped:1,
295 rq_ptlrpcs_restart:1;
297 /* client-side refcount for SENT race */
298 atomic_t rq_refcount;
300 int rq_request_portal; /* XXX FIXME bug 249 */
301 int rq_reply_portal; /* XXX FIXME bug 249 */
303 /* client-side # reply bytes actually received */
307 struct lustre_msg *rq_reqmsg;
311 struct lustre_msg *rq_repmsg;
314 struct list_head rq_replay_list;
316 struct ptlrpc_cred *rq_cred; /* client side credit */
317 struct ptlrpc_svcsec *rq_svcsec; /* server side security */
318 /* XXX temporarily put here XXX */
319 void *rq_sec_svcdata; /* server security data */
320 unsigned int rq_remote; /* from remote client */
323 char *rq_reqbuf; /* backend request buffer */
324 int rq_reqbuf_len; /* backend request buffer length */
325 int rq_reqdata_len; /* actual request data length */
326 char *rq_repbuf; /* backend reply buffer */
327 int rq_repbuf_len; /* backend reply buffer length */
328 int rq_repdata_len; /* actual reply data length, not used yet */
/* one bit per message buffer index, maintained by the LASSERT_*SWAB macros */
331 __u32 rq_req_swab_mask;
332 __u32 rq_rep_swab_mask;
335 int rq_import_generation;
336 enum lustre_imp_state rq_send_state;
338 /* client+server request */
339 ptl_handle_md_t rq_req_md_h;
340 struct ptlrpc_cb_id rq_req_cbid;
343 struct timeval rq_rpcd_start;
346 struct timeval rq_arrival_time; /* request arrival time */
347 struct ptlrpc_reply_state *rq_reply_state; /* separated reply state */
348 struct ptlrpc_request_buffer_desc *rq_rqbd; /* incoming request buffer */
350 ptl_uid_t rq_uid; /* peer uid, used in MDS only */
353 /* client-only incoming reply */
354 ptl_handle_md_t rq_reply_md_h;
355 wait_queue_head_t rq_reply_waitq;
356 struct ptlrpc_cb_id rq_reply_cbid;
358 struct ptlrpc_peer rq_peer; /* XXX see service.c can this be factored away? */
359 char rq_peerstr[PTL_NALFMT_SIZE];
360 struct obd_export *rq_export;
361 struct obd_import *rq_import;
363 void (*rq_replay_cb)(struct ptlrpc_request *);
364 void (*rq_commit_cb)(struct ptlrpc_request *);
367 struct ptlrpc_bulk_desc *rq_bulk; /* client side bulk */
368 time_t rq_sent; /* when the request was sent */
370 struct ptlrpc_service *rq_svc;
/* rq_set == NULL means the request is not in a set; ptlrpc_wake_client_req()
 * then wakes rq_reply_waitq instead of the set's wait queue */
373 struct list_head rq_set_chain;
374 struct ptlrpc_request_set *rq_set;
375 void *rq_interpret_reply; /* Async completion handler */
376 union ptlrpc_async_args rq_async_args; /* Async completion context */
377 void * rq_ptlrpcd_data;
/* Values compared against a request's rq_phase by DEBUG_REQ_FLAGS(). */
#define RQ_PHASE_NEW         0xebc0de00
#define RQ_PHASE_RPC         0xebc0de01
#define RQ_PHASE_BULK        0xebc0de02
#define RQ_PHASE_INTERPRET   0xebc0de03
#define RQ_PHASE_COMPLETE    0xebc0de04

/* Spare the preprocessor, spoil the bugs. */
/* Yields str when field is non-zero, otherwise the empty string. */
#define FLAG(field, str) ((field) ? (str) : "")

/* Expands to the comma-separated argument list that REQ_FLAGS_FMT consumes:
 * first the phase name, then one (possibly empty) letter per flag bit.
 * Every RQ_PHASE_* value has a name; anything else prints as "?phase?".
 * NB this is an argument list, not an expression, so it cannot be wrapped
 * in outer parentheses. */
#define DEBUG_REQ_FLAGS(req)                                                   \
        (((req)->rq_phase == RQ_PHASE_NEW) ? "New" :                           \
         ((req)->rq_phase == RQ_PHASE_RPC) ? "Rpc" :                           \
         ((req)->rq_phase == RQ_PHASE_BULK) ? "Bulk" :                         \
         ((req)->rq_phase == RQ_PHASE_INTERPRET) ? "Interpret" :               \
         ((req)->rq_phase == RQ_PHASE_COMPLETE) ? "Complete" : "?phase?"),     \
        FLAG((req)->rq_intr, "I"), FLAG((req)->rq_replied, "R"),               \
        FLAG((req)->rq_err, "E"),                                              \
        FLAG((req)->rq_timedout, "X") /* eXpired */,                           \
        FLAG((req)->rq_resend, "S"),                                           \
        FLAG((req)->rq_restart, "T"), FLAG((req)->rq_replay, "P"),             \
        FLAG((req)->rq_no_resend, "N"),                                        \
        FLAG((req)->rq_waiting, "W")

/* One %s for the phase name, a colon, then one %s per flag above (nine). */
#define REQ_FLAGS_FMT "%s:%s%s%s%s%s%s%s%s%s"
/* Log one CDEBUG line describing req: caller's message, then the request
 * pointer, xid, opcode, target/remote UUIDs, request portal, lengths,
 * refcount, phase/flags, message flags and status codes.
 * NOTE(review): this view looks incomplete.  The format string has two
 * LPD64 conversions ("x" and "t") but only rq_xid is visible; the remote
 * UUID expression has a ": <?>" alternative with no visible condition; and
 * the last line ends in a continuation, so a statement wrapper probably
 * surrounds the CDEBUG call.  Confirm against the complete header. */
404 #define DEBUG_REQ(level, req, fmt, args...) \
406 CDEBUG(level, "@@@ " fmt \
407 " req@%p x"LPD64"/t"LPD64" o%d->%s@%s:%d lens %d/%d ref %d fl " \
408 REQ_FLAGS_FMT"/%x/%x rc %d/%d\n" , ## args, req, req->rq_xid, \
410 req->rq_reqmsg ? req->rq_reqmsg->opc : -1, \
411 req->rq_import ? (char *)req->rq_import->imp_target_uuid.uuid : "<?>", \
413 (char *)req->rq_import->imp_connection->c_remote_uuid.uuid : "<?>", \
414 (req->rq_import && req->rq_import->imp_client) ? \
415 req->rq_import->imp_client->cli_request_portal : -1, \
416 req->rq_reqlen, req->rq_replen, \
417 atomic_read(&req->rq_refcount), \
418 DEBUG_REQ_FLAGS(req), \
419 req->rq_reqmsg ? req->rq_reqmsg->flags : 0, \
420 req->rq_repmsg ? req->rq_repmsg->flags : 0, \
421 req->rq_status, req->rq_repmsg ? req->rq_repmsg->status : 0); \
/* One page of a bulk transfer: list linkage, the page and an offset
 * within it.
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
424 struct ptlrpc_bulk_page {
425 struct list_head bp_link;
427 int bp_pageoffset; /* offset within a page */
428 struct page *bp_page;
/* Values for the two-bit bd_type field of struct ptlrpc_bulk_desc:
 * {put,get}{source,sink}. */
#define BULK_GET_SOURCE   0
#define BULK_PUT_SINK     1
#define BULK_GET_SINK     2
#define BULK_PUT_SOURCE   3
/* Descriptor for one bulk transfer, ending in a zero-length iov array.
 * NOTE(review): two alternative declarations of bd_iov follow a visible
 * #if, but the matching #else/#endif and the closing brace are not visible
 * in this view; further members may be missing too. */
436 struct ptlrpc_bulk_desc {
437 unsigned int bd_success:1; /* completed successfully */
/* read under bd_lock by ptlrpc_bulk_active() */
438 unsigned int bd_network_rw:1; /* accessible to the network */
439 unsigned int bd_type:2; /* {put,get}{source,sink} */
440 unsigned int bd_registered:1; /* client side */
441 spinlock_t bd_lock; /* serialise with callback */
442 int bd_import_generation;
443 struct obd_export *bd_export;
444 struct obd_import *bd_import;
446 struct ptlrpc_request *bd_req; /* associated request */
447 wait_queue_head_t bd_waitq; /* server side only WQ */
448 int bd_iov_count; /* # entries in bd_iov */
449 int bd_max_iov; /* allocated size of bd_iov */
450 int bd_nob; /* # bytes covered */
451 int bd_nob_transferred; /* # bytes GOT/PUT */
455 struct ptlrpc_cb_id bd_cbid; /* network callback info */
456 ptl_handle_md_t bd_md_h; /* associated MD */
458 #if (!CRAY_PORTALS && defined(__KERNEL__))
459 ptl_kiov_t bd_iov[0];
461 ptl_md_iovec_t bd_iov[0];
/* Per-thread record: list linkage plus a control wait queue.
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
465 struct ptlrpc_thread {
466 struct list_head t_link;
469 wait_queue_head_t t_ctl_waitq;
/* Descriptor for one incoming-request buffer; embeds a whole
 * struct ptlrpc_request (rqbd_req) and is pointed to by a request's
 * rq_rqbd.
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
472 struct ptlrpc_request_buffer_desc {
473 struct list_head rqbd_list;
474 struct ptlrpc_srv_ni *rqbd_srv_ni;
475 ptl_handle_md_t rqbd_md_h;
478 struct ptlrpc_cb_id rqbd_cbid;
479 struct ptlrpc_request rqbd_req;
/* event queues are per-ni, because one day we may get a hardware
 * supported NAL that delivers events asynchronously wrt kernel portals */
/* Per-interface state: the network interface handle and its event queue
 * handle.
 * NOTE(review): pni_number, which ptlrpc_peernid2str() reads, and the
 * closing brace are not visible in this view. */
486 struct ptlrpc_ni { /* Generic interface state */
489 ptl_handle_ni_t pni_ni_h;
490 ptl_handle_eq_t pni_eq_h;
/* What a service keeps per network interface; struct ptlrpc_service ends
 * with an array of these (srv_interfaces).
 * NOTE(review): the closing brace is not visible in this view. */
493 struct ptlrpc_srv_ni {
494 /* Interface-specific service state */
495 struct ptlrpc_service *sni_service; /* owning service */
496 struct ptlrpc_ni *sni_ni; /* network interface */
497 struct list_head sni_active_rqbds; /* req buffers receiving */
498 struct list_head sni_active_replies; /* all the active replies */
499 int sni_nrqbd_receiving; /* # posted request buffers */
/* svc_handler_t: the per-request handler a service is created with (see
 * the svc_handler_t parameter of ptlrpc_init_svc()).
 *
 * struct ptlrpc_service: one request service -- sizing parameters,
 * portals, queues, threads and the handler -- followed by a zero-length
 * array of per-interface state.
 * NOTE(review): the closing brace, and possibly further members (e.g. the
 * lock that the rs_* flag comment calls srv_request_lock), are not visible
 * in this view. */
502 typedef int (*svc_handler_t)(struct ptlrpc_request *req);
504 struct ptlrpc_service {
505 struct list_head srv_list; /* chain thru all services */
506 int srv_max_req_size; /* biggest request to receive */
507 int srv_buf_size; /* size of individual buffers */
508 int srv_nbuf_per_group; /* # buffers to allocate in 1 group */
509 int srv_nbufs; /* total # req buffer descs allocated */
510 int srv_nthreads; /* # running threads */
511 int srv_n_difficult_replies; /* # 'difficult' replies */
512 int srv_n_active_reqs; /* # reqs being served */
513 int srv_rqbd_timeout; /* timeout before re-posting reqs */
514 int srv_watchdog_timeout; /* soft watchdog timeout, in ms */
516 __u32 srv_req_portal;
517 __u32 srv_rep_portal;
519 int srv_n_queued_reqs; /* # reqs waiting to be served */
520 struct list_head srv_request_queue; /* reqs waiting for service */
522 struct list_head srv_idle_rqbds; /* request buffers to be reposted */
524 atomic_t srv_outstanding_replies;
525 struct list_head srv_reply_queue; /* replies waiting for service */
527 wait_queue_head_t srv_waitq; /* all threads sleep on this */
529 struct list_head srv_threads;
530 struct obd_device *srv_obddev;
531 svc_handler_t srv_handler;
533 char *srv_name; /* only statically allocated strings here; we don't clean them */
537 struct proc_dir_entry *srv_procroot;
538 struct lprocfs_stats *srv_stats;
540 struct ptlrpc_srv_ni srv_interfaces[0];
543 static inline char *ptlrpc_peernid2str(struct ptlrpc_peer *p, char *str)
545 LASSERT(p->peer_ni != NULL);
546 return (portals_nid2str(p->peer_ni->pni_number, p->peer_id.nid, str));
549 static inline char *ptlrpc_id2str(struct ptlrpc_peer *p, char *str)
551 LASSERT(p->peer_ni != NULL);
552 return (portals_id2str(p->peer_ni->pni_number, p->peer_id, str));
556 /* ptlrpc/events.c */
557 extern struct ptlrpc_ni ptlrpc_interfaces[];
558 extern int ptlrpc_ninterfaces;
559 extern int ptlrpc_uuid_to_peer(struct obd_uuid *uuid, struct ptlrpc_peer *peer);
560 extern void request_out_callback (ptl_event_t *ev);
561 extern void reply_in_callback(ptl_event_t *ev);
562 extern void client_bulk_callback (ptl_event_t *ev);
563 extern void request_in_callback(ptl_event_t *ev);
564 extern void reply_out_callback(ptl_event_t *ev);
565 extern void server_bulk_callback (ptl_event_t *ev);
566 extern int ptlrpc_default_nal(void);
568 /* ptlrpc/connection.c */
569 void ptlrpc_dump_connections(void);
570 void ptlrpc_readdress_connection(struct ptlrpc_connection *, struct obd_uuid *);
571 struct ptlrpc_connection *ptlrpc_get_connection(struct ptlrpc_peer *peer,
572 struct obd_uuid *uuid);
573 int ptlrpc_put_connection(struct ptlrpc_connection *c);
574 struct ptlrpc_connection *ptlrpc_connection_addref(struct ptlrpc_connection *);
575 void ptlrpc_init_connection(void);
576 void ptlrpc_cleanup_connection(void);
577 extern ptl_pid_t ptl_get_pid(void);
579 /* ptlrpc/niobuf.c */
580 int ptlrpc_start_bulk_transfer(struct ptlrpc_bulk_desc *desc);
581 void ptlrpc_abort_bulk(struct ptlrpc_bulk_desc *desc);
582 int ptlrpc_register_bulk(struct ptlrpc_request *req);
583 void ptlrpc_unregister_bulk (struct ptlrpc_request *req);
585 static inline int ptlrpc_bulk_active (struct ptlrpc_bulk_desc *desc)
590 spin_lock_irqsave (&desc->bd_lock, flags);
591 rc = desc->bd_network_rw;
592 spin_unlock_irqrestore (&desc->bd_lock, flags);
596 int ptlrpc_send_reply(struct ptlrpc_request *req, int);
597 int ptlrpc_reply(struct ptlrpc_request *req);
598 int ptlrpc_error(struct ptlrpc_request *req);
599 void ptlrpc_resend_req(struct ptlrpc_request *request);
600 int ptl_send_rpc(struct ptlrpc_request *request);
601 int ptlrpc_register_rqbd (struct ptlrpc_request_buffer_desc *rqbd);
602 int ptlrpc_do_rawrpc(struct obd_import *imp, char *reqbuf, int reqlen,
603 char *repbuf, int *replenp, int timeout);
605 /* ptlrpc/client.c */
606 void ptlrpc_init_client(int req_portal, int rep_portal, char *name,
607 struct ptlrpc_client *);
608 void ptlrpc_cleanup_client(struct obd_import *imp);
609 struct ptlrpc_connection *ptlrpc_uuid_to_connection(struct obd_uuid *uuid);
612 ptlrpc_client_receiving_reply (struct ptlrpc_request *req)
617 spin_lock_irqsave(&req->rq_lock, flags);
618 rc = req->rq_receiving_reply;
619 spin_unlock_irqrestore(&req->rq_lock, flags);
624 ptlrpc_client_replied (struct ptlrpc_request *req)
629 spin_lock_irqsave(&req->rq_lock, flags);
630 rc = req->rq_replied;
631 spin_unlock_irqrestore(&req->rq_lock, flags);
636 ptlrpc_wake_client_req (struct ptlrpc_request *req)
638 if (req->rq_set == NULL)
639 wake_up(&req->rq_reply_waitq);
641 wake_up(&req->rq_set->set_waitq);
644 int ptlrpc_queue_wait(struct ptlrpc_request *req);
645 int ptlrpc_replay_req(struct ptlrpc_request *req);
646 void ptlrpc_unregister_reply(struct ptlrpc_request *req);
647 void ptlrpc_restart_req(struct ptlrpc_request *req);
648 void ptlrpc_abort_inflight(struct obd_import *imp);
650 struct ptlrpc_request_set *ptlrpc_prep_set(void);
651 int ptlrpc_set_next_timeout(struct ptlrpc_request_set *);
652 int ptlrpc_check_set(struct ptlrpc_request_set *set);
653 int ptlrpc_set_wait(struct ptlrpc_request_set *);
654 int ptlrpc_expired_set(void *data);
655 void ptlrpc_interrupted_set(void *data);
656 void ptlrpc_mark_interrupted(struct ptlrpc_request *req);
657 void ptlrpc_set_destroy(struct ptlrpc_request_set *);
658 void ptlrpc_set_add_req(struct ptlrpc_request_set *, struct ptlrpc_request *);
659 void ptlrpc_set_add_new_req(struct ptlrpc_request_set *,
660 struct ptlrpc_request *);
662 struct ptlrpc_request *ptlrpc_prep_req(struct obd_import *imp, __u32 version,
663 int opcode, int count, int *lengths,
665 void ptlrpc_free_req(struct ptlrpc_request *request);
666 void ptlrpc_req_finished(struct ptlrpc_request *request);
667 void ptlrpc_req_finished_with_imp_lock(struct ptlrpc_request *request);
668 struct ptlrpc_request *ptlrpc_request_addref(struct ptlrpc_request *req);
669 struct ptlrpc_bulk_desc *ptlrpc_prep_bulk_imp (struct ptlrpc_request *req,
670 int npages, int type, int portal);
671 struct ptlrpc_bulk_desc *ptlrpc_prep_bulk_exp(struct ptlrpc_request *req,
672 int npages, int type, int portal);
673 void ptlrpc_free_bulk(struct ptlrpc_bulk_desc *bulk);
674 void ptlrpc_prep_bulk_page(struct ptlrpc_bulk_desc *desc,
675 struct page *page, int pageoffset, int len);
676 void ptlrpc_retain_replayable_request(struct ptlrpc_request *req,
677 struct obd_import *imp);
678 __u64 ptlrpc_next_xid(void);
680 /* ptlrpc/service.c */
681 void ptlrpc_require_repack (struct ptlrpc_request *req);
682 void ptlrpc_save_lock (struct ptlrpc_request *req,
683 struct lustre_handle *lock, int mode);
684 void ptlrpc_save_llog_lock (struct ptlrpc_request *req,
685 struct llog_create_locks *lcl);
686 void ptlrpc_commit_replies (struct obd_device *obd);
687 void ptlrpc_schedule_difficult_reply (struct ptlrpc_reply_state *rs);
688 struct ptlrpc_service *ptlrpc_init_svc(int nbufs, int bufsize, int max_req_size,
689 int req_portal, int rep_portal,
690 int watchdog_timeout, /* in ms */
691 svc_handler_t, char *name,
692 struct proc_dir_entry *proc_entry);
693 void ptlrpc_stop_all_threads(struct ptlrpc_service *svc);
694 int ptlrpc_start_n_threads(struct obd_device *dev, struct ptlrpc_service *svc,
695 int cnt, char *base_name);
696 int ptlrpc_start_thread(struct obd_device *dev, struct ptlrpc_service *svc,
698 int ptlrpc_unregister_service(struct ptlrpc_service *service);
699 int liblustre_check_services (void *arg);
700 void ptlrpc_daemonize(void);
/* Bundle of pointers -- service, thread and obd device -- grouped in one
 * struct (presumably the start-up argument for a service thread; confirm
 * against ptlrpc_start_thread()).
 * NOTE(review): the closing brace, and possibly further members, are not
 * visible in this view. */
703 struct ptlrpc_svc_data {
705 struct ptlrpc_service *svc;
706 struct ptlrpc_thread *thread;
707 struct obd_device *dev;
710 /* ptlrpc/import.c */
711 int ptlrpc_connect_import(struct obd_import *imp, char * new_uuid);
712 int ptlrpc_init_import(struct obd_import *imp);
713 int ptlrpc_disconnect_import(struct obd_import *imp);
714 int ptlrpc_import_recovery_state_machine(struct obd_import *imp);
716 /* ptlrpc/pack_generic.c */
717 int lustre_msg_swabbed(struct lustre_msg *msg);
718 int lustre_msg_check_version(struct lustre_msg *msg, __u32 version);
719 int lustre_pack_request(struct ptlrpc_request *, int count, int *lens,
721 int lustre_pack_reply(struct ptlrpc_request *, int count, int *lens,
723 void lustre_free_reply_state(struct ptlrpc_reply_state *rs);
724 int lustre_msg_size(int count, int *lengths);
725 int lustre_unpack_msg(struct lustre_msg *m, int len);
726 void *lustre_msg_buf(struct lustre_msg *m, int n, int minlen);
727 char *lustre_msg_string (struct lustre_msg *m, int n, int max_len);
728 void *lustre_swab_buf(struct lustre_msg *, int n, int minlen, void *swabber);
729 void *lustre_swab_reqbuf (struct ptlrpc_request *req, int n, int minlen,
731 void *lustre_swab_repbuf (struct ptlrpc_request *req, int n, int minlen,
734 void lustre_init_msg (struct lustre_msg *msg, int count,
735 int *lens, char **bufs);
736 void *mdc_setattr_pack(struct lustre_msg *msg, int offset,
737 struct mdc_op_data *data, struct iattr *iattr,
738 void *ea, int ealen, void *ea2, int ea2len);
739 void *mdc_create_pack(struct lustre_msg *msg, int offset,
740 struct mdc_op_data *op_data, __u32 mode,
741 __u64 rdev, const void *data, int datalen);
742 void *mdc_unlink_pack(struct lustre_msg *msg, int offset,
743 struct mdc_op_data *data);
744 void *mdc_link_pack(struct lustre_msg *msg, int offset,
745 struct mdc_op_data *data);
746 void *mdc_rename_pack(struct lustre_msg *msg, int offset,
747 struct mdc_op_data *data,
748 const char *old, int oldlen,
749 const char *new, int newlen);
751 /* lustre id helper functions and macros. */
753 void mdc_pack_id(struct lustre_id *id, obd_id ino,
754 __u32 gen, int type, __u64 mds,
759 id->li_fid.lf_id = fid;
760 id->li_fid.lf_group = mds;
762 id->li_stc.u.e3s.l3s_ino = ino;
763 id->li_stc.u.e3s.l3s_gen = gen;
764 id->li_stc.u.e3s.l3s_type = type;
/* Field accessors for struct lustre_id.  Each expands to an lvalue, so it
 * can be read or assigned; @id is a pointer. */
#define id_ino(id)                              \
        ((id)->li_stc.u.e3s.l3s_ino)

#define id_gen(id)                              \
        ((id)->li_stc.u.e3s.l3s_gen)

#define id_type(id)                             \
        ((id)->li_stc.u.e3s.l3s_type)

#define id_fid(id)                              \
        ((id)->li_fid.lf_id)

#define id_group(id)                            \
        ((id)->li_fid.lf_group)

#define id_version(id)                          \
        ((id)->li_fid.lf_version)

/* Copy only the fid half / only the store-cookie half from id2 to id1. */
#define id_assign_fid(id1, id2)                 \
        ((id1)->li_fid = (id2)->li_fid)

#define id_assign_stc(id1, id2)                 \
        ((id1)->li_stc = (id2)->li_stc)

/* Equality on ino, gen, fid and group.  type and version are not compared. */
#define id_equal(id1, id2)                      \
        (id_ino((id1)) == id_ino((id2)) &&      \
         id_gen((id1)) == id_gen((id2)) &&      \
         id_fid((id1)) == id_fid((id2)) &&      \
         id_group((id1)) == id_group((id2)))

#define id_equal_fid(id1, id2)                  \
        (id_fid((id1)) == id_fid((id2)) &&      \
         id_group((id1)) == id_group((id2)))

#define id_equal_stc(id1, id2)                  \
        (id_ino((id1)) == id_ino((id2)) &&      \
         id_gen((id1)) == id_gen((id2)))

/* In-place byte-order conversion of all six fields; fid, group and ino are
 * converted as 64-bit values, version, gen and type as 32-bit values. */
#define id_le_to_cpu(id)                                                \
do {                                                                    \
        id_fid((id)) = le64_to_cpu(id_fid((id)));                       \
        id_group((id)) = le64_to_cpu(id_group((id)));                   \
        id_version((id)) = le32_to_cpu(id_version((id)));               \
        id_ino((id)) = le64_to_cpu(id_ino((id)));                       \
        id_gen((id)) = le32_to_cpu(id_gen((id)));                       \
        id_type((id)) = le32_to_cpu(id_type((id)));                     \
} while (0)

#define id_cpu_to_le(id)                                                \
do {                                                                    \
        id_fid((id)) = cpu_to_le64(id_fid((id)));                       \
        id_group((id)) = cpu_to_le64(id_group((id)));                   \
        id_version((id)) = cpu_to_le32(id_version((id)));               \
        id_ino((id)) = cpu_to_le64(id_ino((id)));                       \
        id_gen((id)) = cpu_to_le32(id_gen((id)));                       \
        id_type((id)) = cpu_to_le32(id_type((id)));                     \
} while (0)
827 mdc_inode2id(struct lustre_id *id, struct inode *inode)
829 mdc_pack_id(id, inode->i_ino, inode->i_generation,
830 (inode->i_mode & S_IFMT), 0, 0);
/* Fill an mdc_op_data from up to two inodes, a name and a mode: id1/id2
 * come from mdc_inode2id(), and namelen, create_mode and mod_time (current
 * time, in seconds via LTIME_S) are stored.
 * NOTE(review): this view is incomplete -- the return type, the tail of
 * the parameter list (the `mode` used below is not declared here), the
 * braces and some statements are missing.  In particular, whether the i2
 * conversion is guarded by a NULL check and where `name` is stored cannot
 * be determined from here; confirm against the complete header. */
834 mdc_prepare_mdc_data(struct mdc_op_data *data, struct inode *i1,
835 struct inode *i2, const char *name, int namelen,
840 mdc_inode2id(&data->id1, i1);
842 mdc_inode2id(&data->id2, i2);
846 data->namelen = namelen;
847 data->create_mode = mode;
848 data->mod_time = LTIME_S(CURRENT_TIME);
852 /* ldlm/ldlm_lib.c */
853 int client_obd_setup(struct obd_device *obddev, obd_count len, void *buf);
854 int client_obd_cleanup(struct obd_device * obddev, int flags);
855 int client_connect_import(struct lustre_handle *conn, struct obd_device *obd,
856 struct obd_uuid *cluuid, unsigned long);
857 int client_disconnect_export(struct obd_export *exp, unsigned long);
859 int client_import_add_conn(struct obd_import *imp, struct obd_uuid *uuid,
861 int client_import_del_conn(struct obd_import *imp, struct obd_uuid *uuid);
862 int import_set_conn_priority(struct obd_import *imp, struct obd_uuid *uuid);
865 /* ptlrpc/pinger.c */
866 int ptlrpc_pinger_add_import(struct obd_import *imp);
867 int ptlrpc_pinger_del_import(struct obd_import *imp);
869 /* ptlrpc/ptlrpcd.c */
870 void ptlrpcd_wake(struct ptlrpc_request *req);
871 void ptlrpcd_add_req(struct ptlrpc_request *req);
872 int ptlrpcd_addref(void);
873 void ptlrpcd_decref(void);
/* Register/unregister an obd device with the ptlrpc lprocfs code, given
 * both as real prototypes and as no-op macro stubs.
 * NOTE(review): the two forms are mutually exclusive alternatives, but the
 * conditional-compilation lines that select between them are not visible
 * in this view -- confirm the guard against the complete header. */
875 /* ptlrpc/lproc_ptlrpc.c */
877 void ptlrpc_lprocfs_register_obd(struct obd_device *obddev);
878 void ptlrpc_lprocfs_unregister_obd(struct obd_device *obddev);
880 #define ptlrpc_lprocfs_register_obd(param...) do{}while(0)
881 #define ptlrpc_lprocfs_unregister_obd(param...) do{}while(0)
884 /* ptlrpc/llog_server.c */
885 int llog_origin_handle_open(struct ptlrpc_request *req);
886 int llog_origin_handle_prev_block(struct ptlrpc_request *req);
887 int llog_origin_handle_next_block(struct ptlrpc_request *req);
888 int llog_origin_handle_read_header(struct ptlrpc_request *req);
889 int llog_origin_handle_close(struct ptlrpc_request *req);
890 int llog_origin_handle_cancel(struct ptlrpc_request *req);
891 int llog_catinfo(struct ptlrpc_request *req);
893 /* ptlrpc/llog_client.c */
894 extern struct llog_operations llog_client_ops;