4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License version 2 for more details. A copy is
14 * included in the COPYING file that accompanied this code.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
24 * Use is subject to license terms.
26 * Copyright (c) 2011, 2012 Intel Corporation
29 * This file is part of Lustre, http://www.lustre.org/
31 * lustre/mdt/mdt_mds.c
33 * Lustre Metadata Service Layer
35 * Author: Di Wang <di.wang@whamcloud.com>
38 #define DEBUG_SUBSYSTEM S_MDS
40 #include <linux/module.h>
42 #include <obd_support.h>
43 /* struct ptlrpc_request */
44 #include <lustre_net.h>
45 /* struct obd_export */
46 #include <lustre_export.h>
47 /* struct obd_device */
50 #include <dt_object.h>
51 #include <lustre_mds.h>
52 #include <lustre_mdt.h>
53 #include "mdt_internal.h"
54 #ifdef HAVE_QUOTA_SUPPORT
55 # include <lustre_quota.h>
57 #include <lustre_acl.h>
58 #include <lustre_param.h>
59 #include <lustre_fsfilt.h>
/*
 * File-scope MD device and one ptlrpc service handle per MDS service.
 * NOTE(review): mds_start_ptlrpc_service() and mds_stop_ptlrpc_service() in
 * this file operate on identically named members of struct mds_device
 * (m->mds_regular_service, ...), not on these variables - confirm whether
 * these globals are still referenced anywhere.
 */
63 struct md_device mds_md_dev;
64 struct ptlrpc_service *mds_regular_service;
65 struct ptlrpc_service *mds_readpage_service;
66 struct ptlrpc_service *mds_out_service;
67 struct ptlrpc_service *mds_setattr_service;
68 struct ptlrpc_service *mds_mdsc_service;
69 struct ptlrpc_service *mds_mdss_service;
70 struct ptlrpc_service *mds_fld_service;
74 * * Thread-count module parameters; mdt_num_threads is folded into mds_num_threads in mds_mod_init().
/*
 * Deprecated alias for mds_num_threads: mds_mod_init() copies it into
 * mds_num_threads when it is non-zero and mds_num_threads is still 0.
 */
76 static unsigned long mdt_num_threads;
77 CFS_MODULE_PARM(mdt_num_threads, "ul", ulong, 0444,
78 "number of MDS service threads to start "
79 "(deprecated in favor of mds_num_threads)");
/* Passed as .tc_nthrs_user for the regular and the out service. */
81 static unsigned long mds_num_threads;
82 CFS_MODULE_PARM(mds_num_threads, "ul", ulong, 0444,
83 "number of MDS service threads to start");
/* Passed as .cc_pattern for the regular and the out service. */
85 static char *mds_num_cpts;
86 CFS_MODULE_PARM(mds_num_cpts, "c", charp, 0444,
87 "CPU partitions MDS threads should run on");
/* Passed as .tc_nthrs_user for the readpage service. */
89 static unsigned long mds_rdpg_num_threads;
90 CFS_MODULE_PARM(mds_rdpg_num_threads, "ul", ulong, 0444,
91 "number of MDS readpage service threads to start");
/* Passed as .cc_pattern for the readpage service. */
93 static char *mds_rdpg_num_cpts;
94 CFS_MODULE_PARM(mds_rdpg_num_cpts, "c", charp, 0444,
95 "CPU partitions MDS readpage threads should run on");
97 /* NB: these two should be removed along with setattr service in the future */
/* Passed as .tc_nthrs_user for the setattr service. */
98 static unsigned long mds_attr_num_threads;
99 CFS_MODULE_PARM(mds_attr_num_threads, "ul", ulong, 0444,
100 "number of MDS setattr service threads to start");
/* Passed as .cc_pattern for the setattr service. */
102 static char *mds_attr_num_cpts;
103 CFS_MODULE_PARM(mds_attr_num_cpts, "c", charp, 0444,
104 "CPU partitions MDS setattr threads should run on");
/*
 * Common building block for every DEF_*_HDL macro in this file: expands to
 * one struct mdt_handler table entry. The part of the expansion shown here
 * derives the fault-injection id by token pasting: OBD_FAIL_<opc>_NET.
 * NOTE(review): base is presumably the first opcode of the table, used to
 * position the entry - confirm against the full expansion.
 */
106 #define DEFINE_RPC_HANDLER(base, flags, opc, fn, fmt) \
109 .mh_fail_id = OBD_FAIL_ ## opc ## _NET, \
/*
 * Shorthands for entries in MDS_* handler tables. Both use MDS_GETATTR as
 * the base opcode; they differ only in the request format argument.
 */
116 /* Request with a format known in advance */
117 #define DEF_MDT_HDL(flags, name, fn) \
118 DEFINE_RPC_HANDLER(MDS_GETATTR, flags, name, fn, &RQF_ ## name)
120 /* Request with a format we do not yet know */
121 #define DEF_MDT_HDL_VAR(flags, name, fn) \
122 DEFINE_RPC_HANDLER(MDS_GETATTR, flags, name, fn, NULL)
124 /* Map one non-standard request format handler. This should probably get
125 * a common OBD_SET_INFO RPC opcode instead of this mismatch. */
/*
 * DEF_MDT_HDL(..., MDS_SET_INFO, ...) pastes the name into RQF_MDS_SET_INFO;
 * this alias makes that resolve to RQF_OBD_SET_INFO.
 */
126 #define RQF_MDS_SET_INFO RQF_OBD_SET_INFO
/*
 * Handler table for the MDS_* opcodes. It backs the
 * MDS_GETATTR..MDS_LAST_OPC slice of both mdt_regular_handlers and
 * update_handlers. Each entry gives the handler flags, the opcode and the
 * handler function; MDS_SYNC is the only entry declared without a
 * predefined request format (DEF_MDT_HDL_VAR).
 */
128 static struct mdt_handler mdt_mds_ops[] = {
129 DEF_MDT_HDL(0, MDS_CONNECT, mdt_connect),
130 DEF_MDT_HDL(0, MDS_DISCONNECT, mdt_disconnect),
131 DEF_MDT_HDL(0, MDS_SET_INFO, mdt_set_info),
132 DEF_MDT_HDL(0, MDS_GET_INFO, mdt_get_info),
133 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_GETSTATUS, mdt_getstatus),
134 DEF_MDT_HDL(HABEO_CORPUS, MDS_GETATTR, mdt_getattr),
135 DEF_MDT_HDL(HABEO_CORPUS| HABEO_REFERO, MDS_GETATTR_NAME, mdt_getattr_name),
136 DEF_MDT_HDL(HABEO_CORPUS, MDS_GETXATTR, mdt_getxattr),
137 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_STATFS, mdt_statfs),
138 DEF_MDT_HDL(0 | MUTABOR, MDS_REINT, mdt_reint),
139 DEF_MDT_HDL(HABEO_CORPUS, MDS_CLOSE, mdt_close),
140 DEF_MDT_HDL(HABEO_CORPUS, MDS_DONE_WRITING, mdt_done_writing),
141 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_PIN, mdt_pin),
142 DEF_MDT_HDL_VAR(0, MDS_SYNC, mdt_sync),
143 DEF_MDT_HDL(HABEO_CORPUS| HABEO_REFERO, MDS_IS_SUBDIR, mdt_is_subdir),
144 DEF_MDT_HDL(0, MDS_QUOTACHECK, mdt_quotacheck),
145 DEF_MDT_HDL(0, MDS_QUOTACTL, mdt_quotactl),
146 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_HSM_PROGRESS, mdt_hsm_progress),
147 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_HSM_CT_REGISTER,
148 mdt_hsm_ct_register),
149 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_HSM_CT_UNREGISTER,
150 mdt_hsm_ct_unregister),
151 DEF_MDT_HDL(HABEO_CORPUS| HABEO_REFERO, MDS_HSM_STATE_GET,
153 DEF_MDT_HDL(HABEO_CORPUS| HABEO_REFERO, MDS_HSM_STATE_SET,
155 DEF_MDT_HDL(HABEO_CORPUS| HABEO_REFERO, MDS_HSM_ACTION, mdt_hsm_action),
156 DEF_MDT_HDL(0 | HABEO_REFERO, MDS_HSM_REQUEST, mdt_hsm_request),
/*
 * OBD_* opcode handlers. Entries use OBD_PING as the base opcode and carry
 * no predefined request format (fmt is NULL). The table is shared by
 * mdt_regular_handlers, mdt_readpage_handlers and update_handlers.
 */
159 #define DEF_OBD_HDL(flags, name, fn) \
160 DEFINE_RPC_HANDLER(OBD_PING, flags, name, fn, NULL)
162 static struct mdt_handler mdt_obd_ops[] = {
163 DEF_OBD_HDL(0, OBD_PING, mdt_obd_ping),
164 DEF_OBD_HDL(0, OBD_LOG_CANCEL, mdt_obd_log_cancel),
165 DEF_OBD_HDL(0, OBD_QC_CALLBACK, mdt_obd_qc_callback),
166 DEF_OBD_HDL(0, OBD_IDX_READ, mdt_obd_idx_read)
/*
 * LDLM_* opcode handlers, based at LDLM_ENQUEUE. Only LDLM_ENQUEUE has a
 * predefined request format (DEF_DLM_HDL); the others use the _VAR form with
 * a NULL format. The table is shared by mdt_regular_handlers and
 * update_handlers.
 */
169 #define DEF_DLM_HDL_VAR(flags, name, fn) \
170 DEFINE_RPC_HANDLER(LDLM_ENQUEUE, flags, name, fn, NULL)
171 #define DEF_DLM_HDL(flags, name, fn) \
172 DEFINE_RPC_HANDLER(LDLM_ENQUEUE, flags, name, fn, &RQF_ ## name)
174 static struct mdt_handler mdt_dlm_ops[] = {
175 DEF_DLM_HDL (HABEO_CLAVIS, LDLM_ENQUEUE, mdt_enqueue),
176 DEF_DLM_HDL_VAR(HABEO_CLAVIS, LDLM_CONVERT, mdt_convert),
177 DEF_DLM_HDL_VAR(0, LDLM_BL_CALLBACK, mdt_bl_callback),
178 DEF_DLM_HDL_VAR(0, LDLM_CP_CALLBACK, mdt_cp_callback)
/*
 * LLOG_* opcode handlers, based at LLOG_ORIGIN_HANDLE_CREATE, all without a
 * predefined request format. WRITE_REC, CLOSE, CONNECT and CATINFO are listed
 * with a NULL handler function.
 * NOTE(review): how the dispatcher treats an entry whose fn is NULL is not
 * visible in this file - confirm against mdt_handle_common().
 */
181 #define DEF_LLOG_HDL(flags, name, fn) \
182 DEFINE_RPC_HANDLER(LLOG_ORIGIN_HANDLE_CREATE, flags, name, fn, NULL)
184 static struct mdt_handler mdt_llog_ops[] = {
185 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_CREATE, mdt_llog_create),
186 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_NEXT_BLOCK, mdt_llog_next_block),
187 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_READ_HEADER, mdt_llog_read_header),
188 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_WRITE_REC, NULL),
189 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_CLOSE, NULL),
190 DEF_LLOG_HDL(0, LLOG_ORIGIN_CONNECT, NULL),
191 DEF_LLOG_HDL(0, LLOG_CATINFO, NULL),
192 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_PREV_BLOCK, mdt_llog_prev_block),
193 DEF_LLOG_HDL(0, LLOG_ORIGIN_HANDLE_DESTROY, mdt_llog_destroy),
/*
 * SEC_CTX_* opcode handlers, based at SEC_CTX_INIT, without a predefined
 * request format. All three opcodes are routed to mdt_sec_ctx_handle. The
 * table is shared by mdt_regular_handlers and update_handlers.
 */
196 #define DEF_SEC_HDL(flags, name, fn) \
197 DEFINE_RPC_HANDLER(SEC_CTX_INIT, flags, name, fn, NULL)
199 static struct mdt_handler mdt_sec_ctx_ops[] = {
200 DEF_SEC_HDL(0, SEC_CTX_INIT, mdt_sec_ctx_handle),
201 DEF_SEC_HDL(0, SEC_CTX_INIT_CONT,mdt_sec_ctx_handle),
202 DEF_SEC_HDL(0, SEC_CTX_FINI, mdt_sec_ctx_handle)
/*
 * Quota opcode handlers, based at QUOTA_DQACQ, with the request format taken
 * from RQF_<name>. Only QUOTA_DQACQ is listed here; the table is used by
 * mdt_regular_handlers only.
 */
205 #define DEF_QUOTA_HDL(flags, name, fn) \
206 DEFINE_RPC_HANDLER(QUOTA_DQACQ, flags, name, fn, &RQF_ ## name)
208 static struct mdt_handler mdt_quota_ops[] = {
209 DEF_QUOTA_HDL(HABEO_REFERO, QUOTA_DQACQ, mdt_quota_dqacq),
/*
 * Opcode slices passed to mdt_handle_common() by mds_regular_handle(). Each
 * slice maps an opcode range (mos_opc_start..mos_opc_end) to a handler table
 * (mos_hs): MDS, OBD, LDLM, LLOG, security context and quota opcodes.
 * Unlike mdt_readpage_handlers and update_handlers, this table is not static.
 */
212 struct mdt_opc_slice mdt_regular_handlers[] = {
214 .mos_opc_start = MDS_GETATTR,
215 .mos_opc_end = MDS_LAST_OPC,
216 .mos_hs = mdt_mds_ops
219 .mos_opc_start = OBD_PING,
220 .mos_opc_end = OBD_LAST_OPC,
221 .mos_hs = mdt_obd_ops
224 .mos_opc_start = LDLM_ENQUEUE,
225 .mos_opc_end = LDLM_LAST_OPC,
226 .mos_hs = mdt_dlm_ops
229 .mos_opc_start = LLOG_ORIGIN_HANDLE_CREATE,
230 .mos_opc_end = LLOG_LAST_OPC,
231 .mos_hs = mdt_llog_ops
234 .mos_opc_start = SEC_CTX_INIT,
235 .mos_opc_end = SEC_LAST_OPC,
236 .mos_hs = mdt_sec_ctx_ops
239 .mos_opc_start = QUOTA_DQACQ,
240 .mos_opc_end = QUOTA_LAST_OPC,
241 .mos_hs = mdt_quota_ops
/*
 * MDS_* opcodes accepted by the readpage service: connect, readpage, and
 * additionally close and done_writing (see the XXX note inside the table).
 * Entries reuse the same handler functions as mdt_mds_ops.
 */
248 /* Readpage/readdir handlers */
249 static struct mdt_handler mdt_readpage_ops[] = {
250 DEF_MDT_HDL(0, MDS_CONNECT, mdt_connect),
251 DEF_MDT_HDL(HABEO_CORPUS | HABEO_REFERO, MDS_READPAGE, mdt_readpage),
252 /* XXX: this is ugly and should be fixed one day, see mdc_close() for
253 * detailed comments. --umka */
254 DEF_MDT_HDL(HABEO_CORPUS, MDS_CLOSE, mdt_close),
255 DEF_MDT_HDL(HABEO_CORPUS, MDS_DONE_WRITING, mdt_done_writing),
/*
 * Opcode slices passed to mdt_handle_common() by mds_readpage_handle():
 * the restricted MDS table above plus the shared OBD table.
 * NOTE(review): the OBD slice starts at OBD_FIRST_OPC here but at OBD_PING
 * in mdt_regular_handlers and update_handlers, while mdt_obd_ops is built
 * with OBD_PING as its base - confirm the two constants are equal.
 */
258 static struct mdt_opc_slice mdt_readpage_handlers[] = {
260 .mos_opc_start = MDS_GETATTR,
261 .mos_opc_end = MDS_LAST_OPC,
262 .mos_hs = mdt_readpage_ops
265 .mos_opc_start = OBD_FIRST_OPC,
266 .mos_opc_end = OBD_LAST_OPC,
267 .mos_hs = mdt_obd_ops
/*
 * Sequence opcode dispatch: a single SEQ_QUERY entry routed to seq_query
 * (cast to void * to fit the handler slot), exposed as one slice covering
 * SEQ_QUERY..SEQ_LAST_OPC. The slice table is used by both mds_mdsc_handle()
 * and mds_mdss_handle().
 */
274 /* Sequence service handlers */
275 #define DEF_SEQ_HDL(flags, name, fn) \
276 DEFINE_RPC_HANDLER(SEQ_QUERY, flags, name, fn, &RQF_ ## name)
278 static struct mdt_handler mdt_seq_ops[] = {
279 DEF_SEQ_HDL(0, SEQ_QUERY, (void *)seq_query),
282 struct mdt_opc_slice mdt_seq_handlers[] = {
284 .mos_opc_start = SEQ_QUERY,
285 .mos_opc_end = SEQ_LAST_OPC,
286 .mos_hs = mdt_seq_ops
/*
 * FLD opcode dispatch: a single FLD_QUERY entry routed to fld_query (cast to
 * void * to fit the handler slot), exposed as one slice covering
 * FLD_QUERY..FLD_LAST_OPC. Used by mds_fld_handle().
 */
293 /* FID Location Database handlers */
294 #define DEF_FLD_HDL(flags, name, fn) \
295 DEFINE_RPC_HANDLER(FLD_QUERY, flags, name, fn, &RQF_ ## name)
297 static struct mdt_handler mdt_fld_ops[] = {
298 DEF_FLD_HDL(0, FLD_QUERY, (void *)fld_query),
301 struct mdt_opc_slice mdt_fld_handlers[] = {
303 .mos_opc_start = FLD_QUERY,
304 .mos_opc_end = FLD_LAST_OPC,
305 .mos_hs = mdt_fld_ops
/*
 * Object update handler table: a single UPDATE_OBJ entry, flagged MUTABOR
 * and routed to out_handle. target_handler is defined as an alias of
 * mdt_handler, so out_ops has the same element type as the other tables.
 */
312 /* Request with a format known in advance */
313 #define DEF_UPDATE_HDL(flags, name, fn) \
314 DEFINE_RPC_HANDLER(UPDATE_OBJ, flags, name, fn, &RQF_ ## name)
316 #define target_handler mdt_handler
317 static struct target_handler out_ops[] = {
318 DEF_UPDATE_HDL(MUTABOR, UPDATE_OBJ, out_handle),
/*
 * Opcode slices passed to mdt_handle_common() by mdt_out_handle(). It reuses
 * the MDS, OBD, LDLM and security context tables from the regular service
 * and adds a final slice for UPDATE_OBJ..UPDATE_LAST_OPC.
 */
321 static struct mdt_opc_slice update_handlers[] = {
323 .mos_opc_start = MDS_GETATTR,
324 .mos_opc_end = MDS_LAST_OPC,
325 .mos_hs = mdt_mds_ops
328 .mos_opc_start = OBD_PING,
329 .mos_opc_end = OBD_LAST_OPC,
330 .mos_hs = mdt_obd_ops
333 .mos_opc_start = LDLM_ENQUEUE,
334 .mos_opc_end = LDLM_LAST_OPC,
335 .mos_hs = mdt_dlm_ops
338 .mos_opc_start = SEC_CTX_INIT,
339 .mos_opc_end = SEC_LAST_OPC,
340 .mos_hs = mdt_sec_ctx_ops
343 .mos_opc_start = UPDATE_OBJ,
344 .mos_opc_end = UPDATE_LAST_OPC,
/*
 * Request handler installed as .so_req_handler for the regular and the
 * setattr service. Dispatches req through the mdt_regular_handlers slice
 * table and returns the result of mdt_handle_common().
 */
352 static int mds_regular_handle(struct ptlrpc_request *req)
354 return mdt_handle_common(req, mdt_regular_handlers);
/*
 * Request handler installed as .so_req_handler for the readpage service.
 * Dispatches req through the mdt_readpage_handlers slice table and returns
 * the result of mdt_handle_common().
 */
357 static int mds_readpage_handle(struct ptlrpc_request *req)
359 return mdt_handle_common(req, mdt_readpage_handlers);
/*
 * Request handler installed as .so_req_handler for the sequence controller
 * service. Dispatches req through mdt_seq_handlers and returns the result of
 * mdt_handle_common().
 */
362 static int mds_mdsc_handle(struct ptlrpc_request *req)
364 return mdt_handle_common(req, mdt_seq_handlers);
/*
 * Request handler installed as .so_req_handler for the object update (out)
 * service. Dispatches req through update_handlers and returns the result of
 * mdt_handle_common().
 */
367 static int mdt_out_handle(struct ptlrpc_request *req)
369 return mdt_handle_common(req, update_handlers);
/*
 * Request handler installed as .so_req_handler for the metadata sequence
 * server service. Uses the same mdt_seq_handlers table as mds_mdsc_handle()
 * and returns the result of mdt_handle_common().
 */
372 static int mds_mdss_handle(struct ptlrpc_request *req)
374 return mdt_handle_common(req, mdt_seq_handlers);
/*
 * Request handler installed as .so_req_handler for the FLD service.
 * Dispatches req through mdt_fld_handlers and returns the result of
 * mdt_handle_common().
 */
377 static int mds_fld_handle(struct ptlrpc_request *req)
379 return mdt_handle_common(req, mdt_fld_handlers);
382 /* device init/fini methods */
/*
 * Unregister every ptlrpc service currently registered on m (regular,
 * readpage, out, setattr, seq controller, seq server, fld) and reset the
 * corresponding pointer to NULL. Services whose pointer is already NULL are
 * skipped, so the function can run on a partially started device; it is
 * called from mds_start_ptlrpc_service() as well as from mds_device_fini().
 */
383 static void mds_stop_ptlrpc_service(struct mds_device *m)
386 if (m->mds_regular_service != NULL) {
387 ptlrpc_unregister_service(m->mds_regular_service);
388 m->mds_regular_service = NULL;
390 if (m->mds_readpage_service != NULL) {
391 ptlrpc_unregister_service(m->mds_readpage_service);
392 m->mds_readpage_service = NULL;
394 if (m->mds_out_service != NULL) {
395 ptlrpc_unregister_service(m->mds_out_service);
396 m->mds_out_service = NULL;
398 if (m->mds_setattr_service != NULL) {
399 ptlrpc_unregister_service(m->mds_setattr_service);
400 m->mds_setattr_service = NULL;
402 if (m->mds_mdsc_service != NULL) {
403 ptlrpc_unregister_service(m->mds_mdsc_service);
404 m->mds_mdsc_service = NULL;
406 if (m->mds_mdss_service != NULL) {
407 ptlrpc_unregister_service(m->mds_mdss_service);
408 m->mds_mdss_service = NULL;
410 if (m->mds_fld_service != NULL) {
411 ptlrpc_unregister_service(m->mds_fld_service);
412 m->mds_fld_service = NULL;
/*
 * Register all MDS ptlrpc services on m, in this order:
 *
 *   service          request portal          handler
 *   regular          MDS_REQUEST_PORTAL      mds_regular_handle
 *   readpage         MDS_READPAGE_PORTAL     mds_readpage_handle
 *   setattr          MDS_SETATTR_PORTAL      mds_regular_handle
 *   out              MDS_MDS_PORTAL          mdt_out_handle
 *   seq controller   SEQ_CONTROLLER_PORTAL   mds_mdsc_handle
 *   seq server       SEQ_METADATA_PORTAL     mds_mdss_handle
 *   fld              FLD_REQUEST_PORTAL      mds_fld_handle
 *
 * Every service replies on MDC_REPLY_PORTAL and is registered under the
 * proc entry of the obd that owns m (asserted to be non-NULL).
 *
 * A single function-local static ptlrpc_service_conf is refilled with a
 * compound literal before each ptlrpc_register_service() call. Only the
 * regular service installs ptlrpc_hpreq_handler as .so_hpreq_handler. The
 * seq and fld services set neither tc_nthrs_user nor a cc_pattern, so the
 * module parameters do not apply to them.
 *
 * When a registration returns an error pointer, the error is extracted into
 * rc, logged with CERROR and the service pointer is reset to NULL, so that
 * mds_stop_ptlrpc_service() skips it. From the readpage service onwards the
 * failure path is GOTO(err_mds_svc, rc).
 *
 * NOTE(review): the memset() before most assignments is redundant, since
 * assigning the compound literal overwrites every member of conf; the out
 * service block has no memset() and relies on exactly that.
 */
417 static int mds_start_ptlrpc_service(struct mds_device *m)
419 static struct ptlrpc_service_conf conf;
420 struct obd_device *obd = m->mds_md_dev.md_lu_dev.ld_obd;
421 cfs_proc_dir_entry_t *procfs_entry;
425 procfs_entry = obd->obd_proc_entry;
426 LASSERT(procfs_entry != NULL);
428 conf = (typeof(conf)) {
429 .psc_name = LUSTRE_MDT_NAME,
430 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
432 .bc_nbufs = MDS_NBUFS,
433 .bc_buf_size = MDS_BUFSIZE,
434 .bc_req_max_size = MDS_MAXREQSIZE,
435 .bc_rep_max_size = MDS_MAXREPSIZE,
436 .bc_req_portal = MDS_REQUEST_PORTAL,
437 .bc_rep_portal = MDC_REPLY_PORTAL,
440 * We'd like to have a mechanism to set this on a per-device
444 .tc_thr_name = LUSTRE_MDT_NAME,
445 .tc_thr_factor = MDS_THR_FACTOR,
446 .tc_nthrs_init = MDS_NTHRS_INIT,
447 .tc_nthrs_base = MDS_NTHRS_BASE,
448 .tc_nthrs_max = MDS_NTHRS_MAX,
449 .tc_nthrs_user = mds_num_threads,
450 .tc_cpu_affinity = 1,
451 .tc_ctx_tags = LCT_MD_THREAD,
454 .cc_pattern = mds_num_cpts,
457 .so_req_handler = mds_regular_handle,
458 .so_req_printer = target_print_req,
459 .so_hpreq_handler = ptlrpc_hpreq_handler,
462 m->mds_regular_service = ptlrpc_register_service(&conf, procfs_entry);
463 if (IS_ERR(m->mds_regular_service)) {
464 rc = PTR_ERR(m->mds_regular_service);
465 CERROR("failed to start regular mdt service: %d\n", rc);
466 m->mds_regular_service = NULL;
472 * readpage service configuration. Parameters have to be adjusted,
475 memset(&conf, 0, sizeof(conf));
476 conf = (typeof(conf)) {
477 .psc_name = LUSTRE_MDT_NAME "_readpage",
478 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
480 .bc_nbufs = MDS_NBUFS,
481 .bc_buf_size = MDS_BUFSIZE,
482 .bc_req_max_size = MDS_MAXREQSIZE,
483 .bc_rep_max_size = MDS_MAXREPSIZE,
484 .bc_req_portal = MDS_READPAGE_PORTAL,
485 .bc_rep_portal = MDC_REPLY_PORTAL,
488 .tc_thr_name = LUSTRE_MDT_NAME "_rdpg",
489 .tc_thr_factor = MDS_RDPG_THR_FACTOR,
490 .tc_nthrs_init = MDS_RDPG_NTHRS_INIT,
491 .tc_nthrs_base = MDS_RDPG_NTHRS_BASE,
492 .tc_nthrs_max = MDS_RDPG_NTHRS_MAX,
493 .tc_nthrs_user = mds_rdpg_num_threads,
494 .tc_cpu_affinity = 1,
495 .tc_ctx_tags = LCT_MD_THREAD,
498 .cc_pattern = mds_rdpg_num_cpts,
501 .so_req_handler = mds_readpage_handle,
502 .so_req_printer = target_print_req,
505 m->mds_readpage_service = ptlrpc_register_service(&conf, procfs_entry);
506 if (IS_ERR(m->mds_readpage_service)) {
507 rc = PTR_ERR(m->mds_readpage_service);
508 CERROR("failed to start readpage service: %d\n", rc);
509 m->mds_readpage_service = NULL;
511 GOTO(err_mds_svc, rc);
515 * setattr service configuration.
517 * XXX To keep the compatibility with old client(< 2.2), we need to
518 * preserve this portal for a certain time, it should be removed
519 * eventually. LU-617.
521 memset(&conf, 0, sizeof(conf));
522 conf = (typeof(conf)) {
523 .psc_name = LUSTRE_MDT_NAME "_setattr",
524 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
526 .bc_nbufs = MDS_NBUFS,
527 .bc_buf_size = MDS_BUFSIZE,
528 .bc_req_max_size = MDS_MAXREQSIZE,
529 .bc_rep_max_size = MDS_MAXREPSIZE,
530 .bc_req_portal = MDS_SETATTR_PORTAL,
531 .bc_rep_portal = MDC_REPLY_PORTAL,
534 .tc_thr_name = LUSTRE_MDT_NAME "_attr",
535 .tc_thr_factor = MDS_SETA_THR_FACTOR,
536 .tc_nthrs_init = MDS_SETA_NTHRS_INIT,
537 .tc_nthrs_base = MDS_SETA_NTHRS_BASE,
538 .tc_nthrs_max = MDS_SETA_NTHRS_MAX,
539 .tc_nthrs_user = mds_attr_num_threads,
540 .tc_cpu_affinity = 1,
541 .tc_ctx_tags = LCT_MD_THREAD,
544 .cc_pattern = mds_attr_num_cpts,
547 .so_req_handler = mds_regular_handle,
548 .so_req_printer = target_print_req,
549 .so_hpreq_handler = NULL,
552 m->mds_setattr_service = ptlrpc_register_service(&conf, procfs_entry);
553 if (IS_ERR(m->mds_setattr_service)) {
554 rc = PTR_ERR(m->mds_setattr_service);
555 CERROR("failed to start setattr service: %d\n", rc);
556 m->mds_setattr_service = NULL;
558 GOTO(err_mds_svc, rc);
561 /* Object update service */
562 conf = (typeof(conf)) {
563 .psc_name = LUSTRE_MDT_NAME "_out",
564 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
566 .bc_nbufs = MDS_NBUFS,
567 .bc_buf_size = MDS_BUFSIZE,
568 .bc_req_max_size = MDS_MAXREQSIZE,
569 .bc_rep_max_size = MDS_MAXREPSIZE,
570 .bc_req_portal = MDS_MDS_PORTAL,
571 .bc_rep_portal = MDC_REPLY_PORTAL,
574 * We'd like to have a mechanism to set this on a per-device
578 .tc_thr_name = LUSTRE_MDT_NAME "_out",
579 .tc_thr_factor = MDS_THR_FACTOR,
580 .tc_nthrs_init = MDS_NTHRS_INIT,
581 .tc_nthrs_base = MDS_NTHRS_BASE,
582 .tc_nthrs_max = MDS_NTHRS_MAX,
583 .tc_nthrs_user = mds_num_threads,
584 .tc_cpu_affinity = 1,
585 .tc_ctx_tags = LCT_MD_THREAD,
588 .cc_pattern = mds_num_cpts,
591 .so_req_handler = mdt_out_handle,
592 .so_req_printer = target_print_req,
593 .so_hpreq_handler = NULL,
596 m->mds_out_service = ptlrpc_register_service(&conf, procfs_entry);
597 if (IS_ERR(m->mds_out_service)) {
598 rc = PTR_ERR(m->mds_out_service);
599 CERROR("failed to start out service: %d\n", rc);
600 m->mds_out_service = NULL;
601 GOTO(err_mds_svc, rc);
605 * sequence controller service configuration
607 memset(&conf, 0, sizeof(conf));
608 conf = (typeof(conf)) {
609 .psc_name = LUSTRE_MDT_NAME "_seqs",
610 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
612 .bc_nbufs = MDS_NBUFS,
613 .bc_buf_size = MDS_BUFSIZE,
614 .bc_req_max_size = SEQ_MAXREQSIZE,
615 .bc_rep_max_size = SEQ_MAXREPSIZE,
616 .bc_req_portal = SEQ_CONTROLLER_PORTAL,
617 .bc_rep_portal = MDC_REPLY_PORTAL,
620 .tc_thr_name = LUSTRE_MDT_NAME "_seqs",
621 .tc_nthrs_init = MDS_OTHR_NTHRS_INIT,
622 .tc_nthrs_max = MDS_OTHR_NTHRS_MAX,
623 .tc_ctx_tags = LCT_MD_THREAD,
626 .so_req_handler = mds_mdsc_handle,
627 .so_req_printer = target_print_req,
628 .so_hpreq_handler = NULL,
631 m->mds_mdsc_service = ptlrpc_register_service(&conf, procfs_entry);
632 if (IS_ERR(m->mds_mdsc_service)) {
633 rc = PTR_ERR(m->mds_mdsc_service);
634 CERROR("failed to start seq controller service: %d\n", rc);
635 m->mds_mdsc_service = NULL;
637 GOTO(err_mds_svc, rc);
641 * metadata sequence server service configuration
643 memset(&conf, 0, sizeof(conf));
644 conf = (typeof(conf)) {
645 .psc_name = LUSTRE_MDT_NAME "_seqm",
646 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
648 .bc_nbufs = MDS_NBUFS,
649 .bc_buf_size = MDS_BUFSIZE,
650 .bc_req_max_size = SEQ_MAXREQSIZE,
651 .bc_rep_max_size = SEQ_MAXREPSIZE,
652 .bc_req_portal = SEQ_METADATA_PORTAL,
653 .bc_rep_portal = MDC_REPLY_PORTAL,
656 .tc_thr_name = LUSTRE_MDT_NAME "_seqm",
657 .tc_nthrs_init = MDS_OTHR_NTHRS_INIT,
658 .tc_nthrs_max = MDS_OTHR_NTHRS_MAX,
659 .tc_ctx_tags = LCT_MD_THREAD | LCT_DT_THREAD
662 .so_req_handler = mds_mdss_handle,
663 .so_req_printer = target_print_req,
664 .so_hpreq_handler = NULL,
667 m->mds_mdss_service = ptlrpc_register_service(&conf, procfs_entry);
668 if (IS_ERR(m->mds_mdss_service)) {
669 rc = PTR_ERR(m->mds_mdss_service);
670 CERROR("failed to start metadata seq server service: %d\n", rc);
671 m->mds_mdss_service = NULL;
673 GOTO(err_mds_svc, rc);
676 /* FLD service start */
677 memset(&conf, 0, sizeof(conf));
678 conf = (typeof(conf)) {
679 .psc_name = LUSTRE_MDT_NAME "_fld",
680 .psc_watchdog_factor = MDT_SERVICE_WATCHDOG_FACTOR,
682 .bc_nbufs = MDS_NBUFS,
683 .bc_buf_size = MDS_BUFSIZE,
684 .bc_req_max_size = FLD_MAXREQSIZE,
685 .bc_rep_max_size = FLD_MAXREPSIZE,
686 .bc_req_portal = FLD_REQUEST_PORTAL,
687 .bc_rep_portal = MDC_REPLY_PORTAL,
690 .tc_thr_name = LUSTRE_MDT_NAME "_fld",
691 .tc_nthrs_init = MDS_OTHR_NTHRS_INIT,
692 .tc_nthrs_max = MDS_OTHR_NTHRS_MAX,
693 .tc_ctx_tags = LCT_DT_THREAD | LCT_MD_THREAD
696 .so_req_handler = mds_fld_handle,
697 .so_req_printer = target_print_req,
698 .so_hpreq_handler = NULL,
701 m->mds_fld_service = ptlrpc_register_service(&conf, procfs_entry);
702 if (IS_ERR(m->mds_fld_service)) {
703 rc = PTR_ERR(m->mds_fld_service);
704 CERROR("failed to start fld service: %d\n", rc);
705 m->mds_fld_service = NULL;
707 GOTO(err_mds_svc, rc);
/* Unregister whichever services are currently registered on m. */
713 mds_stop_ptlrpc_service(m);
/*
 * Map a generic lu_device back to the mds_device that embeds it as
 * mds_md_dev.md_lu_dev.
 */
718 static inline struct mds_device *mds_dev(struct lu_device *d)
720 return container_of0(d, struct mds_device, mds_md_dev.md_lu_dev);
/*
 * Device fini callback (installed as .ldto_device_fini): unregisters all
 * ptlrpc services of the MDS device and then cleans up the lprocfs state of
 * the obd attached to the lu_device.
 */
723 static struct lu_device *mds_device_fini(const struct lu_env *env,
726 struct mds_device *m = mds_dev(d);
727 struct obd_device *obd = d->ld_obd;
730 mds_stop_ptlrpc_service(m);
731 lprocfs_obd_cleanup(obd);
/*
 * Device free callback (installed as .ldto_device_free): finalizes the
 * embedded md_device with md_device_fini(). Also called directly from the
 * failure paths of mds_device_alloc().
 */
735 static struct lu_device *mds_device_free(const struct lu_env *env,
738 struct mds_device *m = mds_dev(d);
741 md_device_fini(&m->mds_md_dev);
/*
 * Device alloc callback (installed as .ldto_device_alloc). Initializes the
 * embedded md_device for type t, looks up the obd named by configuration
 * string 0 (asserted to exist), sets up its lprocfs entries from
 * lprocfs_mds_obd_vars and starts the ptlrpc services. If the lprocfs setup
 * or the service start fails, the device is released with
 * mds_device_free(). An ERR_PTR(-ENOMEM) return is the out-of-memory path.
 */
746 static struct lu_device *mds_device_alloc(const struct lu_env *env,
747 struct lu_device_type *t,
748 struct lustre_cfg *cfg)
750 struct mds_device *m;
751 struct obd_device *obd;
757 return ERR_PTR(-ENOMEM);
759 md_device_init(&m->mds_md_dev, t);
760 l = &m->mds_md_dev.md_lu_dev;
762 obd = class_name2obd(lustre_cfg_string(cfg, 0));
763 LASSERT(obd != NULL);
766 /* set this lu_device to obd, because error handling need it */
769 rc = lprocfs_obd_setup(obd, lprocfs_mds_obd_vars);
771 mds_device_free(env, l);
776 rc = mds_start_ptlrpc_service(m);
779 mds_device_free(env, l);
787 /* type constructor/destructor: mds_type_init, mds_type_fini */
788 LU_TYPE_INIT_FINI(mds, &mdt_thread_key);
/*
 * Operations of the MDS lu_device type: type-level init/fini/start/stop
 * hooks plus the per-device alloc/free/fini callbacks defined in this file.
 * NOTE(review): the mds_type_* hooks are presumably generated by the
 * LU_TYPE_INIT_FINI(mds, ...) invocation - confirm against the macro.
 */
790 static struct lu_device_type_operations mds_device_type_ops = {
791 .ldto_init = mds_type_init,
792 .ldto_fini = mds_type_fini,
794 .ldto_start = mds_type_start,
795 .ldto_stop = mds_type_stop,
797 .ldto_device_alloc = mds_device_alloc,
798 .ldto_device_free = mds_device_free,
799 .ldto_device_fini = mds_device_fini
/*
 * lu_device_type descriptor for the MDS: tagged LU_DEVICE_MD, named
 * LUSTRE_MDS_NAME, using mds_device_type_ops and the LCT_MD_THREAD context
 * tag.
 */
802 static struct lu_device_type mds_device_type = {
803 .ldt_tags = LU_DEVICE_MD,
804 .ldt_name = LUSTRE_MDS_NAME,
805 .ldt_ops = &mds_device_type_ops,
806 .ldt_ctx_tags = LCT_MD_THREAD
/*
 * obd_ops passed to class_register_type() in mds_mod_init(); the owner is
 * set to this module.
 */
809 static struct obd_ops mds_obd_device_ops = {
810 .o_owner = THIS_MODULE,
/*
 * Module init for the MDS type. If only the deprecated mdt_num_threads
 * parameter was set, a console notice is printed and its value is carried
 * over to mds_num_threads. The obd type is then registered under
 * LUSTRE_MDS_NAME with mds_obd_device_ops and lprocfs_mds_module_vars.
 */
813 int mds_mod_init(void)
817 if (mdt_num_threads != 0 && mds_num_threads == 0) {
818 LCONSOLE_INFO("mdt_num_threads module parameter is deprecated, "
819 "use mds_num_threads instead or unset both for "
820 "dynamic thread startup\n");
821 mds_num_threads = mdt_num_threads;
824 rc = class_register_type(&mds_obd_device_ops, NULL,
825 lprocfs_mds_module_vars, LUSTRE_MDS_NAME,
/*
 * Module exit for the MDS type: unregisters the obd type that
 * mds_mod_init() registered under LUSTRE_MDS_NAME.
 */
830 void mds_mod_exit(void)
832 class_unregister_type(LUSTRE_MDS_NAME);