/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*- * vim:expandtab:shiftwidth=8:tabstop=8: * * lustre/cmm/cmm_device.c * Lustre Cluster Metadata Manager (cmm) * * Copyright (c) 2006 Cluster File Systems, Inc. * Author: Mike Pershin * * This file is part of the Lustre file system, http://www.lustre.org * Lustre is a trademark of Cluster File Systems, Inc. * * You may have signed or agreed to another license before downloading * this software. If so, you are bound by the terms and conditions * of that agreement, and the following does not apply to you. See the * LICENSE file included with this distribution for more information. * * If you did not agree to a different license, then this copy of Lustre * is open source software; you can redistribute it and/or modify it * under the terms of version 2 of the GNU General Public License as * published by the Free Software Foundation. * * In either case, Lustre is distributed in the hope that it will be * useful, but WITHOUT ANY WARRANTY; without even the implied warranty * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * license text for more details. */ #ifndef EXPORT_SYMTAB # define EXPORT_SYMTAB #endif #define DEBUG_SUBSYSTEM S_MDS #include #include #include #include #include #include "cmm_internal.h" #include "mdc_internal.h" static struct obd_ops cmm_obd_device_ops = { .o_owner = THIS_MODULE }; static struct lu_device_operations cmm_lu_ops; static inline int lu_device_is_cmm(struct lu_device *d) { return ergo(d != NULL && d->ld_ops != NULL, d->ld_ops == &cmm_lu_ops); } int cmm_root_get(const struct lu_env *env, struct md_device *md, struct lu_fid *fid) { struct cmm_device *cmm_dev = md2cmm_dev(md); /* valid only on master MDS */ if (cmm_dev->cmm_local_num == 0) return cmm_child_ops(cmm_dev)->mdo_root_get(env, cmm_dev->cmm_child, fid); else return -EINVAL; } static int cmm_statfs(const struct lu_env *env, struct md_device *md, struct kstatfs *sfs) { struct cmm_device *cmm_dev = md2cmm_dev(md); int rc; ENTRY; rc = cmm_child_ops(cmm_dev)->mdo_statfs(env, cmm_dev->cmm_child, sfs); RETURN (rc); } static int cmm_maxsize_get(const struct lu_env *env, struct md_device *md, int *md_size, int *cookie_size) { struct cmm_device *cmm_dev = md2cmm_dev(md); int rc; ENTRY; rc = cmm_child_ops(cmm_dev)->mdo_maxsize_get(env, cmm_dev->cmm_child, md_size, cookie_size); RETURN(rc); } static int cmm_init_capa_ctxt(const struct lu_env *env, struct md_device *md, int mode , unsigned long timeout, __u32 alg, struct lustre_capa_key *keys) { struct cmm_device *cmm_dev = md2cmm_dev(md); int rc; ENTRY; LASSERT(cmm_child_ops(cmm_dev)->mdo_init_capa_ctxt); rc = cmm_child_ops(cmm_dev)->mdo_init_capa_ctxt(env, cmm_dev->cmm_child, mode, timeout, alg, keys); RETURN(rc); } static int cmm_update_capa_key(const struct lu_env *env, struct md_device *md, struct lustre_capa_key *key) { struct cmm_device *cmm_dev = md2cmm_dev(md); int rc; ENTRY; rc = cmm_child_ops(cmm_dev)->mdo_update_capa_key(env, cmm_dev->cmm_child, key); RETURN(rc); } static struct md_device_operations cmm_md_ops = { .mdo_statfs = cmm_statfs, .mdo_root_get = cmm_root_get, .mdo_maxsize_get = cmm_maxsize_get, .mdo_init_capa_ctxt = cmm_init_capa_ctxt, .mdo_update_capa_key = cmm_update_capa_key, }; extern struct lu_device_type mdc_device_type; static int cmm_post_init_mdc(const struct lu_env *env, struct cmm_device *cmm) { int max_mdsize, max_cookiesize, rc; struct mdc_device *mc, *tmp; /* get the max mdsize and cookiesize from lower layer */ rc = cmm_maxsize_get(env, &cmm->cmm_md_dev, &max_mdsize, &max_cookiesize); if (rc) RETURN(rc); spin_lock(&cmm->cmm_tgt_guard); list_for_each_entry_safe(mc, tmp, &cmm->cmm_targets, mc_linkage) { mdc_init_ea_size(env, mc, max_mdsize, max_cookiesize); } spin_unlock(&cmm->cmm_tgt_guard); RETURN(rc); } /* --- cmm_lu_operations --- */ /* add new MDC to the CMM, create MDC lu_device and connect it to mdc_obd */ static int cmm_add_mdc(const struct lu_env *env, struct cmm_device *cm, struct lustre_cfg *cfg) { struct lu_device_type *ldt = &mdc_device_type; char *p, *num = lustre_cfg_string(cfg, 2); struct mdc_device *mc, *tmp; struct lu_fld_target target; struct lu_device *ld; mdsno_t mdc_num; int rc; ENTRY; /* find out that there is no such mdc */ LASSERT(num); mdc_num = simple_strtol(num, &p, 10); if (*p) { CERROR("Invalid index in lustre_cgf, offset 2\n"); RETURN(-EINVAL); } spin_lock(&cm->cmm_tgt_guard); list_for_each_entry_safe(mc, tmp, &cm->cmm_targets, mc_linkage) { if (mc->mc_num == mdc_num) { spin_unlock(&cm->cmm_tgt_guard); RETURN(-EEXIST); } } spin_unlock(&cm->cmm_tgt_guard); ld = ldt->ldt_ops->ldto_device_alloc(env, ldt, cfg); ld->ld_site = cmm2lu_dev(cm)->ld_site; rc = ldt->ldt_ops->ldto_device_init(env, ld, NULL, NULL); if (rc) { ldt->ldt_ops->ldto_device_free(env, ld); RETURN (rc); } /* pass config to the just created MDC */ rc = ld->ld_ops->ldo_process_config(env, ld, cfg); if (rc) RETURN(rc); spin_lock(&cm->cmm_tgt_guard); list_for_each_entry_safe(mc, tmp, &cm->cmm_targets, mc_linkage) { if (mc->mc_num == mdc_num) { spin_unlock(&cm->cmm_tgt_guard); ldt->ldt_ops->ldto_device_fini(env, ld); ldt->ldt_ops->ldto_device_free(env, ld); RETURN(-EEXIST); } } mc = lu2mdc_dev(ld); list_add_tail(&mc->mc_linkage, &cm->cmm_targets); cm->cmm_tgt_count++; spin_unlock(&cm->cmm_tgt_guard); lu_device_get(cmm2lu_dev(cm)); target.ft_srv = NULL; target.ft_idx = mc->mc_num; target.ft_exp = mc->mc_desc.cl_exp; fld_client_add_target(cm->cmm_fld, &target); /* Set max md size for the mdc. */ rc = cmm_post_init_mdc(env, cm); RETURN(rc); } static void cmm_device_shutdown(const struct lu_env *env, struct cmm_device *cm, struct lustre_cfg *cfg) { struct mdc_device *mc, *tmp; ENTRY; /* Remove local target from FLD. */ fld_client_del_target(cm->cmm_fld, cm->cmm_local_num); /* Finish all mdc devices. */ spin_lock(&cm->cmm_tgt_guard); list_for_each_entry_safe(mc, tmp, &cm->cmm_targets, mc_linkage) { struct lu_device *ld_m = mdc2lu_dev(mc); fld_client_del_target(cm->cmm_fld, mc->mc_num); ld_m->ld_ops->ldo_process_config(env, ld_m, cfg); } spin_unlock(&cm->cmm_tgt_guard); /* remove upcall device*/ md_upcall_fini(&cm->cmm_md_dev); EXIT; } static int cmm_device_mount(const struct lu_env *env, struct cmm_device *m, struct lustre_cfg *cfg) { const char *index = lustre_cfg_string(cfg, 2); char *p; LASSERT(index != NULL); m->cmm_local_num = simple_strtol(index, &p, 10); if (*p) { CERROR("Invalid index in lustre_cgf\n"); RETURN(-EINVAL); } RETURN(0); } static int cmm_process_config(const struct lu_env *env, struct lu_device *d, struct lustre_cfg *cfg) { struct cmm_device *m = lu2cmm_dev(d); struct lu_device *next = md2lu_dev(m->cmm_child); int err; ENTRY; switch(cfg->lcfg_command) { case LCFG_ADD_MDC: /* On first ADD_MDC add also local target. */ if (!(m->cmm_flags & CMM_INITIALIZED)) { struct lu_site *ls = cmm2lu_dev(m)->ld_site; struct lu_fld_target target; target.ft_srv = ls->ls_server_fld; target.ft_idx = m->cmm_local_num; target.ft_exp = NULL; fld_client_add_target(m->cmm_fld, &target); } err = cmm_add_mdc(env, m, cfg); /* The first ADD_MDC can be counted as setup is finished. */ if (!(m->cmm_flags & CMM_INITIALIZED)) m->cmm_flags |= CMM_INITIALIZED; break; case LCFG_SETUP: { /* lower layers should be set up at first */ err = next->ld_ops->ldo_process_config(env, next, cfg); if (err == 0) err = cmm_device_mount(env, m, cfg); break; } case LCFG_CLEANUP: { cmm_device_shutdown(env, m, cfg); } default: err = next->ld_ops->ldo_process_config(env, next, cfg); } RETURN(err); } static int cmm_recovery_complete(const struct lu_env *env, struct lu_device *d) { struct cmm_device *m = lu2cmm_dev(d); struct lu_device *next = md2lu_dev(m->cmm_child); int rc; ENTRY; rc = next->ld_ops->ldo_recovery_complete(env, next); RETURN(rc); } static struct lu_device_operations cmm_lu_ops = { .ldo_object_alloc = cmm_object_alloc, .ldo_process_config = cmm_process_config, .ldo_recovery_complete = cmm_recovery_complete }; /* --- lu_device_type operations --- */ int cmm_upcall(const struct lu_env *env, struct md_device *md, enum md_upcall_event ev) { int rc; ENTRY; switch (ev) { case MD_LOV_SYNC: rc = cmm_post_init_mdc(env, md2cmm_dev(md)); if (rc) CERROR("can not init md size %d\n", rc); /* fall through */ default: rc = md_do_upcall(env, md, ev); } RETURN(rc); } static struct lu_device *cmm_device_alloc(const struct lu_env *env, struct lu_device_type *t, struct lustre_cfg *cfg) { struct lu_device *l; struct cmm_device *m; ENTRY; OBD_ALLOC_PTR(m); if (m == NULL) { l = ERR_PTR(-ENOMEM); } else { md_device_init(&m->cmm_md_dev, t); m->cmm_md_dev.md_ops = &cmm_md_ops; md_upcall_init(&m->cmm_md_dev, cmm_upcall); l = cmm2lu_dev(m); l->ld_ops = &cmm_lu_ops; OBD_ALLOC_PTR(m->cmm_fld); if (!m->cmm_fld) GOTO(out_free_cmm, l = ERR_PTR(-ENOMEM)); } RETURN(l); out_free_cmm: OBD_FREE_PTR(m); return l; } static void cmm_device_free(const struct lu_env *env, struct lu_device *d) { struct cmm_device *m = lu2cmm_dev(d); LASSERT(m->cmm_tgt_count == 0); LASSERT(list_empty(&m->cmm_targets)); if (m->cmm_fld != NULL) { OBD_FREE_PTR(m->cmm_fld); m->cmm_fld = NULL; } md_device_fini(&m->cmm_md_dev); OBD_FREE_PTR(m); } /* context key constructor/destructor */ static void *cmm_key_init(const struct lu_context *ctx, struct lu_context_key *key) { struct cmm_thread_info *info; CLASSERT(CFS_PAGE_SIZE >= sizeof *info); OBD_ALLOC_PTR(info); if (info == NULL) info = ERR_PTR(-ENOMEM); return info; } static void cmm_key_fini(const struct lu_context *ctx, struct lu_context_key *key, void *data) { struct cmm_thread_info *info = data; OBD_FREE_PTR(info); } static struct lu_context_key cmm_thread_key = { .lct_tags = LCT_MD_THREAD, .lct_init = cmm_key_init, .lct_fini = cmm_key_fini }; struct cmm_thread_info *cmm_env_info(const struct lu_env *env) { struct cmm_thread_info *info; info = lu_context_key_get(&env->le_ctx, &cmm_thread_key); LASSERT(info != NULL); return info; } static int cmm_type_init(struct lu_device_type *t) { LU_CONTEXT_KEY_INIT(&cmm_thread_key); return lu_context_key_register(&cmm_thread_key); } static void cmm_type_fini(struct lu_device_type *t) { lu_context_key_degister(&cmm_thread_key); } static int cmm_device_init(const struct lu_env *env, struct lu_device *d, const char *name, struct lu_device *next) { struct cmm_device *m = lu2cmm_dev(d); struct lu_site *ls; int err = 0; ENTRY; spin_lock_init(&m->cmm_tgt_guard); INIT_LIST_HEAD(&m->cmm_targets); m->cmm_tgt_count = 0; m->cmm_child = lu2md_dev(next); err = fld_client_init(m->cmm_fld, name, LUSTRE_CLI_FLD_HASH_DHT); if (err) { CERROR("Can't init FLD, err %d\n", err); RETURN(err); } /* Assign site's fld client ref, needed for asserts in osd. */ ls = cmm2lu_dev(m)->ld_site; ls->ls_client_fld = m->cmm_fld; err = cmm_procfs_init(m, name); RETURN(err); } static struct lu_device *cmm_device_fini(const struct lu_env *env, struct lu_device *ld) { struct cmm_device *cm = lu2cmm_dev(ld); struct mdc_device *mc, *tmp; struct lu_site *ls; ENTRY; /* Finish all mdc devices */ spin_lock(&cm->cmm_tgt_guard); list_for_each_entry_safe(mc, tmp, &cm->cmm_targets, mc_linkage) { struct lu_device *ld_m = mdc2lu_dev(mc); list_del_init(&mc->mc_linkage); lu_device_put(cmm2lu_dev(cm)); ld_m->ld_type->ldt_ops->ldto_device_fini(env, ld_m); ld_m->ld_type->ldt_ops->ldto_device_free(env, ld_m); cm->cmm_tgt_count--; } spin_unlock(&cm->cmm_tgt_guard); fld_client_fini(cm->cmm_fld); ls = cmm2lu_dev(cm)->ld_site; ls->ls_client_fld = NULL; cmm_procfs_fini(cm); RETURN (md2lu_dev(cm->cmm_child)); } static struct lu_device_type_operations cmm_device_type_ops = { .ldto_init = cmm_type_init, .ldto_fini = cmm_type_fini, .ldto_device_alloc = cmm_device_alloc, .ldto_device_free = cmm_device_free, .ldto_device_init = cmm_device_init, .ldto_device_fini = cmm_device_fini }; static struct lu_device_type cmm_device_type = { .ldt_tags = LU_DEVICE_MD, .ldt_name = LUSTRE_CMM_NAME, .ldt_ops = &cmm_device_type_ops, .ldt_ctx_tags = LCT_MD_THREAD | LCT_DT_THREAD }; struct lprocfs_vars lprocfs_cmm_obd_vars[] = { { 0 } }; struct lprocfs_vars lprocfs_cmm_module_vars[] = { { 0 } }; LPROCFS_INIT_VARS(cmm, lprocfs_cmm_module_vars, lprocfs_cmm_obd_vars); static int __init cmm_mod_init(void) { struct lprocfs_static_vars lvars; lprocfs_init_vars(cmm, &lvars); return class_register_type(&cmm_obd_device_ops, NULL, lvars.module_vars, LUSTRE_CMM_NAME, &cmm_device_type); } static void __exit cmm_mod_exit(void) { class_unregister_type(LUSTRE_CMM_NAME); } MODULE_AUTHOR("Cluster File Systems, Inc. "); MODULE_DESCRIPTION("Lustre Clustered Metadata Manager ("LUSTRE_CMM_NAME")"); MODULE_LICENSE("GPL"); cfs_module(cmm, "0.1.0", cmm_mod_init, cmm_mod_exit);