X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Flod%2Flod_dev.c;h=3cb717194ef42cbef0a4f0c743c327e93e7214c5;hp=608f754abc247f410de669b538a653e151c8de7a;hb=ad1810a2dbea1eed5e8b5feb55bdf915a545feb3;hpb=74ec68346e14851ad8a1912185e1dccd3e6d12cd diff --git a/lustre/lod/lod_dev.c b/lustre/lod/lod_dev.c index 608f754..3cb71719 100644 --- a/lustre/lod/lod_dev.c +++ b/lustre/lod/lod_dev.c @@ -6,13 +6,13 @@ * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License version 2 only, * as published by the Free Software Foundation. - + * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License version 2 for more details. A copy is * included in the COPYING file that accompanied this code. - + * * You should have received a copy of the GNU General Public License * along with this program; if not, write to the Free Software * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA @@ -23,8 +23,7 @@ * Copyright 2009 Sun Microsystems, Inc. All rights reserved * Use is subject to license terms. * - * Copyright (c) 2012, Intel Corporation. - * + * Copyright (c) 2012, 2014, Intel Corporation. */ /* * This file is part of Lustre, http://www.lustre.org/ @@ -37,67 +36,128 @@ * Author: Alex Zhuravlev * Author: Mikhail Pershin */ +/** + * The Logical Object Device (LOD) layer manages access to striped + * objects (both regular files and directories). It implements the DT + * device and object APIs and is responsible for creating, storing, + * and loading striping information as an extended attribute of the + * underlying OSD object. LOD is the server side analog of the LOV and + * LMV layers on the client side. 
+ * + * Metadata LU object stack (layers of the same compound LU object, + * all have the same FID): + * + * MDT + * | MD API + * MDD + * | DT API + * LOD + * / \ DT API + * OSD OSP + * + * During LOD object initialization the localness or remoteness of the + * object FID dictates the choice between OSD and OSP. + * + * An LOD object (file or directory) with N stripes (each has a + * different FID): + * + * LOD + * | + * +---+---+---+...+ + * | | | | | + * S0 S1 S2 S3 S(N-1) OS[DP] objects, seen as DT objects by LOD + * + * When upper layers must access an object's stripes (which are + * themselves OST or MDT LU objects) LOD finds these objects by their + * FIDs and stores them as an array of DT object pointers on the + * object. Declarations and operations on LOD objects are received by + * LOD (as DT object operations) and performed on the underlying + * OS[DP] object and (as needed) on the stripes. From the perspective + * of LOD, a stripe-less file (created by mknod() or open with + * O_LOV_DELAY_CREATE) is an object which does not yet have stripes, + * while a non-striped directory (created by mkdir()) is an object + * which will never have stripes. + * + * The LOD layer also implements a small subset of the OBD device API + * to support MDT stack initialization and finalization (an MDD device + * connects and disconnects itself to and from the underlying LOD + * device), and pool management. In turn LOD uses the OBD device API + * to connect itself to the underlying OSD, and to connect itself to + * OSP devices representing the MDTs and OSTs that bear the stripes of + * its objects. + */ -#ifndef EXPORT_SYMTAB -# define EXPORT_SYMTAB -#endif #define DEBUG_SUBSYSTEM S_MDS #include +#include +#include #include +#include #include "lod_internal.h" -/** - * Lookup MDT/OST index \a tgt by FID \a fid. +/* + * Lookup target by FID. + * + * Lookup MDT/OST target index by FID. Type of the target can be + * specific or any. * - * \param lod LOD to be lookup at. 
- * \param fid FID of object to find MDT/OST. - * \param tgt MDT/OST index to return. - * \param flags indidcate the FID is on MDS or OST. + * \param[in] env LU environment provided by the caller + * \param[in] lod lod device + * \param[in] fid FID + * \param[out] tgt result target index + * \param[in] type expected type of the target: + * LU_SEQ_RANGE_{MDT,OST,ANY} + * + * \retval 0 on success + * \retval negative negated errno on error **/ int lod_fld_lookup(const struct lu_env *env, struct lod_device *lod, - const struct lu_fid *fid, __u32 *tgt, int flags) + const struct lu_fid *fid, __u32 *tgt, int *type) { - struct lu_seq_range range; + struct lu_seq_range range = { 0 }; struct lu_server_fld *server_fld; - int rc = 0; + int rc; ENTRY; - LASSERTF(fid_is_sane(fid), "Invalid FID "DFID"\n", PFID(fid)); + if (!fid_is_sane(fid)) { + CERROR("%s: invalid FID "DFID"\n", lod2obd(lod)->obd_name, + PFID(fid)); + RETURN(-EIO); + } + if (fid_is_idif(fid)) { *tgt = fid_idif_ost_idx(fid); - RETURN(rc); + *type = LU_SEQ_RANGE_OST; + RETURN(0); } - if (!lod->lod_initialized || !fid_is_norm(fid)) { + if (!lod->lod_initialized || (!fid_seq_in_fldb(fid_seq(fid)))) { LASSERT(lu_site2seq(lod2lu_dev(lod)->ld_site) != NULL); + *tgt = lu_site2seq(lod2lu_dev(lod)->ld_site)->ss_node_id; - RETURN(rc); + *type = LU_SEQ_RANGE_MDT; + RETURN(0); } server_fld = lu_site2seq(lod2lu_dev(lod)->ld_site)->ss_server_fld; - range.lsr_flags = flags; + fld_range_set_type(&range, *type); rc = fld_server_lookup(env, server_fld, fid_seq(fid), &range); - if (rc) { - CERROR("%s: Can't find tgt by seq "LPX64", rc %d\n", - lod2obd(lod)->obd_name, fid_seq(fid), rc); + if (rc != 0) RETURN(rc); - } *tgt = range.lsr_index; + *type = range.lsr_flags; - CDEBUG(D_INFO, "LOD: got tgt %x for sequence: " - LPX64"\n", *tgt, fid_seq(fid)); + CDEBUG(D_INFO, "%s: got tgt %x for sequence: "LPX64"\n", + lod2obd(lod)->obd_name, *tgt, fid_seq(fid)); - RETURN(rc); + RETURN(0); } -extern struct lu_object_operations 
lod_lu_obj_ops; -extern struct dt_object_operations lod_obj_ops; - /* Slab for OSD object allocation */ -cfs_mem_cache_t *lod_object_kmem; +struct kmem_cache *lod_object_kmem; static struct lu_kmem_descr lod_caches[] = { { @@ -113,25 +173,48 @@ static struct lu_kmem_descr lod_caches[] = { static struct lu_device *lod_device_fini(const struct lu_env *env, struct lu_device *d); -struct lu_object *lod_object_alloc(const struct lu_env *env, - const struct lu_object_header *hdr, - struct lu_device *dev) +/** + * Implementation of lu_device_operations::ldo_object_alloc() for LOD + * + * Allocates and initializes LOD's slice in the given object. + * + * see include/lu_object.h for the details. + */ +static struct lu_object *lod_object_alloc(const struct lu_env *env, + const struct lu_object_header *hdr, + struct lu_device *dev) { - struct lu_object *lu_obj; - struct lod_object *lo; + struct lod_object *lod_obj; + struct lu_object *lu_obj; + ENTRY; - OBD_SLAB_ALLOC_PTR_GFP(lo, lod_object_kmem, CFS_ALLOC_IO); - if (lo == NULL) - return NULL; + OBD_SLAB_ALLOC_PTR_GFP(lod_obj, lod_object_kmem, GFP_NOFS); + if (lod_obj == NULL) + RETURN(ERR_PTR(-ENOMEM)); - lu_obj = lod2lu_obj(lo); - dt_object_init(&lo->ldo_obj, NULL, dev); - lo->ldo_obj.do_ops = &lod_obj_ops; + lu_obj = lod2lu_obj(lod_obj); + dt_object_init(&lod_obj->ldo_obj, NULL, dev); + lod_obj->ldo_obj.do_ops = &lod_obj_ops; lu_obj->lo_ops = &lod_lu_obj_ops; - return lu_obj; + RETURN(lu_obj); } +/** + * Cleanup table of target's descriptors. + * + * The function goes through all the targets in the given table + * and apply given configuration command on to the targets. + * Used to cleanup the targets at unmount. 
+ * + * \param[in] env LU environment provided by the caller + * \param[in] lod lod device + * \param[in] ltd target's table to go through + * \param[in] lcfg configuration command to apply + * + * \retval 0 on success + * \retval negative negated errno on error + **/ static int lod_cleanup_desc_tgts(const struct lu_env *env, struct lod_device *lod, struct lod_tgt_descs *ltd, @@ -139,7 +222,7 @@ static int lod_cleanup_desc_tgts(const struct lu_env *env, { struct lu_device *next; int rc = 0; - int i; + unsigned int i; lod_getref(ltd); if (ltd->ltd_tgts_size <= 0) { @@ -165,11 +248,22 @@ static int lod_cleanup_desc_tgts(const struct lu_env *env, return rc; } -static int lodname2mdt_index(char *lodname, int *index) +/** + * Extract MDT target index from a device name. + * + * a helper function to extract index from the given device name + * like "fsname-MDTxxxx-mdtlov" + * + * \param[in] lodname device name + * \param[out] index extracted index + * + * \retval 0 on success + * \retval -EINVAL if the name is invalid + */ +static int lodname2mdt_index(char *lodname, long *index) { char *ptr, *tmp; - /* The lodname suppose to be fsname-MDTxxxx-mdtlov */ ptr = strrchr(lodname, '-'); if (ptr == NULL) { CERROR("invalid MDT index in '%s'\n", lodname); @@ -199,6 +293,39 @@ static int lodname2mdt_index(char *lodname, int *index) return 0; } +/** + * Implementation of lu_device_operations::ldo_process_config() for LOD + * + * The method is called by the configuration subsystem during setup, + * cleanup and when the configuration changes. The method processes + * few specific commands like adding/removing the targets, changing + * the runtime parameters. + + * \param[in] env LU environment provided by the caller + * \param[in] dev lod device + * \param[in] lcfg configuration command to apply + * + * \retval 0 on success + * \retval negative negated errno on error + * + * The examples are below. 
+ * + * Add osc config log: + * marker 20 (flags=0x01, v2.2.49.56) lustre-OST0001 'add osc' + * add_uuid nid=192.168.122.162@tcp(0x20000c0a87aa2) 0: 1:nidxxx + * attach 0:lustre-OST0001-osc-MDT0001 1:osc 2:lustre-MDT0001-mdtlov_UUID + * setup 0:lustre-OST0001-osc-MDT0001 1:lustre-OST0001_UUID 2:nid + * lov_modify_tgts add 0:lustre-MDT0001-mdtlov 1:lustre-OST0001_UUID 2:1 3:1 + * marker 20 (flags=0x02, v2.2.49.56) lustre-OST0001 'add osc' + * + * Add mdc config log: + * marker 10 (flags=0x01, v2.2.49.56) lustre-MDT0000 'add osp' + * add_uuid nid=192.168.122.162@tcp(0x20000c0a87aa2) 0: 1:nid + * attach 0:lustre-MDT0000-osp-MDT0001 1:osp 2:lustre-MDT0001-mdtlov_UUID + * setup 0:lustre-MDT0000-osp-MDT0001 1:lustre-MDT0000_UUID 2:nid + * modify_mdc_tgts add 0:lustre-MDT0001 1:lustre-MDT0000_UUID 2:0 3:1 + * marker 10 (flags=0x02, v2.2.49.56) lustre-MDT0000_UUID 'add osp' + */ static int lod_process_config(const struct lu_env *env, struct lu_device *dev, struct lustre_cfg *lcfg) @@ -235,10 +362,13 @@ static int lod_process_config(const struct lu_env *env, if (mdt == NULL) { mdt_index = 0; } else { + long long_index; rc = lodname2mdt_index( - lustre_cfg_string(lcfg, 0), &mdt_index); + lustre_cfg_string(lcfg, 0), + &long_index); if (rc != 0) GOTO(out, rc); + mdt_index = long_index; } rc = lod_add_device(env, lod, arg1, index, gen, mdt_index, LUSTRE_OSC_NAME, 1); @@ -254,27 +384,28 @@ static int lod_process_config(const struct lu_env *env, } else { rc = lod_del_device(env, lod, &lod->lod_ost_descs, - arg1, index, gen); + arg1, index, gen, true); } break; } case LCFG_PARAM: { - struct lprocfs_static_vars v = { 0 }; - struct obd_device *obd = lod2obd(lod); - - lprocfs_lod_init_vars(&v); + struct obd_device *obd = lod2obd(lod); - rc = class_process_proc_param(PARAM_LOV, v.obd_vars, lcfg, obd); + rc = class_process_proc_param(PARAM_LOV, obd->obd_vars, + lcfg, obd); if (rc > 0) rc = 0; GOTO(out, rc); } case LCFG_CLEANUP: + case LCFG_PRE_CLEANUP: { 
lu_dev_del_linkage(dev->ld_site, dev); lod_cleanup_desc_tgts(env, lod, &lod->lod_mdt_descs, lcfg); lod_cleanup_desc_tgts(env, lod, &lod->lod_ost_descs, lcfg); + if (lcfg->lcfg_command == LCFG_PRE_CLEANUP) + break; /* * do cleanup on underlying storage only when * all OSPs are cleaned up, as they use that OSD as well @@ -289,7 +420,7 @@ static int lod_process_config(const struct lu_env *env, if (rc) CERROR("error in disconnect from storage: %d\n", rc); break; - + } default: CERROR("%s: unknown command %u\n", lod2obd(lod)->obd_name, lcfg->lcfg_command); @@ -301,12 +432,21 @@ out: RETURN(rc); } +/** + * Implementation of lu_device_operations::ldo_recovery_complete() for LOD + * + * The method is called once the recovery is complete. This implementation + * distributes the notification to all the known targets. + * + * see include/lu_object.h for the details + */ static int lod_recovery_complete(const struct lu_env *env, struct lu_device *dev) { struct lod_device *lod = lu2lod_dev(dev); struct lu_device *next = &lod->lod_child->dd_lu_dev; - int i, rc; + unsigned int i; + int rc; ENTRY; LASSERT(lod->lod_recovery_completed == 0); @@ -331,6 +471,11 @@ static int lod_recovery_complete(const struct lu_env *env, RETURN(rc); } +/** + * Implementation of lu_device_operations::ldo_prepare() for LOD + * + * see include/lu_object.h for the details. + */ static int lod_prepare(const struct lu_env *env, struct lu_device *pdev, struct lu_device *cdev) { @@ -358,36 +503,117 @@ const struct lu_device_operations lod_lu_ops = { .ldo_prepare = lod_prepare, }; +/** + * Implementation of dt_device_operations::dt_root_get() for LOD + * + * see include/dt_object.h for the details. + */ static int lod_root_get(const struct lu_env *env, struct dt_device *dev, struct lu_fid *f) { return dt_root_get(env, dt2lod_dev(dev)->lod_child, f); } +/** + * Implementation of dt_device_operations::dt_statfs() for LOD + * + * see include/dt_object.h for the details. 
+ */ static int lod_statfs(const struct lu_env *env, struct dt_device *dev, struct obd_statfs *sfs) { return dt_statfs(env, dt2lod_dev(dev)->lod_child, sfs); } +/** + * Implementation of dt_device_operations::dt_trans_create() for LOD + * + * Creates a transaction using local (to this node) OSD. + * + * see include/dt_object.h for the details. + */ static struct thandle *lod_trans_create(const struct lu_env *env, struct dt_device *dev) { - return dt_trans_create(env, dt2lod_dev(dev)->lod_child); + struct thandle *th; + + th = dt_trans_create(env, dt2lod_dev(dev)->lod_child); + if (IS_ERR(th)) + return th; + + return th; } +/** + * Implementation of dt_device_operations::dt_trans_start() for LOD + * + * Starts the set of local transactions using the targets involved + * in declare phase. Initial support for the distributed transactions. + * + * see include/dt_object.h for the details. + */ static int lod_trans_start(const struct lu_env *env, struct dt_device *dev, struct thandle *th) { - return dt_trans_start(env, dt2lod_dev(dev)->lod_child, th); + struct lod_device *lod = dt2lod_dev((struct dt_device *) dev); + int rc = 0; + + if (unlikely(th->th_update != NULL)) { + struct thandle_update *tu = th->th_update; + struct dt_update_request *update; + + list_for_each_entry(update, &tu->tu_remote_update_list, + dur_list) { + LASSERT(update->dur_dt != NULL); + rc = dt_trans_start(env, update->dur_dt, th); + if (rc != 0) + return rc; + } + } + return dt_trans_start(env, lod->lod_child, th); } -static int lod_trans_stop(const struct lu_env *env, struct thandle *th) +/** + * Implementation of dt_device_operations::dt_trans_stop() for LOD + * + * Stops the set of local transactions using the targets involved + * in declare phase. Initial support for the distributed transactions. + * + * see include/dt_object.h for the details. 
+ */ +static int lod_trans_stop(const struct lu_env *env, struct dt_device *dt, + struct thandle *th) { - /* XXX: we don't know next device, will be fixed with DNE */ - return dt_trans_stop(env, th->th_dev, th); + struct thandle_update *tu = th->th_update; + struct dt_update_request *update; + struct dt_update_request *tmp; + int rc2 = 0; + int rc; + ENTRY; + + rc = dt_trans_stop(env, th->th_dev, th); + if (likely(tu == NULL)) + RETURN(rc); + + list_for_each_entry_safe(update, tmp, + &tu->tu_remote_update_list, + dur_list) { + /* update will be freed inside dt_trans_stop */ + rc2 = dt_trans_stop(env, update->dur_dt, th); + if (unlikely(rc2 != 0 && rc == 0)) + rc = rc2; + } + + RETURN(rc); } +/** + * Implementation of dt_device_operations::dt_conf_get() for LOD + * + * Currently returns the configuration provided by the local OSD. + * + * see include/dt_object.h for the details. + */ static void lod_conf_get(const struct lu_env *env, const struct dt_device *dev, struct dt_device_param *param) @@ -395,11 +621,20 @@ static void lod_conf_get(const struct lu_env *env, dt_conf_get(env, dt2lod_dev((struct dt_device *)dev)->lod_child, param); } +/** + * Implementation of dt_device_operations::dt_sync() for LOD + * + * Syncs all known OST targets. Very very expensive and used + * rarely by LFSCK now. Should not be used in general. + * + * see include/dt_object.h for the details. + */ static int lod_sync(const struct lu_env *env, struct dt_device *dev) { struct lod_device *lod = dt2lod_dev(dev); struct lod_ost_desc *ost; - int rc = 0, i; + unsigned int i; + int rc = 0; ENTRY; lod_getref(&lod->lod_ost_descs); @@ -420,16 +655,33 @@ static int lod_sync(const struct lu_env *env, struct dt_device *dev) RETURN(rc); } +/** + * Implementation of dt_device_operations::dt_ro() for LOD + * + * Turns local OSD read-only, used for the testing only. + * + * see include/dt_object.h for the details. 
+ */ static int lod_ro(const struct lu_env *env, struct dt_device *dev) { return dt_ro(env, dt2lod_dev(dev)->lod_child); } +/** + * Implementation of dt_device_operations::dt_commit_async() for LOD + * + * Asks local OSD to commit sooner. + * + * see include/dt_object.h for the details. + */ static int lod_commit_async(const struct lu_env *env, struct dt_device *dev) { return dt_commit_async(env, dt2lod_dev(dev)->lod_child); } +/** + * Not used + */ static int lod_init_capa_ctxt(const struct lu_env *env, struct dt_device *dev, int mode, unsigned long timeout, __u32 alg, struct lustre_capa_key *keys) @@ -451,6 +703,20 @@ static const struct dt_device_operations lod_dt_ops = { .dt_init_capa_ctxt = lod_init_capa_ctxt, }; +/** + * Connect to a local OSD. + * + * Used to connect to the local OSD at mount. OSD name is taken from the + * configuration command passed. This connection is used to identify LU + * site and pin the OSD from early removal. + * + * \param[in] env LU environment provided by the caller + * \param[in] lod lod device + * \param[in] cfg configuration command to apply + * + * \retval 0 on success + * \retval negative negated errno on error + **/ static int lod_connect_to_osd(const struct lu_env *env, struct lod_device *lod, struct lustre_cfg *cfg) { @@ -535,6 +801,17 @@ out: RETURN(rc); } +/** + * Allocate and initialize target table. + * + * A helper function to initialize the target table and allocate + * a bitmap of the available targets. + * + * \param[in] ltd target's table to initialize + * + * \retval 0 on success + * \retval negative negated errno on error + **/ static int lod_tgt_desc_init(struct lod_tgt_descs *ltd) { mutex_init(&ltd->ltd_mutex); @@ -554,6 +831,21 @@ static int lod_tgt_desc_init(struct lod_tgt_descs *ltd) return 0; } +/** + * Initialize LOD device at setup. + * + * Initializes the given LOD device using the original configuration command. 
+ * The function initiates a connection to the local OSD and initializes few + * internal structures like pools, target tables, etc. + * + * \param[in] env LU environment provided by the caller + * \param[in] lod lod device + * \param[in] ldt not used + * \param[in] cfg configuration command + * + * \retval 0 on success + * \retval negative negated errno on error + **/ static int lod_init0(const struct lu_env *env, struct lod_device *lod, struct lu_device_type *ldt, struct lustre_cfg *cfg) { @@ -604,6 +896,13 @@ out_disconnect: RETURN(rc); } +/** + * Implementation of lu_device_type_operations::ldto_device_free() for LOD + * + * Releases the memory allocated for LOD device. + * + * see include/lu_object.h for the details. + */ static struct lu_device *lod_device_free(const struct lu_env *env, struct lu_device *lu) { @@ -611,12 +910,19 @@ static struct lu_device *lod_device_free(const struct lu_env *env, struct lu_device *next = &lod->lod_child->dd_lu_dev; ENTRY; - LASSERT(cfs_atomic_read(&lu->ld_ref) == 0); + LASSERT(atomic_read(&lu->ld_ref) == 0); dt_device_fini(&lod->lod_dt_dev); OBD_FREE_PTR(lod); RETURN(next); } +/** + * Implementation of lu_device_type_operations::ldto_device_alloc() for LOD + * + * Allocates LOD device and calls the helpers to initialize it. + * + * see include/lu_object.h for the details. + */ static struct lu_device *lod_device_alloc(const struct lu_env *env, struct lu_device_type *type, struct lustre_cfg *lcfg) @@ -642,6 +948,13 @@ static struct lu_device *lod_device_alloc(const struct lu_env *env, return lu_dev; } +/** + * Implementation of lu_device_type_operations::ldto_device_fini() for LOD + * + * Releases the internal resources used by LOD device. + * + * see include/lu_object.h for the details. 
+ */ static struct lu_device *lod_device_fini(const struct lu_env *env, struct lu_device *d) { @@ -653,12 +966,12 @@ static struct lu_device *lod_device_fini(const struct lu_env *env, lod_procfs_fini(lod); - rc = lod_fini_tgt(lod, &lod->lod_ost_descs); + rc = lod_fini_tgt(env, lod, &lod->lod_ost_descs, true); if (rc) CERROR("%s:can not fini ost descs %d\n", lod2obd(lod)->obd_name, rc); - rc = lod_fini_tgt(lod, &lod->lod_mdt_descs); + rc = lod_fini_tgt(env, lod, &lod->lod_mdt_descs, false); if (rc) CERROR("%s:can not fini mdt descs %d\n", lod2obd(lod)->obd_name, rc); @@ -666,9 +979,22 @@ static struct lu_device *lod_device_fini(const struct lu_env *env, RETURN(NULL); } -/* - * we use exports to track all LOD users - */ +/** + * Implementation of obd_ops::o_connect() for LOD + * + * Used to track all the users of this specific LOD device, + * so the device stays up until the last user has disconnected. + * + * \param[in] env LU environment provided by the caller + * \param[out] exp export the caller will be using to access LOD + * \param[in] obd OBD device representing LOD device + * \param[in] cluuid unique identifier of the caller + * \param[in] data not used + * \param[in] localdata not used + * + * \retval 0 on success + * \retval negative negated errno on error + **/ static int lod_obd_connect(const struct lu_env *env, struct obd_export **exp, struct obd_device *obd, struct obd_uuid *cluuid, struct obd_connect_data *data, void *localdata) @@ -695,10 +1021,19 @@ static int lod_obd_connect(const struct lu_env *env, struct obd_export **exp, RETURN(0); } -/* - * once last export (we don't count self-export) disappeared - * lod can be released - */ +/** + * + * Implementation of obd_ops::o_disconnect() for LOD + * + * When the caller no longer needs to use this LOD instance, it calls + * obd_disconnect() and LOD releases the corresponding export/reference count. + * Once all the users are gone, the LOD device is released. 
+ * + * \param[in] exp export provided to the caller in obd_connect() + * + * \retval 0 on success + * \retval negative negated errno on error + **/ static int lod_obd_disconnect(struct obd_export *exp) { struct obd_device *obd = exp->exp_obd; @@ -744,6 +1079,7 @@ static void lod_key_fini(const struct lu_context *ctx, info->lti_ea_store = NULL; info->lti_ea_store_size = 0; } + lu_buf_free(&info->lti_linkea_buf); OBD_FREE_PTR(info); } @@ -772,25 +1108,57 @@ static struct lu_device_type lod_device_type = { .ldt_ctx_tags = LCT_MD_THREAD, }; -static int lod_obd_health_check(const struct lu_env *env, - struct obd_device *obd) +/** + * Implementation of obd_ops::o_get_info() for LOD + * + * Currently, there is only one supported key: KEY_OSP_CONNECTED, which tells + * the caller whether LOD has seen a connection to any OST target. + * + * \param[in] env LU environment provided by the caller + * \param[in] exp export of the caller + * \param[in] keylen len of the key + * \param[in] key the key + * \param[in] vallen passed through to obd_get_info() on each OST target + * \param[in] val passed through to obd_get_info() on each OST target + * \param[in] lsm passed through to obd_get_info() on each OST target + * + * \retval 0 if a connection was seen + * \retval -EAGAIN if LOD isn't running yet or no + * connection has been seen yet + * \retval -EINVAL if an unsupported key is requested + **/ +static int lod_obd_get_info(const struct lu_env *env, struct obd_export *exp, + __u32 keylen, void *key, __u32 *vallen, void *val, + struct lov_stripe_md *lsm) { - struct lod_device *d = lu2lod_dev(obd->obd_lu_dev); - struct lod_ost_desc *ost; - int i, rc = 1; - ENTRY; - - LASSERT(d); - lod_getref(&d->lod_ost_descs); - lod_foreach_ost(d, i) { - ost = OST_TGT(d, i); - LASSERT(ost && ost->ltd_ost); - rc = obd_health_check(env, ost->ltd_exp->exp_obd); - /* one healthy device is enough */ - if (rc == 0) - break; + int rc = -EINVAL; + + if (KEY_IS(KEY_OSP_CONNECTED)) { + struct obd_device *obd 
= exp->exp_obd; + struct lod_device *d; + struct lod_ost_desc *ost; + unsigned int i; + int rc = 1; + + if 
(!obd->obd_set_up || obd->obd_stopping) + RETURN(-EAGAIN); + + d = lu2lod_dev(obd->obd_lu_dev); + lod_getref(&d->lod_ost_descs); + lod_foreach_ost(d, i) { + ost = OST_TGT(d, i); + LASSERT(ost && ost->ltd_ost); + + rc = obd_get_info(env, ost->ltd_exp, keylen, key, + vallen, val, lsm); + /* one healthy device is enough */ + if (rc == 0) + break; + } + lod_putref(d, &d->lod_ost_descs); + RETURN(rc); } - lod_putref(d, &d->lod_ost_descs); + RETURN(rc); } @@ -798,7 +1166,7 @@ static struct obd_ops lod_obd_device_ops = { .o_owner = THIS_MODULE, .o_connect = lod_obd_connect, .o_disconnect = lod_obd_disconnect, - .o_health_check = lod_obd_health_check, + .o_get_info = lod_obd_get_info, .o_pool_new = lod_pool_new, .o_pool_rem = lod_pool_remove, .o_pool_add = lod_pool_add, @@ -807,17 +1175,14 @@ static struct obd_ops lod_obd_device_ops = { static int __init lod_mod_init(void) { - struct lprocfs_static_vars lvars = { 0 }; - cfs_proc_dir_entry_t *lov_proc_dir; - int rc; + struct obd_type *type; + int rc; rc = lu_kmem_init(lod_caches); if (rc) return rc; - lprocfs_lod_init_vars(&lvars); - - rc = class_register_type(&lod_obd_device_ops, NULL, lvars.module_vars, + rc = class_register_type(&lod_obd_device_ops, NULL, true, NULL, LUSTRE_LOD_NAME, &lod_device_type); if (rc) { lu_kmem_fini(lod_caches); @@ -825,23 +1190,23 @@ static int __init lod_mod_init(void) } /* create "lov" entry in procfs for compatibility purposes */ - lov_proc_dir = lprocfs_srch(proc_lustre_root, "lov"); - if (lov_proc_dir == NULL) { - lov_proc_dir = lprocfs_register("lov", proc_lustre_root, - NULL, NULL); - if (IS_ERR(lov_proc_dir)) - CERROR("lod: can't create compat entry \"lov\": %d\n", - (int)PTR_ERR(lov_proc_dir)); - } + type = class_search_type(LUSTRE_LOV_NAME); + if (type != NULL && type->typ_procroot != NULL) + return rc; + type = class_search_type(LUSTRE_LOD_NAME); + type->typ_procsym = lprocfs_seq_register("lov", proc_lustre_root, + NULL, NULL); + if (IS_ERR(type->typ_procsym)) { + CERROR("lod: can't 
create compat entry \"lov\": %d\n", + (int)PTR_ERR(type->typ_procsym)); + type->typ_procsym = NULL; + } return rc; } static void __exit lod_mod_exit(void) { - - lprocfs_try_remove_proc_entry("lov", proc_lustre_root); - class_unregister_type(LUSTRE_LOD_NAME); lu_kmem_fini(lod_caches); }