#include <linux/obd_class.h>
#include <linux/random.h>
#include <linux/slab.h>
-#else
+#include <linux/pagemap.h>
+#else
#include <liblustre.h>
#include <linux/obd_class.h>
#include <linux/obd.h>
+/* Function-pointer hooks.  They are declared without an initializer here and
+ * are called from this file when an export's connection is released and when
+ * an import is destroyed.  Where they get assigned is not visible in this
+ * file -- presumably the ptlrpc module installs them; TODO confirm. */
int (*ptlrpc_put_connection_superhack)(struct ptlrpc_connection *c);
void (*ptlrpc_abort_inflight_superhack)(struct obd_import *imp);
-struct obd_uuid lctl_fake_uuid = { .uuid = "OBD_CLASS_UUID" };
-
/*
* support functions: we could use inter-module communication, but this
* is more portable to other OS's
}
#endif
if (type)
- __MOD_INC_USE_COUNT(type->typ_ops->o_owner);
+ try_module_get(type->typ_ops->o_owner);
return type;
}
+/* Release the module reference held through a type: asserts type is
+ * non-NULL, then drops the use count on type->typ_ops->o_owner. */
void class_put_type(struct obd_type *type)
{
LASSERT(type);
- __MOD_DEC_USE_COUNT(type->typ_ops->o_owner);
+ module_put(type->typ_ops->o_owner);
}
-int class_register_type(struct obd_ops *ops, struct lprocfs_vars *vars,
- char *name)
+int class_register_type(struct obd_ops *ops, struct md_ops *md_ops,
+ struct lprocfs_vars *vars, char *name)
{
struct obd_type *type;
int rc = 0;
OBD_ALLOC(type->typ_ops, sizeof(*type->typ_ops));
OBD_ALLOC(type->typ_name, strlen(name) + 1);
- if (type->typ_ops == NULL || type->typ_name == NULL)
+ if (md_ops)
+ OBD_ALLOC(type->typ_md_ops, sizeof(*type->typ_md_ops));
+ if (type->typ_ops == NULL || type->typ_name == NULL ||
+ (md_ops && type->typ_md_ops == NULL))
GOTO (failed, rc);
*(type->typ_ops) = *ops;
+ if (md_ops)
+ *(type->typ_md_ops) = *md_ops;
+ else
+ type->typ_md_ops = NULL;
strcpy(type->typ_name, name);
+#ifdef LPROCFS
type->typ_procroot = lprocfs_register(type->typ_name, proc_lustre_root,
vars, type);
+#endif
if (IS_ERR(type->typ_procroot)) {
rc = PTR_ERR(type->typ_procroot);
type->typ_procroot = NULL;
RETURN (0);
failed:
- if (type->typ_ops != NULL)
+ if (type->typ_name != NULL)
OBD_FREE(type->typ_name, strlen(name) + 1);
if (type->typ_ops != NULL)
OBD_FREE (type->typ_ops, sizeof (*type->typ_ops));
+ if (type->typ_md_ops != NULL)
+ OBD_FREE (type->typ_md_ops, sizeof (*type->typ_md_ops));
+ OBD_FREE(type, sizeof(*type));
RETURN(rc);
}
OBD_FREE(type->typ_name, strlen(name) + 1);
if (type->typ_ops != NULL)
OBD_FREE(type->typ_ops, sizeof(*type->typ_ops));
+ if (type->typ_md_ops != NULL)
+ OBD_FREE (type->typ_md_ops, sizeof (*type->typ_md_ops));
OBD_FREE(type, sizeof(*type));
RETURN(0);
} /* class_unregister_type */
+/* Find the first slot in obd_dev[] whose obd_type is unset.
+ * Returns a pointer to that slot, or NULL when every one of the
+ * MAX_OBD_DEVICES slots already has a type.  If dev is non-NULL the slot
+ * index is stored in *dev; *dev is left untouched when nothing is found. */
+struct obd_device *class_newdev(int *dev)
+{
+        int idx;
+
+        for (idx = 0; idx < MAX_OBD_DEVICES; idx++) {
+                if (obd_dev[idx].obd_type)
+                        continue;
+
+                if (dev)
+                        *dev = idx;
+                return &obd_dev[idx];
+        }
+
+        return NULL;
+}
+
int class_name2dev(char *name)
{
int i;
return -1;
}
+/* Look a device up by name through class_name2dev().  Returns its
+ * obd_dev[] slot, or NULL when class_name2dev() yields a negative index. */
+struct obd_device *class_name2obd(char *name)
+{
+        int idx = class_name2dev(name);
+
+        return (idx >= 0) ? &obd_dev[idx] : NULL;
+}
+
int class_uuid2dev(struct obd_uuid *uuid)
{
int i;
+/* Look a device up by UUID through class_uuid2dev().  Returns its
+ * obd_dev[] slot, or NULL when class_uuid2dev() yields a negative index. */
struct obd_device *class_uuid2obd(struct obd_uuid *uuid)
{
+        int idx = class_uuid2dev(uuid);
+
+        return (idx >= 0) ? &obd_dev[idx] : NULL;
+}
+
+/* Search obd_dev[] for a client OBD of type typ_name connected to tgt_uuid.
+ * If grp_uuid is specified, only a client whose own obd_uuid equals it is
+ * returned; otherwise the first client connected to the target is returned.
+ * If tgt_uuid is NULL, grp_uuid must be set (LASSERT) and the device of that
+ * type whose obd_uuid equals grp_uuid is returned (the lov).
+ * Returns NULL when nothing matches.
+ *
+ * NOTE(review): the type comparison is a strncmp() over strlen(typ_name)
+ * bytes, i.e. a prefix match on the registered type name -- confirm that is
+ * intended.  cl_import is used without a NULL check; presumably callers only
+ * pass client types whose import is already set up -- TODO confirm. */
+struct obd_device * class_find_client_obd(struct obd_uuid *tgt_uuid,
+ char * typ_name,
+ struct obd_uuid *grp_uuid)
+{
int i;
for (i = 0; i < MAX_OBD_DEVICES; i++) {
struct obd_device *obd = &obd_dev[i];
- if (obd_uuid_equals(uuid, &obd->obd_uuid))
+ /* slots with no type attached cannot match */
+ if (obd->obd_type == NULL)
+ continue;
+ if ((strncmp(obd->obd_type->typ_name, typ_name,
+ strlen(typ_name)) == 0)) {
+ struct client_obd *cli = &obd->u.cli;
+ struct obd_import *imp = cli->cl_import;
+ /* no target given: match on the device's own uuid only */
+ if (tgt_uuid == NULL) {
+ LASSERT(grp_uuid);
+ if (obd_uuid_equals(grp_uuid, &obd->obd_uuid))
+ return obd;
+ continue;
+ }
+ /* target must match; grp_uuid, when given, must match too */
+ if (obd_uuid_equals(tgt_uuid, &imp->imp_target_uuid) &&
+ ((grp_uuid)? obd_uuid_equals(grp_uuid,
+ &obd->obd_uuid) : 1)) {
+ return obd;
+ }
+ }
+ }
+
+ return NULL;
+}
+
+/* Iterate the obd_device list looking for devices whose obd_uuid equals
+ * grp_uuid.  The search starts at index *next; when a device is found, the
+ * index to resume from (match + 1) is stored back in *next.  If next is
+ * NULL the search always starts at 0, so the first matching device is
+ * returned every time.  Returns NULL when *next lies outside
+ * [0, MAX_OBD_DEVICES) or no further device matches; *next is left
+ * unchanged in both of those cases. */
+struct obd_device * class_devices_in_group(struct obd_uuid *grp_uuid, int *next)
+{
+ int i;
+ if (next == NULL)
+ i = 0;
+ else if (*next >= 0 && *next < MAX_OBD_DEVICES)
+ i = *next;
+ else
+ return NULL;
+
+ for (; i < MAX_OBD_DEVICES; i++) {
+ struct obd_device *obd = &obd_dev[i];
+ /* slots with no type attached are skipped */
+ if (obd->obd_type == NULL)
+ continue;
+ if (obd_uuid_equals(grp_uuid, &obd->obd_uuid)) {
+ if (next != NULL)
+ *next = i+1;
return obd;
+ }
}
return NULL;
}
+
void obd_cleanup_caches(void)
{
int rc;
RETURN(export);
}
+/* Return the device an export belongs to (exp->exp_obd), or NULL when
+ * exp itself is NULL. */
+struct obd_device *class_exp2obd(struct obd_export *exp)
+{
+        return exp ? exp->exp_obd : NULL;
+}
+
struct obd_device *class_conn2obd(struct lustre_handle *conn)
{
struct obd_export *export;
return NULL;
}
-struct obd_import *class_conn2cliimp(struct lustre_handle *conn)
+/* Return the client import (u.cli.cl_import) of the device behind exp.
+ * Returns NULL when exp is NULL or has no exp_obd, so a NULL export is
+ * tolerated the same way class_exp2obd() tolerates it. */
+struct obd_import *class_exp2cliimp(struct obd_export *exp)
{
- return class_conn2obd(conn)->u.cli.cl_import;
+        struct obd_device *obd;
+
+        /* Guard exp itself before it is dereferenced. */
+        if (exp == NULL)
+                return NULL;
+
+        obd = exp->exp_obd;
+        if (obd == NULL)
+                return NULL;
+        return obd->u.cli.cl_import;
}
-struct obd_import *class_conn2ldlmimp(struct lustre_handle *conn)
+/* Resolve conn to its device with class_conn2obd() and return that
+ * device's client import (u.cli.cl_import); NULL when no device is found. */
+struct obd_import *class_conn2cliimp(struct lustre_handle *conn)
{
- struct obd_export *export;
- export = class_conn2export(conn);
- if (export) {
- struct obd_import *imp = export->exp_ldlm_data.led_import;
- class_export_put(export);
- return imp;
- }
- fixme();
- return NULL;
+        struct obd_device *dev = class_conn2obd(conn);
+
+        return (dev != NULL) ? dev->u.cli.cl_import : NULL;
}
/* Export management functions */
class_export_get(export);
}
-struct obd_export *class_export_get(struct obd_export *exp)
+void __class_export_put(struct obd_export *exp)
{
- atomic_inc(&exp->exp_refcount);
- CDEBUG(D_INFO, "GETting export %p : new refcount %d\n", exp,
- atomic_read(&exp->exp_refcount));
- return exp;
-}
-
-void class_export_put(struct obd_export *exp)
-{
- ENTRY;
-
- CDEBUG(D_INFO, "PUTting export %p : new refcount %d\n", exp,
- atomic_read(&exp->exp_refcount) - 1);
- LASSERT(atomic_read(&exp->exp_refcount) > 0);
- LASSERT(atomic_read(&exp->exp_refcount) < 0x5a5a5a);
if (atomic_dec_and_test(&exp->exp_refcount)) {
struct obd_device *obd = exp->exp_obd;
CDEBUG(D_IOCTL, "destroying export %p/%s\n", exp,
if (exp->exp_connection)
ptlrpc_put_connection_superhack(exp->exp_connection);
+ LASSERT(list_empty(&exp->exp_outstanding_replies));
LASSERT(list_empty(&exp->exp_handle.h_link));
-
obd_destroy_export(exp);
OBD_FREE(exp, sizeof(*exp));
- atomic_dec(&obd->obd_refcount);
- wake_up(&obd->obd_refcount_waitq);
+ if (obd->obd_set_up) {
+ atomic_dec(&obd->obd_refcount);
+ wake_up(&obd->obd_refcount_waitq);
+ } else {
+ CERROR("removing export %p from obd %s (%p) -- OBD "
+ "not set up (refcount = %d)\n", exp,
+ obd->obd_name, obd,
+ atomic_read(&obd->obd_refcount));
+ }
}
- EXIT;
}
-struct obd_export *class_new_export(struct obd_device *obddev)
+/* Creates a new export, adds it to the hash table, and returns a
+ * pointer to it. The refcount is 2: one for the hash reference, and
+ * one for the pointer returned by this function.
+ * Also takes a reference on obd (obd_refcount), links the export onto
+ * obd->obd_exports and bumps obd_num_exports while holding obd_dev_lock,
+ * then calls obd_init_export().  Returns NULL if the allocation fails. */
+struct obd_export *class_new_export(struct obd_device *obd)
{
struct obd_export *export;
OBD_ALLOC(export, sizeof(*export));
if (!export) {
- CERROR("no memory! (minor %d)\n", obddev->obd_minor);
+ CERROR("no memory! (minor %d)\n", obd->obd_minor);
return NULL;
}
+ export->exp_conn_cnt = 0;
atomic_set(&export->exp_refcount, 2);
- export->exp_obd = obddev;
+ atomic_set(&export->exp_rpc_count, 0);
+ export->exp_obd = obd;
+ INIT_LIST_HEAD(&export->exp_outstanding_replies);
/* XXX this should be in LDLM init */
INIT_LIST_HEAD(&export->exp_ldlm_data.led_held_locks);
class_handle_hash(&export->exp_handle, export_handle_addref);
spin_lock_init(&export->exp_lock);
- spin_lock(&obddev->obd_dev_lock);
- LASSERT(!obddev->obd_stopping); /* shouldn't happen, but might race */
- atomic_inc(&obddev->obd_refcount);
+ /* device refcount, export list and export count change together
+ * under obd_dev_lock */
+ spin_lock(&obd->obd_dev_lock);
+ LASSERT(!obd->obd_stopping); /* shouldn't happen, but might race */
+ atomic_inc(&obd->obd_refcount);
list_add(&export->exp_obd_chain, &export->exp_obd->obd_exports);
- spin_unlock(&obddev->obd_dev_lock);
+ export->exp_obd->obd_num_exports++;
+ spin_unlock(&obd->obd_dev_lock);
+ obd_init_export(export);
return export;
}
spin_lock(&exp->exp_obd->obd_dev_lock);
list_del_init(&exp->exp_obd_chain);
+ exp->exp_obd->obd_num_exports--;
spin_unlock(&exp->exp_obd->obd_dev_lock);
class_export_put(exp);
INIT_LIST_HEAD(&imp->imp_sending_list);
INIT_LIST_HEAD(&imp->imp_delayed_list);
spin_lock_init(&imp->imp_lock);
+ imp->imp_conn_cnt = 0;
imp->imp_max_transno = 0;
imp->imp_peer_committed_transno = 0;
+ imp->imp_state = LUSTRE_IMP_NEW;
+ init_waitqueue_head(&imp->imp_recovery_waitq);
atomic_set(&imp->imp_refcount, 2);
+ atomic_set(&imp->imp_inflight, 0);
+ atomic_set(&imp->imp_replay_inflight, 0);
INIT_LIST_HEAD(&imp->imp_handle.h_link);
class_handle_hash(&imp->imp_handle, import_handle_addref);
+/* Tear down an import: asserts it is neither NULL nor LP_POISON, unhashes
+ * its handle, bumps imp_generation, calls the abort-inflight hook and then
+ * drops a reference with class_import_put(). */
void class_destroy_import(struct obd_import *import)
{
LASSERT(import != NULL);
+ LASSERT(import != LP_POISON);
class_handle_unhash(&import->imp_handle);
/* Abort any inflight DLM requests and NULL out their (about to be
* freed) import. */
+ /* Invalidate all requests on import, would be better to call
+ ptlrpc_set_import_active(imp, 0); */
+ import->imp_generation++;
ptlrpc_abort_inflight_superhack(import);
class_import_put(import);
}
-/* a connection defines an export context in which preallocation can
- be managed. */
-int class_connect(struct lustre_handle *exporth, struct obd_device *obd,
+/* A connection defines an export context in which preallocation can
+ * be managed.  Creates a new export on obd via class_new_export(), stores
+ * its handle cookie in conn->cookie and copies cluuid into the export's
+ * exp_client_uuid.  The export pointer reference is released before
+ * returning, so the export refcount is 1 when this function returns.
+ * All three arguments must be non-NULL (LASSERT).
+ * Returns 0 on success, or -ENOMEM if no export could be created. */
+int class_connect(struct lustre_handle *conn, struct obd_device *obd,
struct obd_uuid *cluuid)
{
struct obd_export *export;
- LASSERT(exporth != NULL);
+ LASSERT(conn != NULL);
LASSERT(obd != NULL);
LASSERT(cluuid != NULL);
+ ENTRY;
export = class_new_export(obd);
if (export == NULL)
- return -ENOMEM;
+ RETURN(-ENOMEM);
- exporth->cookie = export->exp_handle.h_cookie;
+ conn->cookie = export->exp_handle.h_cookie;
memcpy(&export->exp_client_uuid, cluuid,
sizeof(export->exp_client_uuid));
class_export_put(export);
CDEBUG(D_IOCTL, "connect: client %s, cookie "LPX64"\n",
- cluuid->uuid, exporth->cookie);
- return 0;
+ cluuid->uuid, conn->cookie);
+ RETURN(0);
}
-int class_disconnect(struct lustre_handle *conn, int failover)
+/* This function removes two references from the export: one for the
+ * hash entry and one for the export pointer passed in.  The export
+ * pointer passed to this function is destroyed and should not be used
+ * again.
+ * Returns -EINVAL for a NULL export and 0 otherwise, including the
+ * already-unhashed and poisoned-cookie cases, where nothing is released.
+ * NOTE(review): flags is not referenced anywhere in this body. */
+int class_disconnect(struct obd_export *export, int flags)
{
- struct obd_export *export = class_conn2export(conn);
ENTRY;
if (export == NULL) {
fixme();
- CDEBUG(D_IOCTL, "disconnect: attempting to free "
- "nonexistent client "LPX64"\n", conn->cookie);
+ CDEBUG(D_IOCTL, "attempting to free NULL export %p\n", export);
RETURN(-EINVAL);
}
- CDEBUG(D_IOCTL, "disconnect: cookie "LPX64"\n", conn->cookie);
+ /* XXX this shouldn't have to be here, but double-disconnect will crash
+ * otherwise, and sometimes double-disconnect happens. abort_recovery,
+ * for example. */
+ if (list_empty(&export->exp_handle.h_link))
+ RETURN(0);
- class_unlink_export(export);
- class_export_put(export);
+ CDEBUG(D_IOCTL, "disconnect: cookie "LPX64"\n",
+ export->exp_handle.h_cookie);
+
+ if (export->exp_handle.h_cookie == 0x5a5a5a5a5a5a5a5a) {
+ CERROR("disconnecting freed export %p, ignoring\n", export);
+ } else {
+ class_unlink_export(export);
+ class_export_put(export);
+ }
RETURN(0);
}
-void class_disconnect_exports(struct obd_device *obd, int failover)
+void class_disconnect_exports(struct obd_device *obd, int flags)
{
int rc;
struct list_head *tmp, *n, work_list;
struct lustre_handle fake_conn;
+ struct obd_export *fake_exp, *exp;
ENTRY;
/* Move all of the exports from obd_exports to a work list, en masse. */
list_del_init(&obd->obd_exports);
spin_unlock(&obd->obd_dev_lock);
- CDEBUG(D_IOCTL, "OBD device %d (%p) has exports, "
+ CDEBUG(D_HA, "OBD device %d (%p) has exports, "
"disconnecting them\n", obd->obd_minor, obd);
list_for_each_safe(tmp, n, &work_list) {
- struct obd_export *exp = list_entry(tmp, struct obd_export,
- exp_obd_chain);
-
+ exp = list_entry(tmp, struct obd_export, exp_obd_chain);
class_export_get(exp);
+
+ if (obd_uuid_equals(&exp->exp_client_uuid,
+ &exp->exp_obd->obd_uuid)) {
+ CDEBUG(D_HA,
+ "exp %p export uuid == obd uuid, don't discon\n",
+ exp);
+ /* Need to delete this now so we don't end up pointing
+ * to work_list later when this export is cleaned up. */
+ list_del_init(&exp->exp_obd_chain);
+ class_export_put(exp);
+ continue;
+ }
+
fake_conn.cookie = exp->exp_handle.h_cookie;
- rc = obd_disconnect(&fake_conn, failover);
- /* exports created from last_rcvd data, and "fake"
- exports created by lctl don't have an import */
- if (exp->exp_ldlm_data.led_import != NULL)
- class_destroy_import(exp->exp_ldlm_data.led_import);
+ fake_exp = class_conn2export(&fake_conn);
+ if (!fake_exp) {
+ class_export_put(exp);
+ continue;
+ }
+ rc = obd_disconnect(fake_exp, flags);
class_export_put(exp);
-
if (rc) {
- CDEBUG(D_IOCTL, "disconnecting export %p failed: %d\n",
+ CDEBUG(D_HA, "disconnecting export %p failed: %d\n",
exp, rc);
} else {
- CDEBUG(D_IOCTL, "export %p disconnected\n", exp);
+ CDEBUG(D_HA, "export %p disconnected\n", exp);
}
}
EXIT;
}
+
+/* Allocate and initialise an I/O group.
+ * On success the new group is stored in *oig_out and 0 is returned; the
+ * group starts with a refcount of 1, nothing pending, rc 0 and an empty
+ * callback-context list.  Returns -ENOMEM when the allocation fails, in
+ * which case *oig_out is not written. */
+int oig_init(struct obd_io_group **oig_out)
+{
+        struct obd_io_group *oig;
+        ENTRY;
+
+        OBD_ALLOC(oig, sizeof(*oig));
+        if (oig == NULL)
+                RETURN(-ENOMEM);
+
+        spin_lock_init(&oig->oig_lock);
+        oig->oig_rc = 0;
+        oig->oig_pending = 0;
+        atomic_set(&oig->oig_refcount, 1);
+        init_waitqueue_head(&oig->oig_waitq);
+        INIT_LIST_HEAD(&oig->oig_occ_list);
+
+        *oig_out = oig;
+        RETURN(0);
+}
+
+/* Take one additional reference on an I/O group. */
+static inline void oig_grab(struct obd_io_group *oig)
+{
+ atomic_inc(&oig->oig_refcount);
+}
+/* Drop one reference on an I/O group; the group is freed when the
+ * reference count reaches zero. */
+void oig_release(struct obd_io_group *oig)
+{
+        if (!atomic_dec_and_test(&oig->oig_refcount))
+                return;
+
+        OBD_FREE(oig, sizeof(*oig));
+}
+
+/* Account for one more outstanding item in the group: bumps oig_pending
+ * and, when occ is non-NULL, appends it to oig_occ_list, both under
+ * oig_lock.  A group reference is then taken for the item; the matching
+ * release is the oig_release() at the end of oig_complete_one(). */
+void oig_add_one(struct obd_io_group *oig,
+ struct oig_callback_context *occ)
+{
+ unsigned long flags;
+ CDEBUG(D_CACHE, "oig %p ready to roll\n", oig);
+ spin_lock_irqsave(&oig->oig_lock, flags);
+ oig->oig_pending++;
+ if (occ != NULL)
+ list_add_tail(&occ->occ_oig_item, &oig->oig_occ_list);
+ spin_unlock_irqrestore(&oig->oig_lock, flags);
+ /* NOTE(review): the reference is taken after the lock is dropped;
+ * presumably the item cannot complete before this returns -- confirm */
+ oig_grab(oig);
+}
+
+/* Record completion of one item in the group.  Under oig_lock: unlinks occ
+ * (when non-NULL) from the group's list, keeps the first non-zero rc as the
+ * group's oig_rc, and decrements oig_pending.  When the pending count drops
+ * to zero or below, waiters on oig_waitq are woken after the lock is
+ * released.  Finally drops one group reference via oig_release(). */
+void oig_complete_one(struct obd_io_group *oig,
+ struct oig_callback_context *occ, int rc)
+{
+ unsigned long flags;
+ wait_queue_head_t *wake = NULL;
+ int old_rc;
+
+ spin_lock_irqsave(&oig->oig_lock, flags);
+
+ if (occ != NULL)
+ list_del_init(&occ->occ_oig_item);
+
+ /* only the first error is kept; later ones are dropped */
+ old_rc = oig->oig_rc;
+ if (oig->oig_rc == 0 && rc != 0)
+ oig->oig_rc = rc;
+
+ if (--oig->oig_pending <= 0)
+ wake = &oig->oig_waitq;
+
+ spin_unlock_irqrestore(&oig->oig_lock, flags);
+
+ /* oig_rc and oig_pending are re-read here without the lock, hence
+ * the "(racey)" in the message */
+ CDEBUG(D_CACHE, "oig %p completed, rc %d -> %d via %d, %d now "
+ "pending (racey)\n", oig, old_rc, oig->oig_rc, rc,
+ oig->oig_pending);
+ if (wake)
+ wake_up(wake);
+ /* oig must not be touched after this: it may have been freed */
+ oig_release(oig);
+}
+
+/* Wait condition for oig_wait(): returns 1 once oig_pending is zero or
+ * negative, 0 otherwise.  The count is sampled under oig_lock. */
+static int oig_done(struct obd_io_group *oig)
+{
+        unsigned long irqflags;
+        int finished;
+
+        spin_lock_irqsave(&oig->oig_lock, irqflags);
+        finished = (oig->oig_pending <= 0) ? 1 : 0;
+        spin_unlock_irqrestore(&oig->oig_lock, irqflags);
+
+        return finished;
+}
+
+/* Interrupt callback used by oig_wait(): data is the obd_io_group.  Walks
+ * oig_occ_list under oig_lock and invokes each context's occ_interrupted()
+ * handler on itself. */
+static void interrupted_oig(void *data)
+{
+        struct obd_io_group *oig = data;
+        struct list_head *cur;
+        unsigned long irqflags;
+
+        spin_lock_irqsave(&oig->oig_lock, irqflags);
+        list_for_each(cur, &oig->oig_occ_list) {
+                struct oig_callback_context *ctx;
+
+                ctx = list_entry(cur, struct oig_callback_context,
+                                 occ_oig_item);
+                ctx->occ_interrupted(ctx);
+        }
+        spin_unlock_irqrestore(&oig->oig_lock, irqflags);
+}
+
+/* Block until the group has no pending items (oig_done()) and return the
+ * group's oig_rc.  The first wait uses interrupted_oig() as its interrupt
+ * callback; after an -EINTR the wait is repeated with a zeroed
+ * l_wait_info, because the group must drain before the caller may free
+ * state it still references. */
+int oig_wait(struct obd_io_group *oig)
+{
+        struct l_wait_info lwi = LWI_INTR(interrupted_oig, oig);
+        int rc;
+
+        CDEBUG(D_CACHE, "waiting for oig %p\n", oig);
+
+        for (;;) {
+                rc = l_wait_event(oig->oig_waitq, oig_done(oig), &lwi);
+                LASSERTF(rc == 0 || rc == -EINTR, "rc: %d\n", rc);
+                if (rc != -EINTR)
+                        break;
+
+                /* we can't continue until the oig has emptied and stopped
+                 * referencing state that the caller will free upon return */
+                lwi = (struct l_wait_info){ 0, };
+        }
+
+        LASSERTF(oig->oig_pending == 0,
+                 "exiting oig_wait(oig = %p) with %d pending\n", oig,
+                 oig->oig_pending);
+
+        CDEBUG(D_CACHE, "done waiting on oig %p rc %d\n", oig, oig->oig_rc);
+        return oig->oig_rc;
+}