Whamcloud - gitweb
LU-1182 quota: quota accounting library
[fs/lustre-release.git] / lustre / obdclass / dt_object.c
index c429bd2..052cb4e 100644 (file)
@@ -1,6 +1,4 @@
-/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
- * vim:expandtab:shiftwidth=8:tabstop=8:
- *
+/*
  * GPL HEADER START
  *
  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
  * GPL HEADER END
  */
 /*
- * Copyright  2008 Sun Microsystems, Inc. All rights reserved
+ * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
  * Use is subject to license terms.
+ *
+ * Copyright (c) 2011, 2012, Whamcloud, Inc.
  */
 /*
  * This file is part of Lustre, http://www.lustre.org/
@@ -42,9 +42,6 @@
  */
 
 #define DEBUG_SUBSYSTEM S_CLASS
-#ifndef EXPORT_SYMTAB
-# define EXPORT_SYMTAB
-#endif
 
 #include <obd.h>
 #include <dt_object.h>
 /* fid_be_to_cpu() */
 #include <lustre_fid.h>
 
+#include <lquota.h>
+
+struct dt_find_hint {
+        struct lu_fid        *dfh_fid;
+        struct dt_device     *dfh_dt;
+        struct dt_object     *dfh_o;
+};
+
+struct dt_thread_info {
+        char                    dti_buf[DT_MAX_PATH];
+        struct dt_find_hint     dti_dfh;
+};
+
+/* context key constructor/destructor: dt_global_key_init, dt_global_key_fini */
+LU_KEY_INIT(dt_global, struct dt_thread_info);
+LU_KEY_FINI(dt_global, struct dt_thread_info);
+
+static struct lu_context_key dt_key = {
+        .lct_tags = LCT_MD_THREAD | LCT_DT_THREAD | LCT_MG_THREAD | LCT_LOCAL,
+        .lct_init = dt_global_key_init,
+        .lct_fini = dt_global_key_fini
+};
+
 /* no lock is necessary to protect the list, because call-backs
  * are added during system startup. Please refer to "struct dt_device".
  */
 void dt_txn_callback_add(struct dt_device *dev, struct dt_txn_callback *cb)
 {
-        list_add(&cb->dtc_linkage, &dev->dd_txn_callbacks);
+        cfs_list_add(&cb->dtc_linkage, &dev->dd_txn_callbacks);
 }
 EXPORT_SYMBOL(dt_txn_callback_add);
 
 void dt_txn_callback_del(struct dt_device *dev, struct dt_txn_callback *cb)
 {
-        list_del_init(&cb->dtc_linkage);
+        cfs_list_del_init(&cb->dtc_linkage);
 }
 EXPORT_SYMBOL(dt_txn_callback_del);
 
 int dt_txn_hook_start(const struct lu_env *env,
-                      struct dt_device *dev, struct txn_param *param)
+                      struct dt_device *dev, struct thandle *th)
 {
-        int result;
+        int rc = 0;
         struct dt_txn_callback *cb;
 
-        result = 0;
-        list_for_each_entry(cb, &dev->dd_txn_callbacks, dtc_linkage) {
-                if (cb->dtc_txn_start == NULL)
+        if (th->th_local)
+                return 0;
+
+        cfs_list_for_each_entry(cb, &dev->dd_txn_callbacks, dtc_linkage) {
+                if (cb->dtc_txn_start == NULL ||
+                    !(cb->dtc_tag & env->le_ctx.lc_tags))
                         continue;
-                result = cb->dtc_txn_start(env, param, cb->dtc_cookie);
-                if (result < 0)
+                rc = cb->dtc_txn_start(env, th, cb->dtc_cookie);
+                if (rc < 0)
                         break;
         }
-        return result;
+        return rc;
 }
 EXPORT_SYMBOL(dt_txn_hook_start);
 
@@ -89,35 +112,35 @@ int dt_txn_hook_stop(const struct lu_env *env, struct thandle *txn)
 {
         struct dt_device       *dev = txn->th_dev;
         struct dt_txn_callback *cb;
-        int                     result;
+        int                     rc = 0;
+
+        if (txn->th_local)
+                return 0;
 
-        result = 0;
-        list_for_each_entry(cb, &dev->dd_txn_callbacks, dtc_linkage) {
-                if (cb->dtc_txn_stop == NULL)
+        cfs_list_for_each_entry(cb, &dev->dd_txn_callbacks, dtc_linkage) {
+                if (cb->dtc_txn_stop == NULL ||
+                    !(cb->dtc_tag & env->le_ctx.lc_tags))
                         continue;
-                result = cb->dtc_txn_stop(env, txn, cb->dtc_cookie);
-                if (result < 0)
+                rc = cb->dtc_txn_stop(env, txn, cb->dtc_cookie);
+                if (rc < 0)
                         break;
         }
-        return result;
+        return rc;
 }
 EXPORT_SYMBOL(dt_txn_hook_stop);
 
-int dt_txn_hook_commit(const struct lu_env *env, struct thandle *txn)
+void dt_txn_hook_commit(struct thandle *txn)
 {
-        struct dt_device       *dev = txn->th_dev;
         struct dt_txn_callback *cb;
-        int                     result;
 
-        result = 0;
-        list_for_each_entry(cb, &dev->dd_txn_callbacks, dtc_linkage) {
-                if (cb->dtc_txn_commit == NULL)
-                        continue;
-                result = cb->dtc_txn_commit(env, txn, cb->dtc_cookie);
-                if (result < 0)
-                        break;
+        if (txn->th_local)
+                return;
+
+        cfs_list_for_each_entry(cb, &txn->th_dev->dd_txn_callbacks,
+                                dtc_linkage) {
+                if (cb->dtc_txn_commit)
+                        cb->dtc_txn_commit(txn, cb->dtc_cookie);
         }
-        return result;
 }
 EXPORT_SYMBOL(dt_txn_hook_commit);
 
@@ -157,72 +180,404 @@ int dt_try_as_dir(const struct lu_env *env, struct dt_object *obj)
 }
 EXPORT_SYMBOL(dt_try_as_dir);
 
-extern struct lu_context_key lu_global_key;
-
-static int dt_lookup(const struct lu_env *env, struct dt_object *dir,
-                     const char *name, struct lu_fid *fid)
+enum dt_format_type dt_mode_to_dft(__u32 mode)
 {
-        struct lu_fid_pack  *pack = lu_context_key_get(&env->le_ctx,
-                                                       &lu_global_key);
-        struct dt_rec       *rec = (struct dt_rec *)pack;
-        const struct dt_key *key = (const struct dt_key *)name;
-        int result;
+        enum dt_format_type result;
 
-        if (dt_try_as_dir(env, dir)) {
-                result = dir->do_index_ops->dio_lookup(env, dir, rec, key,
-                                                       BYPASS_CAPA);
-                if (result == 0)
-                        result = fid_unpack(pack, fid);
-        } else
-                result = -ENOTDIR;
+        switch (mode & S_IFMT) {
+        case S_IFDIR:
+                result = DFT_DIR;
+                break;
+        case S_IFREG:
+                result = DFT_REGULAR;
+                break;
+        case S_IFLNK:
+                result = DFT_SYM;
+                break;
+        case S_IFCHR:
+        case S_IFBLK:
+        case S_IFIFO:
+        case S_IFSOCK:
+                result = DFT_NODE;
+                break;
+        default:
+                LBUG();
+                break;
+        }
         return result;
 }
+EXPORT_SYMBOL(dt_mode_to_dft);
+
+/**
+ * Look up the fid of the object named \a name in directory \a dir.
+ */
 
-static struct dt_object *dt_locate(const struct lu_env *env,
-                                   struct dt_device *dev,
-                                   const struct lu_fid *fid)
+int dt_lookup_dir(const struct lu_env *env, struct dt_object *dir,
+                  const char *name, struct lu_fid *fid)
+{
+        if (dt_try_as_dir(env, dir))
+                return dt_lookup(env, dir, (struct dt_rec *)fid,
+                                 (const struct dt_key *)name, BYPASS_CAPA);
+        return -ENOTDIR;
+}
+EXPORT_SYMBOL(dt_lookup_dir);
+/**
+ * Get the object for the given \a fid.
+ */
+struct dt_object *dt_locate(const struct lu_env *env,
+                            struct dt_device *dev,
+                            const struct lu_fid *fid)
 {
         struct lu_object *obj;
         struct dt_object *dt;
 
-        obj = lu_object_find(env, dev->dd_lu_dev.ld_site, fid);
+        obj = lu_object_find(env, &dev->dd_lu_dev, fid, NULL);
         if (!IS_ERR(obj)) {
                 obj = lu_object_locate(obj->lo_header, dev->dd_lu_dev.ld_type);
                 LASSERT(obj != NULL);
                 dt = container_of(obj, struct dt_object, do_lu);
         } else
-                dt = (void *)obj;
+                dt = (struct dt_object *)obj;
         return dt;
 }
+EXPORT_SYMBOL(dt_locate);
 
-struct dt_object *dt_store_open(const struct lu_env *env,
-                                struct dt_device *dt, const char *name,
-                                struct lu_fid *fid)
+/**
+ * Find an object named \a entry in the given \a dfh->dfh_o directory.
+ */
+static int dt_find_entry(const struct lu_env *env, const char *entry, void *data)
 {
+        struct dt_find_hint  *dfh = data;
+        struct dt_device     *dt = dfh->dfh_dt;
+        struct lu_fid        *fid = dfh->dfh_fid;
+        struct dt_object     *obj = dfh->dfh_o;
+        int                   result;
+
+        result = dt_lookup_dir(env, obj, entry, fid);
+        lu_object_put(env, &obj->do_lu);
+        if (result == 0) {
+                obj = dt_locate(env, dt, fid);
+                if (IS_ERR(obj))
+                        result = PTR_ERR(obj);
+        }
+        dfh->dfh_o = obj;
+        return result;
+}
+
+/**
+ * Generic path-name parser. Splits \a path on '/' and feeds each non-empty
+ * component to \a entry_func, stopping at the first non-zero return.
+ */
+int dt_path_parser(const struct lu_env *env,
+                   char *path, dt_entry_func_t entry_func,
+                   void *data)
+{
+        char *e;
+        int rc = 0;
+
+        while (1) {
+                e = strsep(&path, "/");
+                if (e == NULL)
+                        break;
+
+                if (e[0] == 0) {
+                        if (!path || path[0] == '\0')
+                                break;
+                        continue;
+                }
+                rc = entry_func(env, e, data);
+                if (rc)
+                        break;
+        }
+
+        return rc;
+}
+
+static struct dt_object *dt_store_resolve(const struct lu_env *env,
+                                          struct dt_device *dt,
+                                          const char *path,
+                                          struct lu_fid *fid)
+{
+        struct dt_thread_info *info = lu_context_key_get(&env->le_ctx,
+                                                         &dt_key);
+        struct dt_find_hint *dfh = &info->dti_dfh;
+        struct dt_object     *obj;
+        char *local = info->dti_buf;
         int result;
 
-        struct dt_object *root;
-        struct dt_object *child;
+        dfh->dfh_dt = dt;
+        dfh->dfh_fid = fid;
+
+        strncpy(local, path, DT_MAX_PATH);
+        local[DT_MAX_PATH - 1] = '\0';
 
         result = dt->dd_ops->dt_root_get(env, dt, fid);
         if (result == 0) {
-                root = dt_locate(env, dt, fid);
-                if (!IS_ERR(root)) {
-                        result = dt_lookup(env, root, name, fid);
-                        if (result == 0)
-                                child = dt_locate(env, dt, fid);
+                obj = dt_locate(env, dt, fid);
+                if (!IS_ERR(obj)) {
+                        dfh->dfh_o = obj;
+                        result = dt_path_parser(env, local, dt_find_entry, dfh);
+                        if (result != 0)
+                                obj = ERR_PTR(result);
                         else
-                                child = ERR_PTR(result);
-                        lu_object_put(env, &root->do_lu);
-                } else {
-                        CERROR("No root\n");
-                        child = (void *)root;
+                                obj = dfh->dfh_o;
                 }
-        } else
-                child = ERR_PTR(result);
-        return child;
+        } else {
+                obj = ERR_PTR(result);
+        }
+        return obj;
+}
+
+static struct dt_object *dt_reg_open(const struct lu_env *env,
+                                     struct dt_device *dt,
+                                     struct dt_object *p,
+                                     const char *name,
+                                     struct lu_fid *fid)
+{
+        struct dt_object *o;
+        int result;
+
+        result = dt_lookup_dir(env, p, name, fid);
+        if (result == 0){
+                o = dt_locate(env, dt, fid);
+        }
+        else
+                o = ERR_PTR(result);
+
+        return o;
+}
+
+/**
+ * Open dt object named \a filename from \a dirname directory.
+ *      \param  dt      dt device
+ *      \param  fid     on success, object fid is stored in *fid
+ */
+struct dt_object *dt_store_open(const struct lu_env *env,
+                                struct dt_device *dt,
+                                const char *dirname,
+                                const char *filename,
+                                struct lu_fid *fid)
+{
+        struct dt_object *file;
+        struct dt_object *dir;
+
+        dir = dt_store_resolve(env, dt, dirname, fid);
+        if (!IS_ERR(dir)) {
+                file = dt_reg_open(env, dt, dir,
+                                   filename, fid);
+                lu_object_put(env, &dir->do_lu);
+        } else {
+                file = dir;
+        }
+        return file;
 }
 EXPORT_SYMBOL(dt_store_open);
 
+struct dt_object *dt_find_or_create(const struct lu_env *env,
+                                    struct dt_device *dt,
+                                    const struct lu_fid *fid,
+                                    struct dt_object_format *dof,
+                                    struct lu_attr *at)
+{
+        struct dt_object *dto;
+        struct thandle *th;
+        int rc;
+
+        ENTRY;
+
+        dto = dt_locate(env, dt, fid);
+        if (IS_ERR(dto))
+                RETURN(dto);
+
+        LASSERT(dto != NULL);
+        if (dt_object_exists(dto))
+                RETURN(dto);
+
+        th = dt_trans_create(env, dt);
+        if (IS_ERR(th))
+                GOTO(out, rc = PTR_ERR(th));
+
+        rc = dt_declare_create(env, dto, at, NULL, dof, th);
+        if (rc)
+                GOTO(trans_stop, rc);
+
+        rc = dt_trans_start_local(env, dt, th);
+        if (rc)
+                GOTO(trans_stop, rc);
+
+        dt_write_lock(env, dto, 0);
+        if (dt_object_exists(dto))
+                GOTO(unlock, rc = 0);
+
+        CDEBUG(D_OTHER, "create new object "DFID"\n", PFID(fid));
+
+        rc = dt_create(env, dto, at, NULL, dof, th);
+        if (rc)
+                GOTO(unlock, rc);
+        LASSERT(dt_object_exists(dto));
+unlock:
+        dt_write_unlock(env, dto);
+trans_stop:
+        dt_trans_stop(env, dt, th);
+out:
+        if (rc) {
+                lu_object_put(env, &dto->do_lu);
+                RETURN(ERR_PTR(rc));
+        }
+        RETURN(dto);
+}
+EXPORT_SYMBOL(dt_find_or_create);
+
+/* dt class init function. */
+int dt_global_init(void)
+{
+        int result;
+
+        LU_CONTEXT_KEY_INIT(&dt_key);
+        result = lu_context_key_register(&dt_key);
+        return result;
+}
+
+void dt_global_fini(void)
+{
+        lu_context_key_degister(&dt_key);
+}
+
+/**
+ * Generic read helper. A short read is not turned into an error here.
+ *
+ * \param env  lustre environment
+ * \param dt   object to be read
+ * \param buf  lu_buf to be filled, with buffer pointer and length
+ * \param pos position to start reading, updated as data is read
+ *
+ * \retval real size of data read
+ * \retval -ve errno on failure
+ */
+int dt_read(const struct lu_env *env, struct dt_object *dt,
+            struct lu_buf *buf, loff_t *pos)
+{
+        LASSERTF(dt != NULL, "dt is NULL when we want to read record\n");
+        return dt->do_body_ops->dbo_read(env, dt, buf, pos, BYPASS_CAPA);
+}
+EXPORT_SYMBOL(dt_read);
+
+/**
+ * Read structures of fixed size from storage.  Unlike dt_read(), using
+ * dt_record_read() will return an error for partial reads.
+ *
+ * \param env  lustre environment
+ * \param dt   object to be read
+ * \param buf  lu_buf to be filled, with buffer pointer and length
+ * \param pos position to start reading, updated as data is read
+ *
+ * \retval 0 on successfully reading full buffer
+ * \retval -EFAULT on short read
+ * \retval -ve errno on failure
+ */
+int dt_record_read(const struct lu_env *env, struct dt_object *dt,
+                   struct lu_buf *buf, loff_t *pos)
+{
+        int rc;
+
+        LASSERTF(dt != NULL, "dt is NULL when we want to read record\n");
+
+        rc = dt->do_body_ops->dbo_read(env, dt, buf, pos, BYPASS_CAPA);
+
+        if (rc == buf->lb_len)
+                rc = 0;
+        else if (rc >= 0)
+                rc = -EFAULT;
+        return rc;
+}
+EXPORT_SYMBOL(dt_record_read);
+
+int dt_record_write(const struct lu_env *env, struct dt_object *dt,
+                    const struct lu_buf *buf, loff_t *pos, struct thandle *th)
+{
+        int rc;
+
+        LASSERTF(dt != NULL, "dt is NULL when we want to write record\n");
+        LASSERT(th != NULL);
+        LASSERT(dt->do_body_ops);
+        LASSERT(dt->do_body_ops->dbo_write);
+        rc = dt->do_body_ops->dbo_write(env, dt, buf, pos, th, BYPASS_CAPA, 1);
+        if (rc == buf->lb_len)
+                rc = 0;
+        else if (rc >= 0)
+                rc = -EFAULT;
+        return rc;
+}
+EXPORT_SYMBOL(dt_record_write);
+
+int dt_declare_version_set(const struct lu_env *env, struct dt_object *o,
+                           struct thandle *th)
+{
+        struct lu_buf vbuf;
+        char *xname = XATTR_NAME_VERSION;
+
+        LASSERT(o);
+        vbuf.lb_buf = NULL;
+        vbuf.lb_len = sizeof(dt_obj_version_t);
+        return dt_declare_xattr_set(env, o, &vbuf, xname, 0, th);
+
+}
+EXPORT_SYMBOL(dt_declare_version_set);
+
+void dt_version_set(const struct lu_env *env, struct dt_object *o,
+                    dt_obj_version_t version, struct thandle *th)
+{
+        struct lu_buf vbuf;
+        char *xname = XATTR_NAME_VERSION;
+        int rc;
+
+        LASSERT(o);
+        vbuf.lb_buf = &version;
+        vbuf.lb_len = sizeof(version);
+
+        rc = dt_xattr_set(env, o, &vbuf, xname, 0, th, BYPASS_CAPA);
+        if (rc < 0)
+                CDEBUG(D_INODE, "Can't set version, rc %d\n", rc);
+        return;
+}
+EXPORT_SYMBOL(dt_version_set);
+
+dt_obj_version_t dt_version_get(const struct lu_env *env, struct dt_object *o)
+{
+        struct lu_buf vbuf;
+        char *xname = XATTR_NAME_VERSION;
+        dt_obj_version_t version;
+        int rc;
+
+        LASSERT(o);
+        vbuf.lb_buf = &version;
+        vbuf.lb_len = sizeof(version);
+        rc = dt_xattr_get(env, o, &vbuf, xname, BYPASS_CAPA);
+        if (rc != sizeof(version)) {
+                CDEBUG(D_INODE, "Can't get version, rc %d\n", rc);
+                version = 0;
+        }
+        return version;
+}
+EXPORT_SYMBOL(dt_version_get);
+
+/* list of all supported index types */
+
+/* directories */
 const struct dt_index_features dt_directory_features;
 EXPORT_SYMBOL(dt_directory_features);
+
+/* scrub iterator */
+const struct dt_index_features dt_otable_features;
+EXPORT_SYMBOL(dt_otable_features);
+
+/* accounting indexes */
+const struct dt_index_features dt_acct_features = {
+       .dif_flags              = DT_IND_UPDATE,
+       .dif_keysize_min        = sizeof(__u64), /* 64-bit uid/gid */
+       .dif_keysize_max        = sizeof(__u64), /* 64-bit uid/gid */
+       .dif_recsize_min        = sizeof(struct acct_rec), /* 32 bytes */
+       .dif_recsize_max        = sizeof(struct acct_rec), /* 32 bytes */
+       .dif_ptrsize            = 4
+};
+EXPORT_SYMBOL(dt_acct_features);