Whamcloud - gitweb
LU-8130 obd: convert obd_nid_hash to rhashtable
[fs/lustre-release.git] / lustre / include / lustre_export.h
index bb1237c..3ba56cb 100644 (file)
  *
  * You should have received a copy of the GNU General Public License
  * version 2 along with this program; If not, see
- * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
- *
- * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
- * CA 95054 USA or visit www.sun.com if you need additional information or
- * have any questions.
+ * http://www.gnu.org/licenses/gpl-2.0.html
  *
  * GPL HEADER END
  */
@@ -27,7 +23,7 @@
  * Copyright (c) 2002, 2010, Oracle and/or its affiliates. All rights reserved.
  * Use is subject to license terms.
  *
- * Copyright (c) 2011, 2013, Intel Corporation.
+ * Copyright (c) 2011, 2017, Intel Corporation.
  */
 /*
  * This file is part of Lustre, http://www.lustre.org/
  * @{
  */
 
+#include <linux/rhashtable.h>
+#include <linux/workqueue.h>
+
 #include <lprocfs_status.h>
-#include <lustre/lustre_idl.h>
+#include <uapi/linux/lustre/lustre_idl.h>
 #include <lustre_dlm.h>
 
 struct mds_client_data;
@@ -59,7 +58,8 @@ struct mdt_idmap_table;
  * Target-specific export data
  */
 struct tg_export_data {
-       /** Protects led_lcd below */
+       /** Protects ted_lcd, ted_reply_* and
+        * ted_release_* fields below */
        struct mutex            ted_lcd_lock;
        /** Per-client data for each export */
        struct lsd_client_data  *ted_lcd;
@@ -67,6 +67,48 @@ struct tg_export_data {
        loff_t                  ted_lr_off;
        /** Client index in last_rcvd file */
        int                     ted_lr_idx;
+
+       /**
+        * ted_nodemap_lock is used to ensure that the nodemap is not destroyed
+        * between the time that ted_nodemap is checked for NULL, and a
+        * reference is taken. Modifications to ted_nodemap require that the
+        * active_config_lock and the nodemap(s)'s nm_member_list_lock be
+        * taken, as well as ted_nodemap_lock, so the export can be properly
+        * added to or removed from the nodemap's member list. When an export
+        * is added to a nodemap, a reference on that nodemap must be taken.
+        * That reference can be put only after ted_nodemap no longer refers to
+        * it.
+        */
+       spinlock_t              ted_nodemap_lock;
+       struct lu_nodemap       *ted_nodemap;
+       struct list_head        ted_nodemap_member;
+
+       /** last version of nodemap config sent to client */
+       __u64                   ted_nodemap_version;
+
+       /* All reply data fields below are
+        * protected by ted_lcd_lock */
+       /** List of reply data */
+       struct list_head        ted_reply_list;
+       int                     ted_reply_cnt;
+       /** Reply data with highest transno is retained */
+       struct tg_reply_data    *ted_reply_last;
+       /* Statistics */
+       int                     ted_reply_max; /* high water mark */
+       int                     ted_release_xid;
+       int                     ted_release_tag;
+       /* grants */
+       long                    ted_dirty;    /* in bytes */
+       long                    ted_grant;    /* in bytes */
+       long                    ted_pending;  /* bytes just being written */
+       __u8                    ted_pagebits; /* log2 of client page size */
+
+       /**
+        * File Modification Data (FMD) tracking
+        */
+       spinlock_t              ted_fmd_lock; /* protects ted_fmd_list */
+       struct list_head        ted_fmd_list; /* FIDs being modified */
+       int                     ted_fmd_count;/* items in ted_fmd_list */
 };
 
 /**
@@ -77,8 +119,6 @@ struct mdt_export_data {
        /** List of all files opened by client on this MDT */
        struct list_head        med_open_head;
        spinlock_t              med_open_lock; /* med_open_head, mfd_list */
-       struct mutex            med_idmap_mutex;
-       struct lustre_idmap_table *med_idmap;
 };
 
 struct ec_export_data { /* echo client */
@@ -89,18 +129,11 @@ struct ec_export_data { /* echo client */
 /** Filter (oss-side) specific export data */
 struct filter_export_data {
        struct tg_export_data   fed_ted;
-       spinlock_t              fed_lock;       /**< protects fed_mod_list */
        __u64                   fed_lastid_gen;
-       long                    fed_dirty;    /* in bytes */
-       long                    fed_grant;    /* in bytes */
-       struct list_head        fed_mod_list; /* files being modified */
-       long                    fed_pending;  /* bytes just being written */
        /* count of SOFT_SYNC RPCs, which will be reset after
         * ofd_soft_sync_limit number of RPCs, and trigger a sync. */
        atomic_t                fed_soft_sync_count;
-       int                     fed_mod_count;/* items in fed_writing list */
        __u32                   fed_group;
-       __u8                    fed_pagesize; /* log2 of client page size */
 };
 
 struct mgs_export_data {
@@ -156,12 +189,11 @@ struct obd_export {
         * what export they are talking to.
         */
        struct portals_handle   exp_handle;
-       atomic_t                exp_refcount;
        /**
         * Set of counters below is to track where export references are
         * kept. The exp_rpc_count is used for reconnect handling also,
         * the cb_count and locks_count are for debug purposes only for now.
-        * The sum of them should be less than exp_refcount by 3
+        * The sum of them should be less than exp_handle.href by 3
         */
        atomic_t                exp_rpc_count; /* RPC references */
        atomic_t                exp_cb_count; /* Commit callback references */
@@ -176,8 +208,13 @@ struct obd_export {
        struct obd_uuid         exp_client_uuid;
         /** To link all exports on an obd device */
        struct list_head        exp_obd_chain;
-       struct hlist_node       exp_uuid_hash;  /** uuid-export hash*/
-       struct hlist_node       exp_nid_hash;   /** nid-export hash */
+       /** work_struct for destruction of export */
+       struct work_struct      exp_zombie_work;
+       /* Unlinked export list */
+       struct list_head        exp_stale_list;
+       struct rhash_head       exp_uuid_hash;  /** uuid-export hash */
+       struct rhlist_head      exp_nid_hash;   /** nid-export hash */
+       struct hlist_node       exp_gen_hash;   /** last_rcvd clt gen hash */
         /**
          * All exports eligible for ping evictor are linked into a list
          * through this field in "most time since last request on this export"
@@ -195,58 +232,62 @@ struct obd_export {
         struct nid_stat          *exp_nid_stats;
         /** Active connection */
         struct ptlrpc_connection *exp_connection;
-        /** Connection count value from last succesful reconnect rpc */
-        __u32                     exp_conn_cnt;
-        /** Hash list of all ldlm locks granted on this export */
-        cfs_hash_t               *exp_lock_hash;
+       /** Connection count value from last successful reconnect rpc */
+       __u32                     exp_conn_cnt;
+       /** Hash list of all ldlm locks granted on this export */
+       struct cfs_hash          *exp_lock_hash;
        /**
         * Hash list for Posix lock deadlock detection, added with
         * ldlm_lock::l_exp_flock_hash.
         */
-       cfs_hash_t             *exp_flock_hash;
+       struct cfs_hash        *exp_flock_hash;
        struct list_head        exp_outstanding_replies;
        struct list_head        exp_uncommitted_replies;
        spinlock_t              exp_uncommitted_replies_lock;
        /** Last committed transno for this export */
        __u64                   exp_last_committed;
        /** When was last request received */
-       cfs_time_t              exp_last_request_time;
+       time64_t                exp_last_request_time;
        /** On replay all requests waiting for replay are linked here */
        struct list_head        exp_req_replay_queue;
        /**
         * protects exp_flags, exp_outstanding_replies and the change
         * of exp_imp_reverse
         */
-       spinlock_t                exp_lock;
+       spinlock_t              exp_lock;
        /** Compatibility flags for this export are embedded into
         *  exp_connect_data */
-       struct obd_connect_data   exp_connect_data;
-        enum obd_option           exp_flags;
-        unsigned long             exp_failed:1,
-                                  exp_in_recovery:1,
-                                  exp_disconnected:1,
-                                  exp_connecting:1,
-                                  /** VBR: export missed recovery */
-                                  exp_delayed:1,
-                                  /** VBR: failed version checking */
-                                  exp_vbr_failed:1,
-                                  exp_req_replay_needed:1,
-                                  exp_lock_replay_needed:1,
-                                  exp_need_sync:1,
-                                 exp_keep_sync:1,
-                                  exp_flvr_changed:1,
-                                  exp_flvr_adapt:1,
-                                  exp_libclient:1, /* liblustre client? */
-                                 /* if to swap nidtbl entries for 2.2 clients.
-                                  * Only used by the MGS to fix LU-1644. */
-                                 exp_need_mne_swab:1;
-        /* also protected by exp_lock */
-        enum lustre_sec_part      exp_sp_peer;
-        struct sptlrpc_flavor     exp_flvr;             /* current */
-        struct sptlrpc_flavor     exp_flvr_old[2];      /* about-to-expire */
-        cfs_time_t                exp_flvr_expire[2];   /* seconds */
-
-        /** protects exp_hp_rpcs */
+       struct obd_connect_data exp_connect_data;
+       enum obd_option         exp_flags;
+       unsigned long           exp_failed:1,
+                               exp_in_recovery:1,
+                               exp_disconnected:1,
+                               exp_connecting:1,
+                               /** VBR: export missed recovery */
+                               exp_delayed:1,
+                               /** VBR: failed version checking */
+                               exp_vbr_failed:1,
+                               exp_req_replay_needed:1,
+                               exp_lock_replay_needed:1,
+                               exp_need_sync:1,
+                               exp_flvr_changed:1,
+                               exp_flvr_adapt:1,
+                               /* Swap nidtbl entries for 2.2 clients if set.
+                                * Only used by the MGS to fix LU-1644. */
+                               exp_need_mne_swab:1,
+                               /* The export already got final replay ping
+                                * request. */
+                               exp_replay_done:1,
+                               /* local client with recovery disabled */
+                               exp_no_recovery:1,
+                               exp_hashed:1;
+       /* also protected by exp_lock */
+       enum lustre_sec_part    exp_sp_peer;
+       struct sptlrpc_flavor   exp_flvr;               /* current */
+       struct sptlrpc_flavor   exp_flvr_old[2];        /* about-to-expire */
+       time64_t                exp_flvr_expire[2];     /* seconds */
+
+       /** protects exp_hp_rpcs */
        spinlock_t              exp_rpc_lock;
        struct list_head        exp_hp_rpcs;    /* (potential) HP RPCs */
        struct list_head        exp_reg_rpcs;  /* RPC being handled */
@@ -264,7 +305,13 @@ struct obd_export {
                 struct mgs_export_data    eu_mgs_data;
         } u;
 
-       struct nodemap            *exp_nodemap;
+       struct adaptive_timeout    exp_bl_lock_at;
+
+       /** highest XID received by export client that has no
+        * unreceived lower-numbered XID
+        */
+       __u64                   exp_last_xid;
+       long                    *exp_used_slots;
 };
 
 #define exp_target_data u.eu_target_data
@@ -282,6 +329,18 @@ static inline __u64 exp_connect_flags(struct obd_export *exp)
        return *exp_connect_flags_ptr(exp);
 }
 
+static inline __u64 *exp_connect_flags2_ptr(struct obd_export *exp)
+{
+       return &exp->exp_connect_data.ocd_connect_flags2;
+}
+
+static inline __u64 exp_connect_flags2(struct obd_export *exp)
+{
+       if (exp_connect_flags(exp) & OBD_CONNECT_FLAGS2)
+               return *exp_connect_flags2_ptr(exp);
+       return 0;
+}
+
 static inline int exp_max_brw_size(struct obd_export *exp)
 {
        LASSERT(exp != NULL);
@@ -296,13 +355,6 @@ static inline int exp_connect_multibulk(struct obd_export *exp)
        return exp_max_brw_size(exp) > ONE_MB_BRW_SIZE;
 }
 
-static inline int exp_expired(struct obd_export *exp, cfs_duration_t age)
-{
-        LASSERT(exp->exp_delayed);
-        return cfs_time_before(cfs_time_add(exp->exp_last_request_time, age),
-                               cfs_time_current_sec());
-}
-
 static inline int exp_connect_cancelset(struct obd_export *exp)
 {
        LASSERT(exp != NULL);
@@ -315,20 +367,6 @@ static inline int exp_connect_lru_resize(struct obd_export *exp)
        return !!(exp_connect_flags(exp) & OBD_CONNECT_LRU_RESIZE);
 }
 
-static inline int exp_connect_rmtclient(struct obd_export *exp)
-{
-       LASSERT(exp != NULL);
-       return !!(exp_connect_flags(exp) & OBD_CONNECT_RMT_CLIENT);
-}
-
-static inline int client_is_remote(struct obd_export *exp)
-{
-        struct obd_import *imp = class_exp2cliimp(exp);
-
-        return !!(imp->imp_connect_data.ocd_connect_flags &
-                  OBD_CONNECT_RMT_CLIENT);
-}
-
 static inline int exp_connect_vbr(struct obd_export *exp)
 {
        LASSERT(exp != NULL);
@@ -336,12 +374,6 @@ static inline int exp_connect_vbr(struct obd_export *exp)
        return !!(exp_connect_flags(exp) & OBD_CONNECT_VBR);
 }
 
-static inline int exp_connect_som(struct obd_export *exp)
-{
-       LASSERT(exp != NULL);
-       return !!(exp_connect_flags(exp) & OBD_CONNECT_SOM);
-}
-
 static inline int exp_connect_umask(struct obd_export *exp)
 {
        return !!(exp_connect_flags(exp) & OBD_CONNECT_UMASK);
@@ -391,6 +423,13 @@ static inline bool imp_connect_disp_stripe(struct obd_import *imp)
        return ocd->ocd_connect_flags & OBD_CONNECT_DISP_STRIPE;
 }
 
+static inline bool imp_connect_shortio(struct obd_import *imp)
+{
+       struct obd_connect_data *ocd = &imp->imp_connect_data;
+
+       return ocd->ocd_connect_flags & OBD_CONNECT_SHORTIO;
+}
+
 static inline __u64 exp_connect_ibits(struct obd_export *exp)
 {
        struct obd_connect_data *ocd;
@@ -399,14 +438,55 @@ static inline __u64 exp_connect_ibits(struct obd_export *exp)
        return ocd->ocd_ibits_known;
 }
 
+static inline int exp_connect_large_acl(struct obd_export *exp)
+{
+       return !!(exp_connect_flags(exp) & OBD_CONNECT_LARGE_ACL);
+}
+
+static inline int exp_connect_lockahead(struct obd_export *exp)
+{
+       return !!(exp_connect_flags2(exp) & OBD_CONNECT2_LOCKAHEAD);
+}
+
+static inline int exp_connect_overstriping(struct obd_export *exp)
+{
+       return !!(exp_connect_flags2(exp) & OBD_CONNECT2_OVERSTRIPING);
+}
+
+static inline int exp_connect_flr(struct obd_export *exp)
+{
+       return !!(exp_connect_flags2(exp) & OBD_CONNECT2_FLR);
+}
+
+static inline int exp_connect_lock_convert(struct obd_export *exp)
+{
+       return !!(exp_connect_flags2(exp) & OBD_CONNECT2_LOCK_CONVERT);
+}
+
 extern struct obd_export *class_conn2export(struct lustre_handle *conn);
-extern struct obd_device *class_conn2obd(struct lustre_handle *conn);
 
-#define KKUC_CT_DATA_MAGIC     0x092013cea
+static inline int exp_connect_archive_id_array(struct obd_export *exp)
+{
+       return !!(exp_connect_flags2(exp) & OBD_CONNECT2_ARCHIVE_ID_ARRAY);
+}
+
+static inline int exp_connect_sepol(struct obd_export *exp)
+{
+       return !!(exp_connect_flags2(exp) & OBD_CONNECT2_SELINUX_POLICY);
+}
+
+enum {
+       /* archive_ids in array format */
+       KKUC_CT_DATA_ARRAY_MAGIC        = 0x092013cea,
+       /* archive_ids in bitmap format */
+       KKUC_CT_DATA_BITMAP_MAGIC       = 0x082018cea,
+};
+
+
 struct kkuc_ct_data {
        __u32           kcd_magic;
-       struct obd_uuid kcd_uuid;
-       __u32           kcd_archive;
+       __u32           kcd_nr_archives;
+       __u32           kcd_archives[0];
 };
 
 /** @} export */