LU-8066 obd_type: discard obd_type_lock

[fs/lustre-release.git] / lustre / include / obd.h
diff --git a/lustre/include/obd.h b/lustre/include/obd.h

index 0d04870..96c77a0 100644 (file)
--- a/lustre/include/obd.h
+++ b/lustre/include/obd.h
@@ -87,6 +87,8 @@ typedef int (*obd_enqueue_update_f)(void *cookie, int rc);
  struct obd_info {
         /* OBD_STATFS_* flags */
         __u64                   oi_flags;
+       struct obd_device      *oi_obd;
+       struct lu_tgt_desc     *oi_tgt;
          /* statfs data specific for every OSC, if needed at all. */
          struct obd_statfs      *oi_osfs;
          /* An update callback which is called to update some data on upper
@@ -97,21 +99,18 @@ struct obd_info {
  };
  
  struct obd_type {
-       struct list_head         typ_chain;
         struct obd_ops          *typ_dt_ops;
         struct md_ops           *typ_md_ops;
         struct proc_dir_entry   *typ_procroot;
-       struct proc_dir_entry   *typ_procsym;
         struct dentry           *typ_debugfs_entry;
  #ifdef HAVE_SERVER_SUPPORT
         bool                     typ_sym_filter;
  #endif
-       char                    *typ_name;
-       int                      typ_refcnt;
+       atomic_t                 typ_refcnt;
         struct lu_device_type   *typ_lu;
-       spinlock_t               obd_type_lock;
-       struct kobject          *typ_kobj;
+       struct kobject           typ_kobj;
  };
+#define typ_name typ_kobj.name
  
  struct brw_page {
         u64              off;
@@ -151,7 +150,15 @@ enum {
   * vmalloc(). Excessive use of vmalloc() may cause spinlock contention
   * on the MDS.
   */
-#define OBD_MAX_DEFAULT_EA_SIZE                4096
+#define OBD_MAX_DEFAULT_EA_SIZE        4096
+
+/*
+ * Lustre can handle larger xattrs internally, but we must respect the Linux
+ * VFS limitation or tools like tar cannot interact with Lustre volumes
+ * correctly.
+ */
+#define OBD_MAX_EA_SIZE                XATTR_SIZE_MAX
+
  
  enum obd_cl_sem_lock_class {
         OBD_CLI_SEM_NORMAL,
@@ -333,6 +340,8 @@ struct client_obd {
          __u32                    cl_supp_cksum_types;
          /* checksum algorithm to be used */
         enum cksum_types         cl_cksum_type;
+       /* preferred checksum algorithm to be used */
+       enum cksum_types         cl_preferred_cksum_type;
  
          /* also protected by the poorly named _loi_list_lock lock above */
          struct osc_async_rc      cl_ar;
@@ -369,29 +378,12 @@ struct echo_client_obd {
         __u64                   ec_unique;
  };
  
-/* Generic subset of OSTs */
-struct ost_pool {
-        __u32              *op_array;      /* array of index of
-                                                   lov_obd->lov_tgts */
-        unsigned int        op_count;      /* number of OSTs in the array */
-        unsigned int        op_size;       /* allocated size of lp_array */
-       struct rw_semaphore op_rw_sem;     /* to protect ost_pool use */
-};
-
  /* allow statfs data caching for 1 second */
  #define OBD_STATFS_CACHE_SECONDS 1
+/* arbitrary maximum: anything larger is useless; also catches bogus input */
+#define OBD_STATFS_CACHE_MAX_AGE 3600 /* seconds */
  
-struct lov_tgt_desc {
-       struct list_head    ltd_kill;
-        struct obd_uuid     ltd_uuid;
-        struct obd_device  *ltd_obd;
-        struct obd_export  *ltd_exp;
-        __u32               ltd_gen;
-        __u32               ltd_index;   /* index in lov_obd->tgts */
-        unsigned long       ltd_active:1,/* is this target up for requests */
-                            ltd_activate:1,/* should  target be activated */
-                            ltd_reap:1;  /* should this target be deleted */
-};
+#define lov_tgt_desc lu_tgt_desc
  
  struct lov_md_tgt_desc {
         struct obd_device *lmtd_mdc;
@@ -401,7 +393,7 @@ struct lov_md_tgt_desc {
  struct lov_obd {
         struct lov_desc         desc;
         struct lov_tgt_desc   **lov_tgts;               /* sparse array */
-       struct ost_pool         lov_packed;             /* all OSTs in a packed
+       struct lu_tgt_pool      lov_packed;             /* all OSTs in a packed
                                                            array */
         struct mutex            lov_lock;
         struct obd_connect_data lov_ocd;
@@ -426,34 +418,29 @@ struct lov_obd {
         struct kobject          *lov_tgts_kobj;
  };
  
-struct lmv_tgt_desc {
-       struct obd_uuid         ltd_uuid;
-       struct obd_device       *ltd_obd;
-       struct obd_export       *ltd_exp;
-       __u32                   ltd_idx;
-       struct mutex            ltd_fid_mutex;
-       unsigned long           ltd_active:1; /* target up for requests */
-};
+#define lmv_tgt_desc lu_tgt_desc
  
  struct lmv_obd {
         struct lu_client_fld    lmv_fld;
         spinlock_t              lmv_lock;
-       struct lmv_desc         desc;
  
-       struct mutex            lmv_init_mutex;
         int                     connected;
         int                     max_easize;
         int                     max_def_easize;
         u32                     lmv_statfs_start;
  
-       u32                     tgts_size; /* size of tgts array */
-       struct lmv_tgt_desc     **tgts;
+       struct lu_tgt_descs     lmv_mdt_descs;
  
         struct obd_connect_data conn_data;
         struct kobject          *lmv_tgts_kobj;
         void                    *lmv_cache;
+
+       __u32                   lmv_qos_rr_index;
  };
  
+#define lmv_mdt_count  lmv_mdt_descs.ltd_lmv_desc.ld_tgt_count
+#define lmv_qos                lmv_mdt_descs.ltd_qos
+
  /* Minimum sector size is 512 */
  #define MAX_GUARD_NUMBER (PAGE_SIZE / 512)
  
@@ -468,6 +455,8 @@ struct niobuf_local {
         __u16           lnb_guards[MAX_GUARD_NUMBER];
         __u16           lnb_guard_rpc:1;
         __u16           lnb_guard_disk:1;
+       /* separate unlock for read path to allow shared access */
+       __u16           lnb_locked:1;
  };
  
  struct tgt_thread_big_cache {
@@ -600,7 +589,6 @@ struct obd_llog_group {
         struct llog_ctxt   *olg_ctxts[LLOG_MAX_CTXTS];
         wait_queue_head_t  olg_waitq;
         spinlock_t         olg_lock;
-       struct mutex       olg_cat_processing;
  };
  
  /* corresponds to one of the obd's */
@@ -676,7 +664,7 @@ struct obd_device {
         struct list_head        obd_exports_timed;
         time64_t                obd_eviction_timer;     /* for ping evictor */
  
-       int                     obd_max_recoverable_clients;
+       atomic_t                obd_max_recoverable_clients;
         atomic_t                obd_connected_clients;
         int                     obd_stale_clients;
          /* this lock protects all recovery list_heads, timer and
@@ -692,8 +680,11 @@ struct obd_device {
         time64_t                obd_recovery_start;
         /* seconds, for lprocfs_status */
         time64_t                obd_recovery_end;
-       time64_t                obd_recovery_time_hard;
-       time64_t                obd_recovery_timeout;
+       /* Timeouts use time_t rather than time64_t so that they can be
+        * told apart from time stamps.
+        */
+       time_t                  obd_recovery_time_hard;
+       time_t                  obd_recovery_timeout;
         int                     obd_recovery_ir_factor;
  
         /* new recovery stuff from CMD2 */
@@ -830,6 +821,14 @@ enum md_cli_flags {
         CLI_MIGRATE     = 1 << 4,
  };
  
+enum md_op_code {
+       LUSTRE_OPC_MKDIR        = 0,
+       LUSTRE_OPC_SYMLINK      = 1,
+       LUSTRE_OPC_MKNOD        = 2,
+       LUSTRE_OPC_CREATE       = 3,
+       LUSTRE_OPC_ANY          = 5,
+};
+
  /**
   * GETXATTR is not included as only a couple of fields in the reply body
   * is filled, but not FID which is needed for common intent handling in
@@ -847,6 +846,7 @@ struct md_op_data {
         struct lu_fid           op_fid4; /* to the operation locks. */
         u32                     op_mds;  /* what mds server open will go to */
         __u32                   op_mode;
+       enum md_op_code         op_code;
         struct lustre_handle    op_open_handle;
         s64                     op_mod_time;
         const char              *op_name;
@@ -855,6 +855,7 @@ struct md_op_data {
         struct rw_semaphore     *op_mea2_sem;
         struct lmv_stripe_md    *op_mea1;
         struct lmv_stripe_md    *op_mea2;
+       struct lmv_stripe_md    *op_default_mea1;       /* default LMV */
         __u32                   op_suppgids[2];
         __u32                   op_fsuid;
         __u32                   op_fsgid;
@@ -888,9 +889,6 @@ struct md_op_data {
         void                   *op_file_secctx;
         __u32                   op_file_secctx_size;
  
-       /* default stripe offset */
-       __u32                   op_default_stripe_offset;
-
         __u32                   op_projid;
  
         /* Used by readdir */
@@ -909,6 +907,8 @@ struct md_op_data {
         bool                    op_post_migrate;
         /* used to access dir with bash hash */
         __u32                   op_stripe_index;
+       /* Archive ID for PCC attach */
+       __u32                   op_archive_id;
  };
  
  struct md_callback {
@@ -1029,8 +1029,12 @@ struct obd_ops {
  struct lustre_md {
         struct mdt_body         *body;
         struct lu_buf            layout;
-       struct lmv_stripe_md    *lmv;
-#ifdef CONFIG_FS_POSIX_ACL
+       union {
+               struct lmv_stripe_md    *lmv;
+               struct lmv_foreign_md   *lfm;
+       };
+       struct lmv_stripe_md    *default_lmv;
+#ifdef CONFIG_LUSTRE_FS_POSIX_ACL
         struct posix_acl        *posix_acl;
  #endif
  };
@@ -1155,6 +1159,8 @@ struct md_ops {
                                   struct lu_fid *fid);
         int (*m_unpackmd)(struct obd_export *exp, struct lmv_stripe_md **plsm,
                           const union lmv_mds_md *lmv, size_t lmv_size);
+       int (*m_rmfid)(struct obd_export *exp, struct fid_array *fa, int *rcs,
+                      struct ptlrpc_request_set *set);
  };
  
  static inline struct md_open_data *obd_mod_alloc(void)
@@ -1269,8 +1275,8 @@ static inline void client_adjust_max_dirty(struct client_obd *cli)
                         cli->cl_dirty_max_pages = dirty_max;
         }
  
-       if (cli->cl_dirty_max_pages > totalram_pages / 8)
-               cli->cl_dirty_max_pages = totalram_pages / 8;
+       if (cli->cl_dirty_max_pages > cfs_totalram_pages() / 8)
+               cli->cl_dirty_max_pages = cfs_totalram_pages() / 8;
  
         /* This value is exported to userspace through the max_dirty_mb
          * parameter.  So we round up the number of pages to make it a round