LU-7543 obd: reserve connection flag OBD_CONNECT_SUBTREE

[fs/lustre-release.git] / lustre / include / lustre / lustre_idl.h
diff --git a/lustre/include/lustre/lustre_idl.h b/lustre/include/lustre/lustre_idl.h

index d758c8c..538bf76 100644 (file)
--- a/lustre/include/lustre/lustre_idl.h
+++ b/lustre/include/lustre/lustre_idl.h
@@ -27,7 +27,7 @@
   * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
   * Use is subject to license terms.
   *
- * Copyright (c) 2011, 2014, Intel Corporation.
+ * Copyright (c) 2011, 2015, Intel Corporation.
   */
  /*
   * This file is part of Lustre, http://www.lustre.org/
@@ -91,7 +91,7 @@
  #ifndef _LUSTRE_IDL_H_
  #define _LUSTRE_IDL_H_
  
-#include <libcfs/libcfs.h> /* for LPUX64, etc */
+#include <libcfs/libcfs.h>
  #include <lnet/types.h>
  #include <lustre/lustre_user.h> /* Defn's shared with user-space. */
  #include <lustre/lustre_errno.h>
@@ -186,113 +186,6 @@ struct lu_seq_range_array {
  
  #define LU_SEQ_RANGE_MASK      0x3
  
-static inline unsigned fld_range_type(const struct lu_seq_range *range)
-{
-       return range->lsr_flags & LU_SEQ_RANGE_MASK;
-}
-
-static inline bool fld_range_is_ost(const struct lu_seq_range *range)
-{
-       return fld_range_type(range) == LU_SEQ_RANGE_OST;
-}
-
-static inline bool fld_range_is_mdt(const struct lu_seq_range *range)
-{
-       return fld_range_type(range) == LU_SEQ_RANGE_MDT;
-}
-
-/**
- * This all range is only being used when fld client sends fld query request,
- * but it does not know whether the seq is MDT or OST, so it will send req
- * with ALL type, which means either seq type gotten from lookup can be
- * expected.
- */
-static inline unsigned fld_range_is_any(const struct lu_seq_range *range)
-{
-       return fld_range_type(range) == LU_SEQ_RANGE_ANY;
-}
-
-static inline void fld_range_set_type(struct lu_seq_range *range,
-                                     unsigned flags)
-{
-       range->lsr_flags |= flags;
-}
-
-static inline void fld_range_set_mdt(struct lu_seq_range *range)
-{
-       fld_range_set_type(range, LU_SEQ_RANGE_MDT);
-}
-
-static inline void fld_range_set_ost(struct lu_seq_range *range)
-{
-       fld_range_set_type(range, LU_SEQ_RANGE_OST);
-}
-
-static inline void fld_range_set_any(struct lu_seq_range *range)
-{
-       fld_range_set_type(range, LU_SEQ_RANGE_ANY);
-}
-
-/**
- * returns  width of given range \a r
- */
-
-static inline __u64 range_space(const struct lu_seq_range *range)
-{
-       return range->lsr_end - range->lsr_start;
-}
-
-/**
- * initialize range to zero
- */
-
-static inline void range_init(struct lu_seq_range *range)
-{
-       memset(range, 0, sizeof(*range));
-}
-
-/**
- * check if given seq id \a s is within given range \a r
- */
-
-static inline bool range_within(const struct lu_seq_range *range,
-                               __u64 s)
-{
-       return s >= range->lsr_start && s < range->lsr_end;
-}
-
-static inline bool range_is_sane(const struct lu_seq_range *range)
-{
-       return range->lsr_end >= range->lsr_start;
-}
-
-static inline bool range_is_zero(const struct lu_seq_range *range)
-{
-       return range->lsr_start == 0 && range->lsr_end == 0;
-}
-
-static inline bool range_is_exhausted(const struct lu_seq_range *range)
-{
-       return range_space(range) == 0;
-}
-
-/* return 0 if two range have the same location */
-static inline int range_compare_loc(const struct lu_seq_range *r1,
-                                    const struct lu_seq_range *r2)
-{
-        return r1->lsr_index != r2->lsr_index ||
-               r1->lsr_flags != r2->lsr_flags;
-}
-
-#define DRANGE "[%#16.16"LPF64"x-%#16.16"LPF64"x):%x:%s"
-
-#define PRANGE(range)          \
-       (range)->lsr_start,     \
-       (range)->lsr_end,       \
-       (range)->lsr_index,     \
-       fld_range_is_mdt(range) ? "mdt" : "ost"
-
-
  /** \defgroup lu_fid lu_fid
   * @{ */
  
@@ -401,8 +294,8 @@ enum fid_seq {
         FID_SEQ_OST_MDT0        = 0,
         FID_SEQ_LLOG            = 1, /* unnamed llogs */
         FID_SEQ_ECHO            = 2,
-       FID_SEQ_OST_MDT1        = 3,
-       FID_SEQ_OST_MAX         = 9, /* Max MDT count before OST_on_FID */
+       FID_SEQ_UNUSED_START    = 3,
+       FID_SEQ_UNUSED_END      = 9,
         FID_SEQ_LLOG_NAME       = 10, /* named llogs */
         FID_SEQ_RSVD            = 11,
         FID_SEQ_IGIF            = 12,
@@ -426,6 +319,11 @@ enum fid_seq {
         FID_SEQ_QUOTA_GLB       = 0x200000006ULL,
         FID_SEQ_ROOT            = 0x200000007ULL,  /* Located on MDT0 */
         FID_SEQ_LAYOUT_RBTREE   = 0x200000008ULL,
+       /* sequence is used for update logs of cross-MDT operation */
+       FID_SEQ_UPDATE_LOG      = 0x200000009ULL,
+       /* Sequence is used for the directory under which update logs
+        * are created. */
+       FID_SEQ_UPDATE_LOG_DIR  = 0x20000000aULL,
         FID_SEQ_NORMAL          = 0x200000400ULL,
         FID_SEQ_LOV_DEFAULT     = 0xffffffffffffffffULL
  };
@@ -537,6 +435,20 @@ static inline void lu_echo_root_fid(struct lu_fid *fid)
         fid->f_ver = 0;
  }
  
+static inline void lu_update_log_fid(struct lu_fid *fid, __u32 index)
+{
+       fid->f_seq = FID_SEQ_UPDATE_LOG;
+       fid->f_oid = index;
+       fid->f_ver = 0;
+}
+
+static inline void lu_update_log_dir_fid(struct lu_fid *fid, __u32 index)
+{
+       fid->f_seq = FID_SEQ_UPDATE_LOG_DIR;
+       fid->f_oid = index;
+       fid->f_ver = 0;
+}
+
  /**
   * Check if a fid is igif or not.
   * \param fid the fid to be tested.
@@ -587,6 +499,26 @@ static inline int fid_is_layout_rbtree(const struct lu_fid *fid)
         return fid_seq(fid) == FID_SEQ_LAYOUT_RBTREE;
  }
  
+static inline bool fid_seq_is_update_log(__u64 seq)
+{
+       return seq == FID_SEQ_UPDATE_LOG;
+}
+
+static inline bool fid_is_update_log(const struct lu_fid *fid)
+{
+       return fid_seq_is_update_log(fid_seq(fid));
+}
+
+static inline bool fid_seq_is_update_log_dir(__u64 seq)
+{
+       return seq == FID_SEQ_UPDATE_LOG_DIR;
+}
+
+static inline bool fid_is_update_log_dir(const struct lu_fid *fid)
+{
+       return fid_seq_is_update_log_dir(fid_seq(fid));
+}
+
  /* convert an OST objid into an IDIF FID SEQ number */
  static inline __u64 fid_idif_seq(__u64 id, __u32 ost_idx)
  {
@@ -678,15 +610,15 @@ static inline void ostid_set_id(struct ost_id *oi, __u64 oid)
  {
         if (fid_seq_is_mdt0(oi->oi.oi_seq)) {
                 if (oid >= IDIF_MAX_OID) {
-                       CERROR("Bad "LPU64" to set "DOSTID"\n",
-                               oid, POSTID(oi));
+                       CERROR("Too large OID %#llx to set MDT0 "DOSTID"\n",
+                              (unsigned long long)oid, POSTID(oi));
                         return;
                 }
                 oi->oi.oi_id = oid;
         } else if (fid_is_idif(&oi->oi_fid)) {
                 if (oid >= IDIF_MAX_OID) {
-                       CERROR("Bad "LPU64" to set "DOSTID"\n",
-                               oid, POSTID(oi));
+                       CERROR("Too large OID %#llx to set IDIF "DOSTID"\n",
+                              (unsigned long long)oid, POSTID(oi));
                         return;
                 }
                 oi->oi_fid.f_seq = fid_idif_seq(oid,
@@ -695,8 +627,8 @@ static inline void ostid_set_id(struct ost_id *oi, __u64 oid)
                 oi->oi_fid.f_ver = oid >> 48;
         } else {
                 if (oid > OBIF_MAX_OID) {
-                       CERROR("Bad "LPU64" to set "DOSTID"\n",
-                               oid, POSTID(oi));
+                       CERROR("Too large oid %#llx to set REG "DOSTID"\n",
+                              (unsigned long long)oid, POSTID(oi));
                         return;
                 }
                 oi->oi_fid.f_oid = oid;
@@ -712,8 +644,8 @@ static inline int fid_set_id(struct lu_fid *fid, __u64 oid)
  
         if (fid_is_idif(fid)) {
                 if (oid >= IDIF_MAX_OID) {
-                       CERROR("Bad "LPU64" to set "DFID"\n",
-                               oid, PFID(fid));
+                       CERROR("Too large OID %#llx to set IDIF "DFID"\n",
+                              (unsigned long long)oid, PFID(fid));
                         return -EBADF;
                 }
                 fid->f_seq = fid_idif_seq(oid, fid_idif_ost_idx(fid));
@@ -721,8 +653,8 @@ static inline int fid_set_id(struct lu_fid *fid, __u64 oid)
                 fid->f_ver = oid >> 48;
         } else {
                 if (oid > OBIF_MAX_OID) {
-                       CERROR("Bad "LPU64" to set "DFID"\n",
-                               oid, PFID(fid));
+                       CERROR("Too large OID %#llx to set REG "DFID"\n",
+                              (unsigned long long)oid, PFID(fid));
                         return -EBADF;
                 }
                 fid->f_oid = oid;
@@ -770,10 +702,10 @@ static inline int ostid_to_fid(struct lu_fid *fid, const struct ost_id *ostid,
                 fid->f_ver = oid >> 48;
         } else if (likely(!fid_seq_is_default(seq)))
                 /* if (fid_seq_is_idif(seq) || fid_seq_is_norm(seq)) */ {
-               /* This is either an IDIF object, which identifies objects across
-                * all OSTs, or a regular FID.  The IDIF namespace maps legacy
-                * OST objects into the FID namespace.  In both cases, we just
-                * pass the FID through, no conversion needed. */
+               /* This is either an IDIF object, which identifies objects
+                * across all OSTs, or a regular FID.  The IDIF namespace maps
+                * legacy OST objects into the FID namespace.  In both cases,
+                * we just pass the FID through, no conversion needed. */
                 if (ostid->oi_fid.f_ver != 0) {
                         CERROR("bad MDT0 id(2), "DOSTID" ost_idx:%u\n",
                                 POSTID(ostid), ost_idx);
@@ -807,7 +739,8 @@ static inline int fid_to_ostid(const struct lu_fid *fid, struct ost_id *ostid)
  /* Check whether the fid is for LAST_ID */
  static inline bool fid_is_last_id(const struct lu_fid *fid)
  {
-       return fid_oid(fid) == 0;
+       return fid_oid(fid) == 0 && fid_seq(fid) != FID_SEQ_UPDATE_LOG &&
+              fid_seq(fid) != FID_SEQ_UPDATE_LOG_DIR;
  }
  
  /**
@@ -883,7 +816,6 @@ static inline bool fid_is_sane(const struct lu_fid *fid)
  }
  
  extern void lustre_swab_lu_fid(struct lu_fid *fid);
-extern void lustre_swab_lu_seq_range(struct lu_seq_range *range);
  
  static inline bool lu_fid_eq(const struct lu_fid *f0, const struct lu_fid *f1)
  {
@@ -962,19 +894,21 @@ enum lu_dirent_attrs {
         /* The following attrs are used for MDT internal only,
          * not visible to client */
  
-       /* Verify the dirent consistency */
-       LUDA_VERIFY             = 0x8000,
-       /* Only check but not repair the dirent inconsistency */
-       LUDA_VERIFY_DRYRUN      = 0x4000,
-       /* The dirent has been repaired, or to be repaired (dryrun). */
-       LUDA_REPAIR             = 0x2000,
-       /* The system is upgraded, has beed or to be repaired (dryrun). */
-       LUDA_UPGRADE            = 0x1000,
+       /* Something in the record is unknown, to be verified in further. */
+       LUDA_UNKNOWN            = 0x0400,
         /* Ignore this record, go to next directly. */
         LUDA_IGNORE             = 0x0800,
+       /* The system is upgraded, has beed or to be repaired (dryrun). */
+       LUDA_UPGRADE            = 0x1000,
+       /* The dirent has been repaired, or to be repaired (dryrun). */
+       LUDA_REPAIR             = 0x2000,
+       /* Only check but not repair the dirent inconsistency */
+       LUDA_VERIFY_DRYRUN      = 0x4000,
+       /* Verify the dirent consistency */
+       LUDA_VERIFY             = 0x8000,
  };
  
-#define LU_DIRENT_ATTRS_MASK   0xf800
+#define LU_DIRENT_ATTRS_MASK   0xff00
  
  /**
   * Layout of readdir pages, as transmitted on wire.
@@ -1163,8 +1097,11 @@ struct ptlrpc_body_v3 {
         __u64 pb_slv;
         /* VBR: pre-versions */
         __u64 pb_pre_versions[PTLRPC_NUM_VERSIONS];
+       __u64 pb_mbits; /**< match bits for bulk request */
         /* padding for future needs */
-       __u64 pb_padding[4];
+       __u64 pb_padding64_0;
+       __u64 pb_padding64_1;
+       __u64 pb_padding64_2;
         char  pb_jobid[LUSTRE_JOBID_SIZE];
  };
  #define ptlrpc_body     ptlrpc_body_v3
@@ -1191,8 +1128,11 @@ struct ptlrpc_body_v2 {
          __u64 pb_slv;
          /* VBR: pre-versions */
          __u64 pb_pre_versions[PTLRPC_NUM_VERSIONS];
+       __u64 pb_mbits; /**< unused in V2 */
          /* padding for future needs */
-        __u64 pb_padding[4];
+       __u64 pb_padding64_0;
+       __u64 pb_padding64_1;
+       __u64 pb_padding64_2;
  };
  
  extern void lustre_swab_ptlrpc_body(struct ptlrpc_body *pb);
@@ -1321,7 +1261,9 @@ extern void lustre_swab_ptlrpc_body(struct ptlrpc_body *pb);
  #define OBD_CONNECT_MULTIMODRPCS 0x200000000000000ULL /* support multiple modify
                                                          RPCs in parallel */
  #define OBD_CONNECT_DIR_STRIPE  0x400000000000000ULL /* striped DNE dir */
-
+#define OBD_CONNECT_SUBTREE    0x800000000000000ULL /* fileset mount */
+/** bulk matchbits is sent within ptlrpc_body */
+#define OBD_CONNECT_BULK_MBITS  0x2000000000000000ULL
  /* XXX README XXX:
   * Please DO NOT add flag values here before first ensuring that this same
   * flag value is not in use on some other branch.  Please clear any such
@@ -1354,8 +1296,7 @@ extern void lustre_swab_ptlrpc_body(struct ptlrpc_body *pb);
                                  OBD_CONNECT_CANCELSET | OBD_CONNECT_AT | \
                                  OBD_CONNECT_RMT_CLIENT | \
                                  OBD_CONNECT_RMT_CLIENT_FORCE | \
-                                OBD_CONNECT_BRW_SIZE | OBD_CONNECT_MDS_CAPA | \
-                                OBD_CONNECT_OSS_CAPA | OBD_CONNECT_MDS_MDS | \
+                               OBD_CONNECT_BRW_SIZE | OBD_CONNECT_MDS_MDS | \
                                  OBD_CONNECT_FID | LRU_RESIZE_CONNECT_FLAG | \
                                  OBD_CONNECT_VBR | OBD_CONNECT_LOV_V3 | \
                                 OBD_CONNECT_FULL20 | \
@@ -1367,12 +1308,14 @@ extern void lustre_swab_ptlrpc_body(struct ptlrpc_body *pb);
                                 OBD_CONNECT_FLOCK_DEAD | \
                                 OBD_CONNECT_DISP_STRIPE | OBD_CONNECT_LFSCK | \
                                 OBD_CONNECT_OPEN_BY_FID | \
-                               OBD_CONNECT_DIR_STRIPE)
+                               OBD_CONNECT_DIR_STRIPE | \
+                               OBD_CONNECT_BULK_MBITS | \
+                               OBD_CONNECT_MULTIMODRPCS)
  
  #define OST_CONNECT_SUPPORTED  (OBD_CONNECT_SRVLOCK | OBD_CONNECT_GRANT | \
                                  OBD_CONNECT_REQPORTAL | OBD_CONNECT_VERSION | \
                                  OBD_CONNECT_TRUNCLOCK | OBD_CONNECT_INDEX | \
-                               OBD_CONNECT_BRW_SIZE | OBD_CONNECT_OSS_CAPA | \
+                               OBD_CONNECT_BRW_SIZE | \
                                  OBD_CONNECT_CANCELSET | OBD_CONNECT_AT | \
                                  LRU_RESIZE_CONNECT_FLAG | OBD_CONNECT_CKSUM | \
                                  OBD_CONNECT_RMT_CLIENT | \
@@ -1385,11 +1328,13 @@ extern void lustre_swab_ptlrpc_body(struct ptlrpc_body *pb);
                                 OBD_CONNECT_JOBSTATS | \
                                 OBD_CONNECT_LIGHTWEIGHT | OBD_CONNECT_LVB_TYPE|\
                                 OBD_CONNECT_LAYOUTLOCK | OBD_CONNECT_FID | \
-                               OBD_CONNECT_PINGLESS | OBD_CONNECT_LFSCK)
+                               OBD_CONNECT_PINGLESS | OBD_CONNECT_LFSCK | \
+                               OBD_CONNECT_BULK_MBITS)
  #define ECHO_CONNECT_SUPPORTED (0)
  #define MGS_CONNECT_SUPPORTED  (OBD_CONNECT_VERSION | OBD_CONNECT_AT | \
                                 OBD_CONNECT_FULL20 | OBD_CONNECT_IMP_RECOV | \
-                               OBD_CONNECT_MNE_SWAB | OBD_CONNECT_PINGLESS)
+                               OBD_CONNECT_MNE_SWAB | OBD_CONNECT_PINGLESS |\
+                               OBD_CONNECT_BULK_MBITS)
  
  /* Features required for this version of the client to work with server */
  #define CLIENT_CONNECT_MDT_REQD (OBD_CONNECT_IBITS | OBD_CONNECT_FID | \
@@ -1750,7 +1695,7 @@ lov_mds_md_max_stripe_count(size_t buf_size, __u32 lmm_magic)
  #define OBD_MD_FLCKSUM     (0x00100000ULL) /* bulk data checksum */
  #define OBD_MD_FLQOS       (0x00200000ULL) /* quality of service stats */
  /*#define OBD_MD_FLOSCOPQ    (0x00400000ULL) osc opaque data, never used */
-#define OBD_MD_FLCOOKIE    (0x00800000ULL) /* log cancellation cookie */
+/*     OBD_MD_FLCOOKIE    (0x00800000ULL)    obsolete in 2.8 */
  #define OBD_MD_FLGROUP     (0x01000000ULL) /* group */
  #define OBD_MD_FLFID       (0x02000000ULL) /* ->ost write inline fid */
  #define OBD_MD_FLEPOCH     (0x04000000ULL) /* ->ost write with ioepoch */
@@ -1787,7 +1732,8 @@ lov_mds_md_max_stripe_count(size_t buf_size, __u32 lmm_magic)
  #define OBD_MD_FLRMTRGETFACL (0x0008000000000000ULL) /* lfs rgetfacl case */
  
  #define OBD_MD_FLDATAVERSION (0x0010000000000000ULL) /* iversion sum */
-#define OBD_MD_FLRELEASED    (0x0020000000000000ULL) /* file released */
+#define OBD_MD_CLOSE_INTENT_EXECED (0x0020000000000000ULL) /* close intent
+                                                             executed */
  
  #define OBD_MD_DEFAULT_MEA   (0x0040000000000000ULL) /* default MEA */
  
@@ -2206,15 +2152,18 @@ enum {
  #define MDS_STATUS_CONN 1
  #define MDS_STATUS_LOV 2
  
-#define LUSTRE_BFLAG_UNCOMMITTED_WRITES   0x1
-
  /* these should be identical to their EXT4_*_FL counterparts, they are
   * redefined here only to avoid dragging in fs/ext4/ext4.h */
-#define LUSTRE_SYNC_FL         0x00000008 /* Synchronous updates */
-#define LUSTRE_IMMUTABLE_FL    0x00000010 /* Immutable file */
-#define LUSTRE_APPEND_FL       0x00000020 /* writes to file may only append */
-#define LUSTRE_NOATIME_FL      0x00000080 /* do not update atime */
-#define LUSTRE_DIRSYNC_FL      0x00010000 /* dirsync behaviour (dir only) */
+#define LUSTRE_SYNC_FL         0x00000008 /* Synchronous updates */
+#define LUSTRE_IMMUTABLE_FL    0x00000010 /* Immutable file */
+#define LUSTRE_APPEND_FL       0x00000020 /* writes to file may only append */
+#define LUSTRE_NODUMP_FL       0x00000040 /* do not dump file */
+#define LUSTRE_NOATIME_FL      0x00000080 /* do not update atime */
+#define LUSTRE_INDEX_FL                0x00001000 /* hash-indexed directory */
+#define LUSTRE_DIRSYNC_FL      0x00010000 /* dirsync behaviour (dir only) */
+#define LUSTRE_TOPDIR_FL       0x00020000 /* Top of directory hierarchies*/
+#define LUSTRE_DIRECTIO_FL     0x00100000 /* Use direct i/o */
+#define LUSTRE_INLINE_DATA_FL  0x10000000 /* Inode has inline data. */
  
  #ifdef __KERNEL__
  /* Convert wire LUSTRE_*_FL to corresponding client local VFS S_* values
@@ -2271,7 +2220,7 @@ struct mdt_body {
         __u32   mbo_mode;
         __u32   mbo_uid;
         __u32   mbo_gid;
-       __u32   mbo_flags;
+       __u32   mbo_flags;   /* LUSTRE_*_FL file attributes */
         __u32   mbo_rdev;
         __u32   mbo_nlink; /* #bytes to read in the case of MDS_READPAGE */
         __u32   mbo_unused2; /* was "generation" until 2.4.0 */
@@ -2279,7 +2228,7 @@ struct mdt_body {
         __u32   mbo_eadatasize;
         __u32   mbo_aclsize;
         __u32   mbo_max_mdsize;
-       __u32   mbo_max_cookiesize;
+       __u32   mbo_unused3; /* was max_cookiesize until 2.8 */
         __u32   mbo_uid_h; /* high 32-bits of uid, for FUID */
         __u32   mbo_gid_h; /* high 32-bits of gid, for FUID */
         __u32   mbo_padding_5; /* also fix lustre_swab_mdt_body */
@@ -2428,23 +2377,6 @@ extern void lustre_swab_mdt_rec_setattr (struct mdt_rec_setattr *sa);
                               MDS_OPEN_BY_FID | MDS_OPEN_LEASE |        \
                               MDS_OPEN_RELEASE)
  
-/* permission for create non-directory file */
-#define MAY_CREATE      (1 << 7)
-/* permission for create directory file */
-#define MAY_LINK        (1 << 8)
-/* permission for delete from the directory */
-#define MAY_UNLINK      (1 << 9)
-/* source's permission for rename */
-#define MAY_RENAME_SRC  (1 << 10)
-/* target's permission for rename */
-#define MAY_RENAME_TAR  (1 << 11)
-/* part (parent's) VTX permission check */
-#define MAY_VTX_PART    (1 << 12)
-/* full VTX permission check */
-#define MAY_VTX_FULL    (1 << 13)
-/* lfs rgetfacl permission check */
-#define MAY_RGETFACL    (1 << 14)
-
  enum mds_op_bias {
         MDS_CHECK_SPLIT         = 1 << 0,
         MDS_CROSS_REF           = 1 << 1,
@@ -2460,6 +2392,7 @@ enum mds_op_bias {
         MDS_OWNEROVERRIDE       = 1 << 11,
         MDS_HSM_RELEASE         = 1 << 12,
         MDS_RENAME_MIGRATE      = 1 << 13,
+       MDS_CLOSE_LAYOUT_SWAP   = 1 << 14,
  };
  
  /* instance of mdt_reint_rec */
@@ -2871,9 +2804,11 @@ struct ldlm_res_id {
          __u64 name[RES_NAME_SIZE];
  };
  
-#define DLDLMRES       "["LPX64":"LPX64":"LPX64"]."LPX64i
-#define PLDLMRES(res)  (res)->lr_name.name[0], (res)->lr_name.name[1], \
-                       (res)->lr_name.name[2], (res)->lr_name.name[3]
+#define DLDLMRES       "[%#llx:%#llx:%#llx].%#llx"
+#define PLDLMRES(res)  (unsigned long long)(res)->lr_name.name[0],     \
+                       (unsigned long long)(res)->lr_name.name[1],     \
+                       (unsigned long long)(res)->lr_name.name[2],     \
+                       (unsigned long long)(res)->lr_name.name[3]
  
  extern void lustre_swab_ldlm_res_id (struct ldlm_res_id *id);
  
@@ -2884,27 +2819,27 @@ static inline bool ldlm_res_eq(const struct ldlm_res_id *res0,
  }
  
  /* lock types */
-typedef enum {
-        LCK_MINMODE = 0,
-        LCK_EX      = 1,
-        LCK_PW      = 2,
-        LCK_PR      = 4,
-        LCK_CW      = 8,
-        LCK_CR      = 16,
-        LCK_NL      = 32,
-        LCK_GROUP   = 64,
-        LCK_COS     = 128,
-        LCK_MAXMODE
+typedef enum ldlm_mode {
+       LCK_MINMODE     = 0,
+       LCK_EX          = 1,
+       LCK_PW          = 2,
+       LCK_PR          = 4,
+       LCK_CW          = 8,
+       LCK_CR          = 16,
+       LCK_NL          = 32,
+       LCK_GROUP       = 64,
+       LCK_COS         = 128,
+       LCK_MAXMODE
  } ldlm_mode_t;
  
  #define LCK_MODE_NUM    8
  
-typedef enum {
-        LDLM_PLAIN     = 10,
-        LDLM_EXTENT    = 11,
-        LDLM_FLOCK     = 12,
-        LDLM_IBITS     = 13,
-        LDLM_MAX_TYPE
+typedef enum ldlm_type {
+       LDLM_PLAIN      = 10,
+       LDLM_EXTENT     = 11,
+       LDLM_FLOCK      = 12,
+       LDLM_IBITS      = 13,
+       LDLM_MAX_TYPE
  } ldlm_type_t;
  
  #define LDLM_MIN_TYPE LDLM_PLAIN
@@ -2946,13 +2881,13 @@ struct ldlm_flock_wire {
   * this ever changes we will need to swab the union differently based
   * on the resource type. */
  
-typedef union {
-        struct ldlm_extent l_extent;
-        struct ldlm_flock_wire l_flock;
-        struct ldlm_inodebits l_inodebits;
+typedef union ldlm_wire_policy_data {
+       struct ldlm_extent      l_extent;
+       struct ldlm_flock_wire  l_flock;
+       struct ldlm_inodebits   l_inodebits;
  } ldlm_wire_policy_data_t;
  
-extern void lustre_swab_ldlm_policy_data (ldlm_wire_policy_data_t *d);
+extern void lustre_swab_ldlm_policy_data(union ldlm_wire_policy_data *d);
  
  union ldlm_gl_desc {
         struct ldlm_gl_lquota_desc      lquota_desc;
@@ -2960,28 +2895,46 @@ union ldlm_gl_desc {
  
  extern void lustre_swab_gl_desc(union ldlm_gl_desc *);
  
+enum ldlm_intent_flags {
+       IT_OPEN        = 0x00000001,
+       IT_CREAT       = 0x00000002,
+       IT_OPEN_CREAT  = 0x00000003,
+       IT_READDIR     = 0x00000004,
+       IT_GETATTR     = 0x00000008,
+       IT_LOOKUP      = 0x00000010,
+       IT_UNLINK      = 0x00000020,
+       IT_TRUNC       = 0x00000040,
+       IT_GETXATTR    = 0x00000080,
+       IT_EXEC        = 0x00000100,
+       IT_PIN         = 0x00000200,
+       IT_LAYOUT      = 0x00000400,
+       IT_QUOTA_DQACQ = 0x00000800,
+       IT_QUOTA_CONN  = 0x00001000,
+       IT_SETXATTR    = 0x00002000,
+};
+
  struct ldlm_intent {
-        __u64 opc;
+       __u64 opc;
  };
  
  extern void lustre_swab_ldlm_intent (struct ldlm_intent *i);
  
  struct ldlm_resource_desc {
-        ldlm_type_t lr_type;
-        __u32 lr_padding;       /* also fix lustre_swab_ldlm_resource_desc */
-        struct ldlm_res_id lr_name;
+       enum ldlm_type     lr_type;
+       __u32              lr_pad; /* also fix lustre_swab_ldlm_resource_desc */
+       struct ldlm_res_id lr_name;
  };
  
  extern void lustre_swab_ldlm_resource_desc (struct ldlm_resource_desc *r);
  
  struct ldlm_lock_desc {
-        struct ldlm_resource_desc l_resource;
-        ldlm_mode_t l_req_mode;
-        ldlm_mode_t l_granted_mode;
-        ldlm_wire_policy_data_t l_policy_data;
+       struct ldlm_resource_desc l_resource;
+       enum ldlm_mode l_req_mode;
+       enum ldlm_mode l_granted_mode;
+       union ldlm_wire_policy_data l_policy_data;
  };
  
-extern void lustre_swab_ldlm_lock_desc (struct ldlm_lock_desc *l);
+extern void lustre_swab_ldlm_lock_desc(struct ldlm_lock_desc *l);
  
  #define LDLM_LOCKREQ_HANDLES 2
  #define LDLM_ENQUEUE_CANCEL_OFF 1
@@ -3148,6 +3101,8 @@ enum llog_ctxt_id {
         /* for multiple changelog consumers */
         LLOG_CHANGELOG_USER_ORIG_CTXT = 14,
         LLOG_AGENT_ORIG_CTXT = 15, /**< agent requests generation on cdt */
+       LLOG_UPDATELOG_ORIG_CTXT = 16, /* update log */
+       LLOG_UPDATELOG_REPL_CTXT = 17, /* update log */
         LLOG_MAX_CTXTS
  };
  
@@ -3190,6 +3145,7 @@ typedef enum {
         CHANGELOG_REC           = LLOG_OP_MAGIC | 0x60000,
         CHANGELOG_USER_REC      = LLOG_OP_MAGIC | 0x70000,
         HSM_AGENT_REC           = LLOG_OP_MAGIC | 0x80000,
+       UPDATE_REC              = LLOG_OP_MAGIC | 0xa0000,
         LLOG_HDR_MAGIC          = LLOG_OP_MAGIC | 0x45539,
         LLOG_LOGID_MAGIC        = LLOG_OP_MAGIC | 0x4553b,
  } llog_op_type;
@@ -3372,41 +3328,63 @@ struct llog_gen_rec {
         struct llog_rec_tail    lgr_tail;
  };
  
-/* On-disk header structure of each log object, stored in little endian order */
-#define LLOG_CHUNK_SIZE         8192
-#define LLOG_HEADER_SIZE        (96)
-#define LLOG_BITMAP_BYTES       (LLOG_CHUNK_SIZE - LLOG_HEADER_SIZE)
-
-#define LLOG_MIN_REC_SIZE       (24) /* round(llog_rec_hdr + llog_rec_tail) */
-
  /* flags for the logs */
  enum llog_flag {
         LLOG_F_ZAP_WHEN_EMPTY   = 0x1,
         LLOG_F_IS_CAT           = 0x2,
         LLOG_F_IS_PLAIN         = 0x4,
         LLOG_F_EXT_JOBID        = 0x8,
+       LLOG_F_IS_FIXSIZE       = 0x10,
  
+       /* Note: Flags covered by LLOG_F_EXT_MASK will be inherited from
+        * catlog to plain log, so do not add LLOG_F_IS_FIXSIZE here,
+        * because the catlog record is usually fixed size, but its plain
+        * log record can be variable */
         LLOG_F_EXT_MASK = LLOG_F_EXT_JOBID,
  };
  
+/* On-disk header structure of each log object, stored in little endian order */
+#define LLOG_MIN_CHUNK_SIZE    8192
+#define LLOG_HEADER_SIZE        (96) /* sizeof (llog_log_hdr) + sizeof(llh_tail)
+                                     * - sizeof(llh_bitmap) */
+#define LLOG_BITMAP_BYTES       (LLOG_MIN_CHUNK_SIZE - LLOG_HEADER_SIZE)
+#define LLOG_MIN_REC_SIZE       (24) /* round(llog_rec_hdr + llog_rec_tail) */
+
  struct llog_log_hdr {
         struct llog_rec_hdr     llh_hdr;
         __s64                   llh_timestamp;
-        __u32                   llh_count;
-        __u32                   llh_bitmap_offset;
-        __u32                   llh_size;
-        __u32                   llh_flags;
-        __u32                   llh_cat_idx;
-        /* for a catalog the first plain slot is next to it */
-        struct obd_uuid         llh_tgtuuid;
-        __u32                   llh_reserved[LLOG_HEADER_SIZE/sizeof(__u32) - 23];
-        __u32                   llh_bitmap[LLOG_BITMAP_BYTES/sizeof(__u32)];
-        struct llog_rec_tail    llh_tail;
+       __u32                   llh_count;
+       __u32                   llh_bitmap_offset;
+       __u32                   llh_size;
+       __u32                   llh_flags;
+       /* for a catalog the first/oldest and still in-use plain slot is just
+        * next to it. It will serve as the upper limit after Catalog has
+        * wrapped around */
+       __u32                   llh_cat_idx;
+       struct obd_uuid         llh_tgtuuid;
+       __u32                   llh_reserved[LLOG_HEADER_SIZE/sizeof(__u32)-23];
+       /* These fields must always be at the end of the llog_log_hdr.
+        * Note: llh_bitmap size is variable because llog chunk size could be
+        * bigger than LLOG_MIN_CHUNK_SIZE, i.e. sizeof(llog_log_hdr) > 8192
+        * bytes, and the real size is stored in llh_hdr.lrh_len, which means
+        * llh_tail should only be refered by LLOG_HDR_TAIL().
+        * But this structure is also used by client/server llog interface
+        * (see llog_client.c), it will be kept in its original way to avoid
+        * compatiblity issue. */
+       __u32                   llh_bitmap[LLOG_BITMAP_BYTES / sizeof(__u32)];
+       struct llog_rec_tail    llh_tail;
  } __attribute__((packed));
-
-#define LLOG_BITMAP_SIZE(llh)  (__u32)((llh->llh_hdr.lrh_len -         \
-                                       llh->llh_bitmap_offset -        \
-                                       sizeof(llh->llh_tail)) * 8)
+#undef LLOG_HEADER_SIZE
+#undef LLOG_BITMAP_BYTES
+
+#define LLOG_HDR_BITMAP_SIZE(llh)      (__u32)((llh->llh_hdr.lrh_len - \
+                                        llh->llh_bitmap_offset -       \
+                                        sizeof(llh->llh_tail)) * 8)
+#define LLOG_HDR_BITMAP(llh)   (__u32 *)((char *)(llh) +               \
+                                         (llh)->llh_bitmap_offset)
+#define LLOG_HDR_TAIL(llh)     ((struct llog_rec_tail *)((char *)llh + \
+                                                llh->llh_hdr.lrh_len - \
+                                                sizeof(llh->llh_tail)))
  
  /** log cookies are used to reference a specific log file and a record therein */
  struct llog_cookie {
@@ -3475,7 +3453,8 @@ struct obdo {
         struct lustre_handle    o_handle;       /* brw: lock handle to prolong
                                                  * locks */
         struct llog_cookie      o_lcookie;      /* destroy: unlink cookie from
-                                                * MDS */
+                                                * MDS, obsolete in 2.8, reused
+                                                * in OSP */
         __u32                   o_uid_h;
         __u32                   o_gid_h;
  
@@ -3606,14 +3585,14 @@ struct ost_body {
  
  /* Key for FIEMAP to be used in get_info calls */
  struct ll_fiemap_info_key {
-        char    name[8];
-        struct  obdo oa;
-        struct  ll_user_fiemap fiemap;
+       char            lfik_name[8];
+       struct obdo     lfik_oa;
+       struct fiemap   lfik_fiemap;
  };
  
  extern void lustre_swab_ost_body (struct ost_body *b);
  extern void lustre_swab_ost_last_id(__u64 *id);
-extern void lustre_swab_fiemap(struct ll_user_fiemap *fiemap);
+extern void lustre_swab_fiemap(struct fiemap *fiemap);
  
  extern void lustre_swab_lov_user_md_v1(struct lov_user_md_v1 *lum);
  extern void lustre_swab_lov_user_md_v3(struct lov_user_md_v3 *lum);
@@ -3783,21 +3762,6 @@ enum {
  #define CAPA_OPC_MDS_DEFAULT ~CAPA_OPC_OSS_ONLY
  #define CAPA_OPC_OSS_DEFAULT ~(CAPA_OPC_MDS_ONLY | CAPA_OPC_OSS_ONLY)
  
-/* MDS capability covers object capability for operations of body r/w
- * (dir readpage/sendpage), index lookup/insert/delete and meta data r/w,
- * while OSS capability only covers object capability for operations of
- * oss data(file content) r/w/truncate.
- */
-static inline int capa_for_mds(struct lustre_capa *c)
-{
-        return (c->lc_opc & CAPA_OPC_INDEX_LOOKUP) != 0;
-}
-
-static inline int capa_for_oss(struct lustre_capa *c)
-{
-        return (c->lc_opc & CAPA_OPC_INDEX_LOOKUP) == 0;
-}
-
  static inline bool lovea_slot_is_dummy(const struct lov_ost_data_v1 *obj)
  {
         /* zero area does not care about the bytes-order. */
@@ -3944,9 +3908,11 @@ extern void lustre_swab_hsm_request(struct hsm_request *hr);
   */
  
  /**
- * Type of each update
+ * Type of each update, if adding/deleting update, please also update
+ * update_opcode in lustre/target/out_lib.c.
   */
  enum update_type {
+       OUT_START               = 0,
         OUT_CREATE              = 1,
         OUT_DESTROY             = 2,
         OUT_REF_ADD             = 3,
@@ -3960,6 +3926,9 @@ enum update_type {
         OUT_INDEX_DELETE        = 11,
         OUT_WRITE               = 12,
         OUT_XATTR_DEL           = 13,
+       OUT_PUNCH               = 14,
+       OUT_READ                = 15,
+       OUT_NOOP                = 16,
         OUT_LAST
  };
  
@@ -3987,7 +3956,7 @@ object_update_param_size(const struct object_update_param *param)
  struct object_update {
         __u16           ou_type;                /* enum update_type */
         __u16           ou_params_count;        /* update parameters count */
-       __u32           ou_master_index;        /* master MDT/OST index */
+       __u32           ou_result_size;         /* how many bytes can return */
         __u32           ou_flags;               /* enum update_flag */
         __u32           ou_padding1;            /* padding 1 */
         __u64           ou_batchid;             /* op transno on master */
@@ -4006,23 +3975,50 @@ struct object_update_request {
         struct object_update    ourq_updates[0];
  };
  
+#define OUT_UPDATE_HEADER_MAGIC                0xBDDF0001
+#define OUT_UPDATE_MAX_INLINE_SIZE     4096
+/* Header for updates request between MDTs */
+struct out_update_header {
+       __u32           ouh_magic;
+       __u32           ouh_count;
+       __u32           ouh_inline_length;
+       __u32           ouh_reply_size;
+       __u32           ouh_inline_data[0];
+};
+
+struct out_update_buffer {
+       __u32   oub_size;
+       __u32   oub_padding;
+};
+
  void lustre_swab_object_update(struct object_update *ou);
  void lustre_swab_object_update_request(struct object_update_request *our);
+void lustre_swab_out_update_header(struct out_update_header *ouh);
+void lustre_swab_out_update_buffer(struct out_update_buffer *oub);
  
  static inline size_t
-object_update_size(const struct object_update *update)
+object_update_params_size(const struct object_update *update)
  {
-       const struct    object_update_param *param;
-       size_t          size;
-       unsigned int    i;
+       const struct object_update_param *param;
+       size_t                           total_size = 0;
+       unsigned int                     i;
  
-       size = offsetof(struct object_update, ou_params[0]);
+       param = &update->ou_params[0];
         for (i = 0; i < update->ou_params_count; i++) {
-               param = (struct object_update_param *)((char *)update + size);
-               size += object_update_param_size(param);
+               size_t size = object_update_param_size(param);
+
+               param = (struct object_update_param *)((char *)param + size);
+               total_size += size;
         }
  
-       return size;
+       return total_size;
+}
+
+static inline size_t
+object_update_size(const struct object_update *update)
+{
+       return offsetof(struct object_update, ou_params[0]) +
+              object_update_params_size(update);
  }
  
  static inline struct object_update *
@@ -4095,6 +4091,30 @@ object_update_result_get(const struct object_update_reply *reply,
         return ptr;
  }
  
+/* read update result */
+struct out_read_reply {
+       __u32   orr_size;
+       __u32   orr_padding;
+       __u64   orr_offset;
+       char    orr_data[0];
+};
+
+static inline void orr_cpu_to_le(struct out_read_reply *orr_dst,
+                                const struct out_read_reply *orr_src)
+{
+       orr_dst->orr_size = cpu_to_le32(orr_src->orr_size);
+       orr_dst->orr_padding = cpu_to_le32(orr_src->orr_padding);
+       orr_dst->orr_offset = cpu_to_le64(orr_dst->orr_offset);
+}
+
+static inline void orr_le_to_cpu(struct out_read_reply *orr_dst,
+                                const struct out_read_reply *orr_src)
+{
+       orr_dst->orr_size = le32_to_cpu(orr_src->orr_size);
+       orr_dst->orr_padding = le32_to_cpu(orr_src->orr_padding);
+       orr_dst->orr_offset = le64_to_cpu(orr_dst->orr_offset);
+}
+
  /** layout swap request structure
   * fid1 and fid2 are in mdt_body
   */
@@ -4113,5 +4133,66 @@ struct close_data {
  
  void lustre_swab_close_data(struct close_data *data);
  
+struct update_ops;
+void lustre_swab_update_ops(struct update_ops *uops, unsigned int op_count);
+
+/* Update llog format */
+struct update_op {
+       struct lu_fid   uop_fid;
+       __u16           uop_type;
+       __u16           uop_param_count;
+       __u16           uop_params_off[0];
+};
+
+struct update_ops {
+       struct update_op        uops_op[0];
+};
+
+struct update_params {
+       struct object_update_param      up_params[0];
+};
+
+enum update_records_flag {
+       UPDATE_RECORD_CONTINUE = 1 >> 0,
+};
+/*
+ * This is the update record format used to store the updates in
+ * disk. All updates of the operation will be stored in ur_ops.
+ * All of parameters for updates of the operation will be stored
+ * in ur_params.
+ * To save the space of the record, parameters in ur_ops will only
+ * remember their offset in ur_params, so to avoid storing duplicate
+ * parameters in ur_params, which can help us save a lot space for
+ * operation like creating striped directory.
+ */
+struct update_records {
+       __u64                   ur_master_transno;
+       __u64                   ur_batchid;
+       __u32                   ur_flags;
+       /* If the operation includes multiple updates, then ur_index
+        * means the index of the update inside the whole updates. */
+       __u32                   ur_index;
+       __u32                   ur_update_count;
+       __u32                   ur_param_count;
+       struct update_ops       ur_ops;
+        /* Note ur_ops has a variable size, so comment out
+         * the following ur_params, in case some use it directly
+         * update_records->ur_params
+         *
+         * struct update_params        ur_params;
+         */
+};
+
+struct llog_update_record {
+       struct llog_rec_hdr     lur_hdr;
+       struct update_records   lur_update_rec;
+       /* Note ur_update_rec has a variable size, so comment out
+       * the following ur_tail, in case someone use it directly
+       *
+       * struct llog_rec_tail lur_tail;
+       */
+};
+
+
  #endif
  /** @} lustreidl */