LU-3289 gss: Cleanup gss print statements and comments
[fs/lustre-release.git] / lustre / ptlrpc / gss / sec_gss.c
index 1337b8e..9dd7898 100644 (file)
@@ -1,9 +1,10 @@
-/* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
- * vim:expandtab:shiftwidth=8:tabstop=8:
- *
+/*
  * Modifications for Lustre
- * Copyright 2004 - 2007, Cluster File Systems, Inc.
- * All rights reserved
+ *
+ * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
+ *
+ * Copyright (c) 2011, 2014, Intel Corporation.
+ *
  * Author: Eric Mei <ericm@clusterfs.com>
  */
 
  *
  */
 
-#ifndef EXPORT_SYMTAB
-# define EXPORT_SYMTAB
-#endif
 #define DEBUG_SUBSYSTEM S_SEC
-#ifdef __KERNEL__
 #include <linux/init.h>
 #include <linux/module.h>
 #include <linux/slab.h>
 #include <linux/dcache.h>
 #include <linux/fs.h>
-#include <linux/random.h>
 #include <linux/mutex.h>
 #include <asm/atomic.h>
-#else
-#include <liblustre.h>
-#endif
 
 #include <obd.h>
 #include <obd_class.h>
 #include <obd_support.h>
+#include <obd_cksum.h>
 #include <lustre/lustre_idl.h>
 #include <lustre_net.h>
 #include <lustre_import.h>
 #include "gss_api.h"
 
 #include <linux/crypto.h>
+#include <linux/crc32.h>
+
+/*
+ * Early replies have a fixed size in privacy and integrity mode respectively,
+ * so we calculate them only once.
+ */
+static int gss_at_reply_off_integ;
+static int gss_at_reply_off_priv;
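
For orientation, here is a hedged sketch of how such one-time offsets could be derived at initialization. The helper name gss_init_at_reply_offset(), the use of lustre_msg_early_size(), and the exact segment layout are illustrative assumptions rather than the code this patch actually adds; gss_mech_payload() is the estimator introduced further down in this file.

static void gss_init_at_reply_offset(void)
{
        __u32 buflens[3];
        int clearsize;

        /* integrity mode: gss header | early reply message | MIC */
        buflens[0] = PTLRPC_GSS_HEADER_SIZE;
        buflens[1] = lustre_msg_early_size();
        buflens[2] = gss_mech_payload(NULL, buflens[1], 0);
        gss_at_reply_off_integ = lustre_msg_size_v2(3, buflens);

        /* privacy mode: gss header | ciphertext of the early reply message */
        buflens[0] = lustre_msg_early_size();
        clearsize  = lustre_msg_size_v2(1, buflens);
        buflens[0] = PTLRPC_GSS_HEADER_SIZE;
        buflens[1] = gss_mech_payload(NULL, clearsize, 1);
        gss_at_reply_off_priv = lustre_msg_size_v2(2, buflens);
}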
 
 
 static inline int msg_last_segidx(struct lustre_msg *msg)
@@ -94,28 +96,29 @@ static inline int msg_last_seglen(struct lustre_msg *msg)
 static
 void gss_header_swabber(struct gss_header *ghdr)
 {
-        __swab32s(&ghdr->gh_version);
         __swab32s(&ghdr->gh_flags);
         __swab32s(&ghdr->gh_proc);
         __swab32s(&ghdr->gh_seq);
         __swab32s(&ghdr->gh_svc);
         __swab32s(&ghdr->gh_pad1);
-        __swab32s(&ghdr->gh_pad2);
-        __swab32s(&ghdr->gh_pad3);
         __swab32s(&ghdr->gh_handle.len);
 }
 
-struct gss_header *gss_swab_header(struct lustre_msg *msg, int segment)
+struct gss_header *gss_swab_header(struct lustre_msg *msg, int segment,
+                                   int swabbed)
 {
         struct gss_header *ghdr;
 
-        ghdr = lustre_swab_buf(msg, segment, sizeof(*ghdr),
-                               gss_header_swabber);
+        ghdr = lustre_msg_buf(msg, segment, sizeof(*ghdr));
+        if (ghdr == NULL)
+                return NULL;
 
-        if (ghdr &&
-            sizeof(*ghdr) + ghdr->gh_handle.len > msg->lm_buflens[segment]) {
-                CERROR("gss header require length %u, now %u received\n",
-                       (unsigned int) sizeof(*ghdr) + ghdr->gh_handle.len,
+        if (swabbed)
+                gss_header_swabber(ghdr);
+
+        if (sizeof(*ghdr) + ghdr->gh_handle.len > msg->lm_buflens[segment]) {
+                CERROR("gss header requires length %d, but only %u received\n",
+                       (int) sizeof(*ghdr) + ghdr->gh_handle.len,
                        msg->lm_buflens[segment]);
                 return NULL;
         }
@@ -123,6 +126,7 @@ struct gss_header *gss_swab_header(struct lustre_msg *msg, int segment)
         return ghdr;
 }
 
+#if 0
 static
 void gss_netobj_swabber(netobj_t *obj)
 {
@@ -143,38 +147,41 @@ netobj_t *gss_swab_netobj(struct lustre_msg *msg, int segment)
 
         return obj;
 }
+#endif
 
 /*
  * payload should be obtained from mechanism. but currently since we
  * only support kerberos, we could simply use fixed value.
- * krb5 header:         16
- * krb5 checksum:       20
+ * krb5 "meta" data:
+ *  - krb5 header:      16
+ *  - krb5 checksum:    20
+ *
+ * for privacy mode, the payload also includes the cipher text, which has the
+ * same size as the plain text, plus a possible confounder and padding, each
+ * up to the maximum cipher block size.
  */
 #define GSS_KRB5_INTEG_MAX_PAYLOAD      (40)
 
 static inline
-int gss_estimate_payload(struct gss_ctx *mechctx, int msgsize, int privacy)
+int gss_mech_payload(struct gss_ctx *mechctx, int msgsize, int privacy)
 {
-        if (privacy) {
-                /* we suppose max cipher block size is 16 bytes. here we
-                 * add 16 for confounder and 16 for padding. */
-                return GSS_KRB5_INTEG_MAX_PAYLOAD + msgsize + 16 + 16 + 16;
-        } else {
+        if (privacy)
+                return GSS_KRB5_INTEG_MAX_PAYLOAD + 16 + 16 + 16 + msgsize;
+        else
                 return GSS_KRB5_INTEG_MAX_PAYLOAD;
-        }
 }
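
As a worked example of the estimate above, assuming a 16-byte maximum cipher block (which is what the three 16-byte terms suggest): wrapping a 1024-byte clear message in privacy mode is budgeted at 40 + 16 + 16 + 16 + 1024 = 1112 bytes of token space, whereas integrity mode always reserves just the fixed 40 bytes of krb5 header plus checksum alongside the message itself.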
 
 /*
  * return signature size, otherwise < 0 to indicate error
  */
-static
-int gss_sign_msg(struct lustre_msg *msg,
-                 struct gss_ctx *mechctx,
-                 __u32 proc, __u32 seq, __u32 svc,
-                 rawobj_t *handle)
+static int gss_sign_msg(struct lustre_msg *msg,
+                        struct gss_ctx *mechctx,
+                        enum lustre_sec_part sp,
+                        __u32 flags, __u32 proc, __u32 seq, __u32 svc,
+                        rawobj_t *handle)
 {
         struct gss_header      *ghdr;
-        rawobj_t                text[3], mic;
+        rawobj_t                text[4], mic;
         int                     textcnt, max_textcnt, mic_idx;
         __u32                   major;
 
@@ -186,7 +193,8 @@ int gss_sign_msg(struct lustre_msg *msg,
         ghdr = lustre_msg_buf(msg, 0, 0);
 
         ghdr->gh_version = PTLRPC_GSS_VERSION;
-        ghdr->gh_flags = 0;
+        ghdr->gh_sp = (__u8) sp;
+        ghdr->gh_flags = flags;
         ghdr->gh_proc = proc;
         ghdr->gh_seq = seq;
         ghdr->gh_svc = svc;
@@ -214,7 +222,7 @@ int gss_sign_msg(struct lustre_msg *msg,
         mic.len = msg->lm_buflens[mic_idx];
         mic.data = lustre_msg_buf(msg, mic_idx, 0);
 
-        major = lgss_get_mic(mechctx, textcnt, text, &mic);
+        major = lgss_get_mic(mechctx, textcnt, text, 0, NULL, &mic);
         if (major != GSS_S_COMPLETE) {
                 CERROR("fail to generate MIC: %08x\n", major);
                 return -EPERM;
@@ -232,7 +240,7 @@ __u32 gss_verify_msg(struct lustre_msg *msg,
                      struct gss_ctx *mechctx,
                      __u32 svc)
 {
-        rawobj_t        text[3], mic;
+        rawobj_t        text[4], mic;
         int             textcnt, max_textcnt;
         int             mic_idx;
         __u32           major;
@@ -253,7 +261,7 @@ __u32 gss_verify_msg(struct lustre_msg *msg,
         mic.len = msg->lm_buflens[mic_idx];
         mic.data = lustre_msg_buf(msg, mic_idx, 0);
 
-        major = lgss_verify_mic(mechctx, textcnt, text, &mic);
+        major = lgss_verify_mic(mechctx, textcnt, text, 0, NULL, &mic);
         if (major != GSS_S_COMPLETE)
                 CERROR("mic verify error: %08x\n", major);
 
@@ -268,47 +276,39 @@ __u32 gss_unseal_msg(struct gss_ctx *mechctx,
                    struct lustre_msg *msgbuf,
                    int *msg_len, int msgbuf_len)
 {
-        rawobj_t                 clear_obj, micobj, msgobj, token;
+        rawobj_t                 clear_obj, hdrobj, token;
         __u8                    *clear_buf;
         int                      clear_buflen;
         __u32                    major;
         ENTRY;
 
-        if (msgbuf->lm_bufcount != 3) {
+        if (msgbuf->lm_bufcount != 2) {
                 CERROR("invalid bufcount %d\n", msgbuf->lm_bufcount);
                 RETURN(GSS_S_FAILURE);
         }
 
-        /* verify gss header */
-        msgobj.len = msgbuf->lm_buflens[0];
-        msgobj.data = lustre_msg_buf(msgbuf, 0, 0);
-        micobj.len = msgbuf->lm_buflens[1];
-        micobj.data = lustre_msg_buf(msgbuf, 1, 0);
-
-        major = lgss_verify_mic(mechctx, 1, &msgobj, &micobj);
-        if (major != GSS_S_COMPLETE) {
-                CERROR("priv: mic verify error: %08x\n", major);
-                RETURN(major);
-        }
-
-        /* temporary clear text buffer */
-        clear_buflen = msgbuf->lm_buflens[2];
-        OBD_ALLOC(clear_buf, clear_buflen);
+        /* allocate a temporary clear text buffer, the same size as the token;
+         * we assume the final clear text size <= token size */
+        clear_buflen = lustre_msg_buflen(msgbuf, 1);
+        OBD_ALLOC_LARGE(clear_buf, clear_buflen);
         if (!clear_buf)
                 RETURN(GSS_S_FAILURE);
 
-        token.len = msgbuf->lm_buflens[2];
-        token.data = lustre_msg_buf(msgbuf, 2, 0);
-
+        /* buffer objects */
+        hdrobj.len = lustre_msg_buflen(msgbuf, 0);
+        hdrobj.data = lustre_msg_buf(msgbuf, 0, 0);
+        token.len = lustre_msg_buflen(msgbuf, 1);
+        token.data = lustre_msg_buf(msgbuf, 1, 0);
         clear_obj.len = clear_buflen;
         clear_obj.data = clear_buf;
 
-        major = lgss_unwrap(mechctx, &token, &clear_obj);
+        major = lgss_unwrap(mechctx, &hdrobj, &token, &clear_obj);
         if (major != GSS_S_COMPLETE) {
-                CERROR("priv: unwrap message error: %08x\n", major);
+                CERROR("unwrap message error: %08x\n", major);
                 GOTO(out_free, major = GSS_S_FAILURE);
         }
         LASSERT(clear_obj.len <= clear_buflen);
+        LASSERT(clear_obj.len <= msgbuf_len);
 
         /* now the decrypted message */
         memcpy(msgbuf, clear_obj.data, clear_obj.len);
@@ -316,7 +316,7 @@ __u32 gss_unseal_msg(struct gss_ctx *mechctx,
 
         major = GSS_S_COMPLETE;
 out_free:
-        OBD_FREE(clear_buf, clear_buflen);
+        OBD_FREE_LARGE(clear_buf, clear_buflen);
         RETURN(major);
 }
 
@@ -326,30 +326,23 @@ out_free:
 
 int cli_ctx_expire(struct ptlrpc_cli_ctx *ctx)
 {
-        LASSERT(atomic_read(&ctx->cc_refcount));
+       LASSERT(atomic_read(&ctx->cc_refcount));
 
-        if (!test_and_set_bit(PTLRPC_CTX_DEAD_BIT, &ctx->cc_flags)) {
-                cfs_time_t now;
+       if (!test_and_set_bit(PTLRPC_CTX_DEAD_BIT, &ctx->cc_flags)) {
+               if (!ctx->cc_early_expire)
+                       clear_bit(PTLRPC_CTX_UPTODATE_BIT, &ctx->cc_flags);
 
-                if (!ctx->cc_early_expire)
-                        clear_bit(PTLRPC_CTX_UPTODATE_BIT, &ctx->cc_flags);
+               CWARN("ctx %p(%u->%s) expired: %lu(%+lds)\n",
+                     ctx, ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec),
+                     ctx->cc_expire,
+                     ctx->cc_expire == 0 ? 0 :
+                     cfs_time_sub(ctx->cc_expire, cfs_time_current_sec()));
 
-                now = cfs_time_current_sec();
-                if (ctx->cc_expire && cfs_time_aftereq(now, ctx->cc_expire))
-                        CWARN("ctx %p(%u->%s): get expired (%lds exceeds)\n",
-                              ctx, ctx->cc_vcred.vc_uid,
-                              sec2target_str(ctx->cc_sec),
-                              cfs_time_sub(now, ctx->cc_expire));
-                else
-                        CWARN("ctx %p(%u->%s): force to die (%lds remains)\n",
-                              ctx, ctx->cc_vcred.vc_uid,
-                              sec2target_str(ctx->cc_sec),
-                              ctx->cc_expire == 0 ? 0 :
-                              cfs_time_sub(ctx->cc_expire, now));
+               sptlrpc_cli_ctx_wakeup(ctx);
+               return 1;
+       }
 
-                return 1;
-        }
-        return 0;
+       return 0;
 }
 
 /*
@@ -385,81 +378,94 @@ void gss_cli_ctx_uptodate(struct gss_cli_ctx *gctx)
         }
 
         ctx->cc_expire = gss_round_ctx_expiry(ctx_expiry,
-                                              ctx->cc_sec->ps_flags);
+                                              ctx->cc_sec->ps_flvr.sf_flags);
 
         /* At this point this ctx might have been marked as dead by
          * someone else, in which case nobody will make further use
          * of it. we don't care, and mark it UPTODATE will help
-         * destroying server side context when it be destroied. */
-        set_bit(PTLRPC_CTX_UPTODATE_BIT, &ctx->cc_flags);
+         * destroying the server side context when it is destroyed. */
+       set_bit(PTLRPC_CTX_UPTODATE_BIT, &ctx->cc_flags);
+
+       if (sec_is_reverse(ctx->cc_sec)) {
+               CWARN("server installed reverse ctx %p idx "LPX64", "
+                     "expiry %lu(%+lds)\n", ctx,
+                     gss_handle_to_u64(&gctx->gc_handle),
+                     ctx->cc_expire,
+                     cfs_time_sub(ctx->cc_expire, cfs_time_current_sec()));
+        } else {
+               CWARN("client refreshed ctx %p idx "LPX64" (%u->%s), "
+                     "expiry %lu(%+lds)\n", ctx,
+                     gss_handle_to_u64(&gctx->gc_handle),
+                     ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec),
+                     ctx->cc_expire,
+                     cfs_time_sub(ctx->cc_expire, cfs_time_current_sec()));
 
-        if (sec_is_reverse(ctx->cc_sec))
-                CDEBUG(D_SEC, "server installed reverse ctx %p, "
-                       "will expire at %lu(%lds lifetime)\n",
-                       ctx, ctx->cc_expire,
-                       ctx->cc_expire - cfs_time_current_sec());
-        else
-                CWARN("client refreshed ctx %p(%u->%s), will expire at "
-                      "%lu(%lds lifetime)\n", ctx, ctx->cc_vcred.vc_uid,
-                      sec2target_str(ctx->cc_sec), ctx->cc_expire,
-                      ctx->cc_expire - cfs_time_current_sec());
+               /* install reverse svc ctx for root context */
+               if (ctx->cc_vcred.vc_uid == 0)
+                       gss_sec_install_rctx(ctx->cc_sec->ps_import,
+                                            ctx->cc_sec, ctx);
+       }
 
-        /* install reverse svc ctx, but only for forward connection
-         * and root context */
-        if (!sec_is_reverse(ctx->cc_sec) && ctx->cc_vcred.vc_uid == 0) {
-                gss_sec_install_rctx(ctx->cc_sec->ps_import,
-                                     ctx->cc_sec, ctx);
-        }
+        sptlrpc_cli_ctx_wakeup(ctx);
 }
 
-static
-void gss_cli_ctx_finalize(struct gss_cli_ctx *gctx)
+static void gss_cli_ctx_finalize(struct gss_cli_ctx *gctx)
 {
+        LASSERT(gctx->gc_base.cc_sec);
+
         if (gctx->gc_mechctx) {
                 lgss_delete_sec_context(&gctx->gc_mechctx);
                 gctx->gc_mechctx = NULL;
         }
 
+        if (!rawobj_empty(&gctx->gc_svc_handle)) {
+                /* forward ctx: mark buddy reverse svcctx soon-expire. */
+                if (!sec_is_reverse(gctx->gc_base.cc_sec) &&
+                    !rawobj_empty(&gctx->gc_svc_handle))
+                        gss_svc_upcall_expire_rvs_ctx(&gctx->gc_svc_handle);
+
+                rawobj_free(&gctx->gc_svc_handle);
+        }
+
         rawobj_free(&gctx->gc_handle);
 }
 
-/*
+/**
  * Based on sequence number algorithm as specified in RFC 2203.
  *
- * modified for our own problem: arriving request has valid sequence number,
+ * Modified for our own problem: arriving request has valid sequence number,
  * but unwrapping request might cost a long time, after that its sequence
  * are not valid anymore (fall behind the window). It rarely happen, mostly
  * under extreme load.
  *
- * note we should not check sequence before verify the integrity of incoming
+ * Note we should not check sequence before verifying the integrity of incoming
  * request, because just one attacking request with high sequence number might
- * cause all following request be dropped.
+ * cause all following requests to be dropped.
  *
- * so here we use a multi-phase approach: prepare 2 sequence windows,
+ * So here we use a multi-phase approach: prepare 2 sequence windows,
  * "main window" for normal sequence and "back window" for fall behind sequence.
  * and 3-phase checking mechanism:
- *  0 - before integrity verification, perform a initial sequence checking in
- *      main window, which only try and don't actually set any bits. if the
- *      sequence is high above the window or fit in the window and the bit
+ *  0 - before integrity verification, perform an initial sequence check in the
+ *      main window, which only tries and doesn't actually set any bits. if the
+ *      sequence is high above the window or fits in the window and the bit
  *      is 0, then accept and proceed to integrity verification. otherwise
  *      reject this sequence.
  *  1 - after integrity verification, check in main window again. if this
- *      sequence is high above the window or fit in the window and the bit
- *      is 0, then set the bit and accept; if it fit in the window but bit
- *      already set, then reject; if it fall behind the window, then proceed
+ *      sequence is high above the window or fits in the window and the bit
+ *      is 0, then set the bit and accept; if it fits in the window but bit
+ *      already set, then reject; if it falls behind the window, then proceed
  *      to phase 2.
- *  2 - check in back window. if it is high above the window or fit in the
+ *  2 - check in back window. if it is high above the window or fits in the
  *      window and the bit is 0, then set the bit and accept. otherwise reject.
  *
- * return value:
- *   1: looks like a replay
- *   0: is ok
- *  -1: is a replay
+ * \return      1:     looks like a replay
+ * \return      0:     is ok
+ * \return     -1:     is a replay
  *
- * note phase 0 is necessary, because otherwise replay attacking request of
+ * Note phase 0 is necessary, because otherwise replay attacking request of
  * sequence which between the 2 windows can't be detected.
  *
- * this mechanism can't totally solve the problem, but could help much less
+ * This mechanism can't totally solve the problem, but could help reduce the
+ * number of valid requests being dropped.
  */
 static
@@ -501,7 +507,7 @@ int gss_do_check_seq(unsigned long *window, __u32 win_size, __u32 *max_seq,
                  */
                 switch (phase) {
                 case 0:
-                        if (test_bit(seq_num % win_size, window))
+                       if (test_bit(seq_num % win_size, window))
                                 goto replay;
                         break;
                 case 1:
@@ -531,9 +537,9 @@ replay:
  */
 int gss_check_seq_num(struct gss_svc_seq_data *ssd, __u32 seq_num, int set)
 {
-        int rc = 0;
+       int rc = 0;
 
-        spin_lock(&ssd->ssd_lock);
+       spin_lock(&ssd->ssd_lock);
 
         if (set == 0) {
                 /*
@@ -567,19 +573,45 @@ int gss_check_seq_num(struct gss_svc_seq_data *ssd, __u32 seq_num, int set)
                         gss_stat_oos_record_svc(2, 0);
         }
 exit:
-        spin_unlock(&ssd->ssd_lock);
-        return rc;
+       spin_unlock(&ssd->ssd_lock);
+       return rc;
 }
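
To make the window mechanics documented above gss_do_check_seq() concrete, here is a minimal self-contained sketch of a single-window check, roughly covering phases 0 and 1; the real code additionally keeps the back window for the phase-2 fall-behind path, records out-of-sequence statistics, and serializes everything under ssd_lock as shown in gss_check_seq_num() above. The function name and the sliding policy are illustrative assumptions, not the Lustre implementation.

/* sketch only: 0 = ok, 1 = looks like a replay (can't tell without the
 * back window), -1 = definitely a replay, matching the convention above */
static int seq_window_check(unsigned long *window, __u32 win_size,
                            __u32 *max_seq, __u32 seq, int set)
{
        /* high above the window: always acceptable */
        if (seq > *max_seq) {
                if (set) {
                        /* slide the window forward, clearing the bits
                         * that fall out of it */
                        if (seq - *max_seq >= win_size) {
                                bitmap_zero(window, win_size);
                        } else {
                                __u32 i;

                                for (i = *max_seq + 1; i < seq; i++)
                                        clear_bit(i % win_size, window);
                        }
                        set_bit(seq % win_size, window);
                        *max_seq = seq;
                }
                return 0;
        }

        /* fell behind the window: only the back window could tell
         * whether this is a replay */
        if (*max_seq - seq >= win_size)
                return 1;

        /* inside the window: the bit says whether it was already seen */
        if (test_bit(seq % win_size, window))
                return -1;

        if (set)
                set_bit(seq % win_size, window);
        return 0;
}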
 
 /***************************************
  * cred APIs                           *
  ***************************************/
 
-static inline
-int gss_cli_payload(struct ptlrpc_cli_ctx *ctx,
-                    int msgsize, int privacy)
+static inline int gss_cli_payload(struct ptlrpc_cli_ctx *ctx,
+                                  int msgsize, int privacy)
 {
-        return gss_estimate_payload(NULL, msgsize, privacy);
+        return gss_mech_payload(NULL, msgsize, privacy);
+}
+
+static int gss_cli_bulk_payload(struct ptlrpc_cli_ctx *ctx,
+                                struct sptlrpc_flavor *flvr,
+                                int reply, int read)
+{
+        int     payload = sizeof(struct ptlrpc_bulk_sec_desc);
+
+        LASSERT(SPTLRPC_FLVR_BULK_TYPE(flvr->sf_rpc) == SPTLRPC_BULK_DEFAULT);
+
+        if ((!reply && !read) || (reply && read)) {
+                switch (SPTLRPC_FLVR_BULK_SVC(flvr->sf_rpc)) {
+                case SPTLRPC_BULK_SVC_NULL:
+                        break;
+                case SPTLRPC_BULK_SVC_INTG:
+                        payload += gss_cli_payload(ctx, 0, 0);
+                        break;
+                case SPTLRPC_BULK_SVC_PRIV:
+                        payload += gss_cli_payload(ctx, 0, 1);
+                        break;
+                case SPTLRPC_BULK_SVC_AUTH:
+                default:
+                        LBUG();
+                }
+        }
+
+        return payload;
 }
 
 int gss_cli_ctx_match(struct ptlrpc_cli_ctx *ctx, struct vfs_cred *vcred)
@@ -589,31 +621,29 @@ int gss_cli_ctx_match(struct ptlrpc_cli_ctx *ctx, struct vfs_cred *vcred)
 
 void gss_cli_ctx_flags2str(unsigned long flags, char *buf, int bufsize)
 {
-        buf[0] = '\0';
-
-        if (flags & PTLRPC_CTX_NEW)
-                strncat(buf, "new,", bufsize);
-        if (flags & PTLRPC_CTX_UPTODATE)
-                strncat(buf, "uptodate,", bufsize);
-        if (flags & PTLRPC_CTX_DEAD)
-                strncat(buf, "dead,", bufsize);
-        if (flags & PTLRPC_CTX_ERROR)
-                strncat(buf, "error,", bufsize);
-        if (flags & PTLRPC_CTX_CACHED)
-                strncat(buf, "cached,", bufsize);
-        if (flags & PTLRPC_CTX_ETERNAL)
-                strncat(buf, "eternal,", bufsize);
-        if (buf[0] == '\0')
-                strncat(buf, "-,", bufsize);
+       buf[0] = '\0';
 
-        buf[strlen(buf) - 1] = '\0';
+       if (flags & PTLRPC_CTX_NEW)
+               strlcat(buf, "new,", bufsize);
+       if (flags & PTLRPC_CTX_UPTODATE)
+               strlcat(buf, "uptodate,", bufsize);
+       if (flags & PTLRPC_CTX_DEAD)
+               strlcat(buf, "dead,", bufsize);
+       if (flags & PTLRPC_CTX_ERROR)
+               strlcat(buf, "error,", bufsize);
+       if (flags & PTLRPC_CTX_CACHED)
+               strlcat(buf, "cached,", bufsize);
+       if (flags & PTLRPC_CTX_ETERNAL)
+               strlcat(buf, "eternal,", bufsize);
+       if (buf[0] == '\0')
+               strlcat(buf, "-,", bufsize);
 }
 
 int gss_cli_ctx_sign(struct ptlrpc_cli_ctx *ctx,
                      struct ptlrpc_request *req)
 {
-        struct gss_cli_ctx      *gctx;
-        __u32                    seq, svc;
+        struct gss_cli_ctx      *gctx = ctx2gctx(ctx);
+        __u32                    flags = 0, seq, svc;
         int                      rc;
         ENTRY;
 
@@ -625,35 +655,40 @@ int gss_cli_ctx_sign(struct ptlrpc_cli_ctx *ctx,
         if (req->rq_ctx_init)
                 RETURN(0);
 
-        gctx = container_of(ctx, struct gss_cli_ctx, gc_base);
-        svc = SEC_FLAVOR_SVC(req->rq_sec_flavor);
-redo:
-        seq = atomic_inc_return(&gctx->gc_seq);
-
-        rc = gss_sign_msg(req->rq_reqbuf, gctx->gc_mechctx,
-                          gctx->gc_proc, seq, svc,
-                          &gctx->gc_handle);
-        if (rc < 0)
-                RETURN(rc);
+        svc = SPTLRPC_FLVR_SVC(req->rq_flvr.sf_rpc);
+        if (req->rq_pack_bulk)
+                flags |= LUSTRE_GSS_PACK_BULK;
+        if (req->rq_pack_udesc)
+                flags |= LUSTRE_GSS_PACK_USER;
 
-        /* gss_sign_msg() msg might take long time to finish, in which period
-         * more rpcs could be wrapped up and sent out. if we found too many
-         * of them we should repack this rpc, because sent it too late might
-         * lead to the sequence number fall behind the window on server and
-         * be dropped. also applies to gss_cli_ctx_seal().
-         *
-         * Note: null mode dosen't check sequence number. */
-        if (svc != SPTLRPC_SVC_NULL &&
-            atomic_read(&gctx->gc_seq) - seq > GSS_SEQ_REPACK_THRESHOLD) {
-                int behind = atomic_read(&gctx->gc_seq) - seq;
-
-                gss_stat_oos_record_cli(behind);
-                CWARN("req %p: %u behind, retry signing\n", req, behind);
-                goto redo;
-        }
-
-        req->rq_reqdata_len = rc;
-        RETURN(0);
+redo:
+       seq = atomic_inc_return(&gctx->gc_seq);
+
+       rc = gss_sign_msg(req->rq_reqbuf, gctx->gc_mechctx,
+                         ctx->cc_sec->ps_part,
+                         flags, gctx->gc_proc, seq, svc,
+                         &gctx->gc_handle);
+       if (rc < 0)
+               RETURN(rc);
+
+       /* gss_sign_msg() might take a long time, during which more rpcs
+        * could be wrapped up and sent out. if we find too many of them we
+        * should repack this rpc, because sending it too late might lead to
+        * the sequence number falling behind the window on the server and
+        * the rpc being dropped. also applies to gss_cli_ctx_seal().
+        *
+        * Note: null mode doesn't check sequence number. */
+       if (svc != SPTLRPC_SVC_NULL &&
+           atomic_read(&gctx->gc_seq) - seq > GSS_SEQ_REPACK_THRESHOLD) {
+               int behind = atomic_read(&gctx->gc_seq) - seq;
+
+               gss_stat_oos_record_cli(behind);
+               CWARN("req %p: %u behind, retry signing\n", req, behind);
+               goto redo;
+       }
+
+       req->rq_reqdata_len = rc;
+       RETURN(0);
 }
 
 static
@@ -668,50 +703,55 @@ int gss_cli_ctx_handle_err_notify(struct ptlrpc_cli_ctx *ctx,
 
         errhdr = (struct gss_err_header *) ghdr;
 
+        CWARN("req x"LPU64"/t"LPU64", ctx %p idx "LPX64"(%u->%s): "
+              "%sserver responded error (%08x/%08x)\n",
+              req->rq_xid, req->rq_transno, ctx,
+              gss_handle_to_u64(&ctx2gctx(ctx)->gc_handle),
+              ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec),
+              sec_is_reverse(ctx->cc_sec) ? "reverse" : "",
+              errhdr->gh_major, errhdr->gh_minor);
+
+        /* context fini rpc, let it fail */
+        if (req->rq_ctx_fini) {
+                CWARN("context fini rpc failed\n");
+                return -EINVAL;
+        }
+
+        /* reverse sec, just return error, don't expire this ctx because it's
+         * crucial to callback rpcs. note if the callback rpc failed because
+         * of bit flip during network transfer, the client will be evicted
+         * directly. a more graceful approach would be to let it retry a
+         * number of times. */
+        if (sec_is_reverse(ctx->cc_sec))
+                return -EINVAL;
+
+        if (errhdr->gh_major != GSS_S_NO_CONTEXT &&
+            errhdr->gh_major != GSS_S_BAD_SIG)
+                return -EACCES;
+
         /* server return NO_CONTEXT might be caused by context expire
-         * or server reboot/failover. we refresh the cred transparently
-         * to upper layer.
+         * or server reboot/failover. we try to refresh a new ctx which
+         * should be transparent to the upper layer.
+         *
          * In some cases, our gss handle is possible to be incidentally
          * identical to another handle since the handle itself is not
          * fully random. In krb5 case, the GSS_S_BAD_SIG will be
          * returned, maybe other gss error for other mechanism.
          *
          * if we add new mechanism, make sure the correct error are
-         * returned in this case.
-         *
-         * but in any cases, don't resend ctx destroying rpc, don't resend
-         * reverse rpc. */
-        if (req->rq_ctx_fini) {
-                CWARN("server respond error (%08x/%08x) for ctx fini\n",
-                      errhdr->gh_major, errhdr->gh_minor);
-                rc = -EINVAL;
-        } else if (sec_is_reverse(ctx->cc_sec)) {
-                CWARN("reverse server respond error (%08x/%08x)\n",
-                      errhdr->gh_major, errhdr->gh_minor);
-                rc = -EINVAL;
-        } else if (errhdr->gh_major == GSS_S_NO_CONTEXT ||
-                   errhdr->gh_major == GSS_S_BAD_SIG) {
-                CWARN("req x"LPU64"/t"LPU64": server respond ctx %p(%u->%s) "
-                      "%s, server might lost the context.\n",
-                      req->rq_xid, req->rq_transno, ctx, ctx->cc_vcred.vc_uid,
-                      sec2target_str(ctx->cc_sec),
-                      errhdr->gh_major == GSS_S_NO_CONTEXT ?
-                      "NO_CONTEXT" : "BAD_SIG");
-
-                sptlrpc_cli_ctx_expire(ctx);
-
-                /* we need replace the ctx right here, otherwise during
-                 * resent we'll hit the logic in sptlrpc_req_refresh_ctx()
-                 * which keep the ctx with RESEND flag, thus we'll never
-                 * get rid of this ctx. */
-                rc = sptlrpc_req_replace_dead_ctx(req);
-                if (rc == 0)
-                        req->rq_resend = 1;
-        } else {
-                CERROR("req %p: server report gss error (%x/%x)\n",
-                        req, errhdr->gh_major, errhdr->gh_minor);
-                rc = -EACCES;
-        }
+         * returned in this case. */
+        CWARN("%s: server might have lost the context, retrying\n",
+              errhdr->gh_major == GSS_S_NO_CONTEXT ? "NO_CONTEXT" : "BAD_SIG");
+
+        sptlrpc_cli_ctx_expire(ctx);
+
+        /* we need to replace the ctx right here, otherwise during
+         * resend we'll hit the logic in sptlrpc_req_refresh_ctx()
+         * which keeps the ctx with the RESEND flag, thus we'll never
+         * get rid of this ctx. */
+        rc = sptlrpc_req_replace_dead_ctx(req);
+        if (rc == 0)
+                req->rq_resend = 1;
 
         return rc;
 }
@@ -721,20 +761,19 @@ int gss_cli_ctx_verify(struct ptlrpc_cli_ctx *ctx,
 {
         struct gss_cli_ctx     *gctx;
         struct gss_header      *ghdr, *reqhdr;
-        struct lustre_msg      *msg = req->rq_repbuf;
+        struct lustre_msg      *msg = req->rq_repdata;
         __u32                   major;
-        int                     rc = 0;
+        int                     pack_bulk, swabbed, rc = 0;
         ENTRY;
 
         LASSERT(req->rq_cli_ctx == ctx);
         LASSERT(msg);
 
-        req->rq_repdata_len = req->rq_nob_received;
         gctx = container_of(ctx, struct gss_cli_ctx, gc_base);
 
         /* special case for context negotiation, rq_repmsg/rq_replen actually
-         * are not used currently. */
-        if (req->rq_ctx_init) {
+         * are not used currently. but early replies are always treated normally */
+        if (req->rq_ctx_init && !req->rq_early) {
                 req->rq_repmsg = lustre_msg_buf(msg, 1, 0);
                 req->rq_replen = msg->lm_buflens[1];
                 RETURN(0);
@@ -745,7 +784,9 @@ int gss_cli_ctx_verify(struct ptlrpc_cli_ctx *ctx,
                 RETURN(-EPROTO);
         }
 
-        ghdr = gss_swab_header(msg, 0);
+        swabbed = ptlrpc_rep_need_swab(req);
+
+        ghdr = gss_swab_header(msg, 0, swabbed);
         if (ghdr == NULL) {
                 CERROR("can't decode gss header\n");
                 RETURN(-EPROTO);
@@ -763,6 +804,14 @@ int gss_cli_ctx_verify(struct ptlrpc_cli_ctx *ctx,
 
         switch (ghdr->gh_proc) {
         case PTLRPC_GSS_PROC_DATA:
+                pack_bulk = ghdr->gh_flags & LUSTRE_GSS_PACK_BULK;
+
+                if (!req->rq_early && !equi(req->rq_pack_bulk == 1, pack_bulk)){
+                        CERROR("%s bulk flag in reply\n",
+                               req->rq_pack_bulk ? "missing" : "unexpected");
+                        RETURN(-EPROTO);
+                }
+
                 if (ghdr->gh_seq != reqhdr->gh_seq) {
                         CERROR("seqnum %u mismatch, expect %u\n",
                                ghdr->gh_seq, reqhdr->gh_seq);
@@ -775,29 +824,53 @@ int gss_cli_ctx_verify(struct ptlrpc_cli_ctx *ctx,
                         RETURN(-EPROTO);
                 }
 
-                if (lustre_msg_swabbed(msg))
+                if (swabbed)
                         gss_header_swabber(ghdr);
 
                 major = gss_verify_msg(msg, gctx->gc_mechctx, reqhdr->gh_svc);
-                if (major != GSS_S_COMPLETE)
+                if (major != GSS_S_COMPLETE) {
+                        CERROR("failed to verify reply: %x\n", major);
                         RETURN(-EPERM);
+                }
 
-                req->rq_repmsg = lustre_msg_buf(msg, 1, 0);
-                req->rq_replen = msg->lm_buflens[1];
+                if (req->rq_early && reqhdr->gh_svc == SPTLRPC_SVC_NULL) {
+                        __u32 cksum;
 
-                if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
-                        if (msg->lm_bufcount < 4) {
+                        cksum = crc32_le(!(__u32) 0,
+                                         lustre_msg_buf(msg, 1, 0),
+                                         lustre_msg_buflen(msg, 1));
+                        if (cksum != msg->lm_cksum) {
+                                CWARN("early reply checksum mismatch: "
+                                      "%08x != %08x\n", cksum, msg->lm_cksum);
+                                RETURN(-EPROTO);
+                        }
+                }
+
+                if (pack_bulk) {
+                        /* bulk checksum is right after the lustre msg */
+                        if (msg->lm_bufcount < 3) {
                                 CERROR("Invalid reply bufcount %u\n",
                                        msg->lm_bufcount);
                                 RETURN(-EPROTO);
                         }
 
-                        /* bulk checksum is the second last segment */
-                        rc = bulk_sec_desc_unpack(msg, msg->lm_bufcount - 2);
+                        rc = bulk_sec_desc_unpack(msg, 2, swabbed);
+                        if (rc) {
+                                CERROR("unpack bulk desc: %d\n", rc);
+                                RETURN(rc);
+                        }
                 }
+
+                req->rq_repmsg = lustre_msg_buf(msg, 1, 0);
+                req->rq_replen = msg->lm_buflens[1];
                 break;
         case PTLRPC_GSS_PROC_ERR:
-                rc = gss_cli_ctx_handle_err_notify(ctx, req, ghdr);
+                if (req->rq_early) {
+                        CERROR("server returned error with early reply\n");
+                        rc = -EPROTO;
+                } else {
+                        rc = gss_cli_ctx_handle_err_notify(ctx, req, ghdr);
+                }
                 break;
         default:
                 CERROR("unknown gss proc %d\n", ghdr->gh_proc);
@@ -811,10 +884,10 @@ int gss_cli_ctx_seal(struct ptlrpc_cli_ctx *ctx,
                      struct ptlrpc_request *req)
 {
         struct gss_cli_ctx      *gctx;
-        rawobj_t                 msgobj, cipher_obj, micobj;
+        rawobj_t                 hdrobj, msgobj, token;
         struct gss_header       *ghdr;
-        int                      buflens[3], wiresize, rc;
-        __u32                    major;
+        __u32                    buflens[2], major;
+        int                      wiresize, rc;
         ENTRY;
 
         LASSERT(req->rq_clrbuf);
@@ -823,15 +896,14 @@ int gss_cli_ctx_seal(struct ptlrpc_cli_ctx *ctx,
 
         gctx = container_of(ctx, struct gss_cli_ctx, gc_base);
 
-        /* close clear data length */
+        /* final clear data length */
         req->rq_clrdata_len = lustre_msg_size_v2(req->rq_clrbuf->lm_bufcount,
                                                  req->rq_clrbuf->lm_buflens);
 
         /* calculate wire data length */
         buflens[0] = PTLRPC_GSS_HEADER_SIZE;
-        buflens[1] = gss_cli_payload(&gctx->gc_base, buflens[0], 0);
-        buflens[2] = gss_cli_payload(&gctx->gc_base, req->rq_clrdata_len, 1);
-        wiresize = lustre_msg_size_v2(3, buflens);
+        buflens[1] = gss_cli_payload(&gctx->gc_base, req->rq_clrdata_len, 1);
+        wiresize = lustre_msg_size_v2(2, buflens);
 
         /* allocate wire buffer */
         if (req->rq_pool) {
@@ -840,83 +912,71 @@ int gss_cli_ctx_seal(struct ptlrpc_cli_ctx *ctx,
                 LASSERT(req->rq_reqbuf != req->rq_clrbuf);
                 LASSERT(req->rq_reqbuf_len >= wiresize);
         } else {
-                OBD_ALLOC(req->rq_reqbuf, wiresize);
+                OBD_ALLOC_LARGE(req->rq_reqbuf, wiresize);
                 if (!req->rq_reqbuf)
                         RETURN(-ENOMEM);
                 req->rq_reqbuf_len = wiresize;
         }
 
-        lustre_init_msg_v2(req->rq_reqbuf, 3, buflens, NULL);
-        req->rq_reqbuf->lm_secflvr = req->rq_sec_flavor;
+        lustre_init_msg_v2(req->rq_reqbuf, 2, buflens, NULL);
+        req->rq_reqbuf->lm_secflvr = req->rq_flvr.sf_rpc;
 
         /* gss header */
         ghdr = lustre_msg_buf(req->rq_reqbuf, 0, 0);
         ghdr->gh_version = PTLRPC_GSS_VERSION;
+        ghdr->gh_sp = (__u8) ctx->cc_sec->ps_part;
         ghdr->gh_flags = 0;
         ghdr->gh_proc = gctx->gc_proc;
-        ghdr->gh_seq = atomic_inc_return(&gctx->gc_seq);
         ghdr->gh_svc = SPTLRPC_SVC_PRIV;
         ghdr->gh_handle.len = gctx->gc_handle.len;
         memcpy(ghdr->gh_handle.data, gctx->gc_handle.data, gctx->gc_handle.len);
+        if (req->rq_pack_bulk)
+                ghdr->gh_flags |= LUSTRE_GSS_PACK_BULK;
+        if (req->rq_pack_udesc)
+                ghdr->gh_flags |= LUSTRE_GSS_PACK_USER;
 
 redo:
-        /* header signature */
-        msgobj.len = req->rq_reqbuf->lm_buflens[0];
-        msgobj.data = lustre_msg_buf(req->rq_reqbuf, 0, 0);
-        micobj.len = req->rq_reqbuf->lm_buflens[1];
-        micobj.data = lustre_msg_buf(req->rq_reqbuf, 1, 0);
+       ghdr->gh_seq = atomic_inc_return(&gctx->gc_seq);
 
-        major = lgss_get_mic(gctx->gc_mechctx, 1, &msgobj, &micobj);
-        if (major != GSS_S_COMPLETE) {
-                CERROR("priv: sign message error: %08x\n", major);
-                GOTO(err_free, rc = -EPERM);
-        }
-        /* perhaps shrink msg has potential problem in re-packing???
-         * ship a little bit more data is fine.
-        lustre_shrink_msg(req->rq_reqbuf, 1, micobj.len, 0);
-         */
-
-        /* clear text */
+        /* buffer objects */
+        hdrobj.len = PTLRPC_GSS_HEADER_SIZE;
+        hdrobj.data = (__u8 *) ghdr;
         msgobj.len = req->rq_clrdata_len;
         msgobj.data = (__u8 *) req->rq_clrbuf;
+        token.len = lustre_msg_buflen(req->rq_reqbuf, 1);
+        token.data = lustre_msg_buf(req->rq_reqbuf, 1, 0);
 
-        /* cipher text */
-        cipher_obj.len = req->rq_reqbuf->lm_buflens[2];
-        cipher_obj.data = lustre_msg_buf(req->rq_reqbuf, 2, 0);
-
-        major = lgss_wrap(gctx->gc_mechctx, &msgobj, req->rq_clrbuf_len,
-                          &cipher_obj);
+        major = lgss_wrap(gctx->gc_mechctx, &hdrobj, &msgobj,
+                          req->rq_clrbuf_len, &token);
         if (major != GSS_S_COMPLETE) {
                 CERROR("priv: wrap message error: %08x\n", major);
                 GOTO(err_free, rc = -EPERM);
         }
-        LASSERT(cipher_obj.len <= buflens[2]);
-
-        /* see explain in gss_cli_ctx_sign() */
-        if (atomic_read(&gctx->gc_seq) - ghdr->gh_seq >
-            GSS_SEQ_REPACK_THRESHOLD) {
-                int behind = atomic_read(&gctx->gc_seq) - ghdr->gh_seq;
+        LASSERT(token.len <= buflens[1]);
 
-                gss_stat_oos_record_cli(behind);
-                CWARN("req %p: %u behind, retry sealing\n", req, behind);
+       /* see the explanation in gss_cli_ctx_sign() */
+       if (unlikely(atomic_read(&gctx->gc_seq) - ghdr->gh_seq >
+                    GSS_SEQ_REPACK_THRESHOLD)) {
+               int behind = atomic_read(&gctx->gc_seq) - ghdr->gh_seq;
 
-                ghdr->gh_seq = atomic_inc_return(&gctx->gc_seq);
-                goto redo;
-        }
+               gss_stat_oos_record_cli(behind);
+               CWARN("req %p: %u behind, retry sealing\n", req, behind);
 
-        /* now set the final wire data length */
-        req->rq_reqdata_len = lustre_shrink_msg(req->rq_reqbuf, 2,
-                                                cipher_obj.len, 0);
+               ghdr->gh_seq = atomic_inc_return(&gctx->gc_seq);
+               goto redo;
+       }
 
-        RETURN(0);
+       /* now set the final wire data length */
+       req->rq_reqdata_len = lustre_shrink_msg(req->rq_reqbuf, 1, token.len,0);
+       RETURN(0);
 
 err_free:
-        if (!req->rq_pool) {
-                OBD_FREE(req->rq_reqbuf, req->rq_reqbuf_len);
-                req->rq_reqbuf = NULL;
-                req->rq_reqbuf_len = 0;
-        }
-        RETURN(rc);
+       if (!req->rq_pool) {
+               OBD_FREE_LARGE(req->rq_reqbuf, req->rq_reqbuf_len);
+               req->rq_reqbuf = NULL;
+               req->rq_reqbuf_len = 0;
+       }
+       RETURN(rc);
 }
 
 int gss_cli_ctx_unseal(struct ptlrpc_cli_ctx *ctx,
@@ -924,16 +984,19 @@ int gss_cli_ctx_unseal(struct ptlrpc_cli_ctx *ctx,
 {
         struct gss_cli_ctx      *gctx;
         struct gss_header       *ghdr;
-        int                      msglen, rc;
+        struct lustre_msg       *msg = req->rq_repdata;
+        int                      msglen, pack_bulk, swabbed, rc;
         __u32                    major;
         ENTRY;
 
-        LASSERT(req->rq_repbuf);
         LASSERT(req->rq_cli_ctx == ctx);
+        LASSERT(req->rq_ctx_init == 0);
+        LASSERT(msg);
 
         gctx = container_of(ctx, struct gss_cli_ctx, gc_base);
+        swabbed = ptlrpc_rep_need_swab(req);
 
-        ghdr = gss_swab_header(req->rq_repbuf, 0);
+        ghdr = gss_swab_header(msg, 0, swabbed);
         if (ghdr == NULL) {
                 CERROR("can't decode gss header\n");
                 RETURN(-EPROTO);
@@ -948,47 +1011,65 @@ int gss_cli_ctx_unseal(struct ptlrpc_cli_ctx *ctx,
 
         switch (ghdr->gh_proc) {
         case PTLRPC_GSS_PROC_DATA:
-                if (lustre_msg_swabbed(req->rq_repbuf))
+                pack_bulk = ghdr->gh_flags & LUSTRE_GSS_PACK_BULK;
+
+                if (!req->rq_early && !equi(req->rq_pack_bulk == 1, pack_bulk)){
+                        CERROR("%s bulk flag in reply\n",
+                               req->rq_pack_bulk ? "missing" : "unexpected");
+                        RETURN(-EPROTO);
+                }
+
+                if (swabbed)
                         gss_header_swabber(ghdr);
 
-                major = gss_unseal_msg(gctx->gc_mechctx, req->rq_repbuf,
-                                       &msglen, req->rq_repbuf_len);
+                /* use rq_repdata_len as buffer size, which assumes unsealing
+                 * doesn't need extra memory space. for precise control, we'd
+                 * better calculate the actual buffer size as
+                 * (repbuf_len - offset - repdata_len) */
+                major = gss_unseal_msg(gctx->gc_mechctx, msg,
+                                       &msglen, req->rq_repdata_len);
                 if (major != GSS_S_COMPLETE) {
+                        CERROR("failed to unwrap reply: %x\n", major);
                         rc = -EPERM;
                         break;
                 }
 
-                if (lustre_unpack_msg(req->rq_repbuf, msglen)) {
+                swabbed = __lustre_unpack_msg(msg, msglen);
+                if (swabbed < 0) {
                         CERROR("Failed to unpack after decryption\n");
                         RETURN(-EPROTO);
                 }
-                req->rq_repdata_len = msglen;
 
-                if (req->rq_repbuf->lm_bufcount < 1) {
+                if (msg->lm_bufcount < 1) {
                         CERROR("Invalid reply buffer: empty\n");
                         RETURN(-EPROTO);
                 }
 
-                if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
-                        if (req->rq_repbuf->lm_bufcount < 2) {
-                                CERROR("Too few request buffer segments %d\n",
-                                       req->rq_repbuf->lm_bufcount);
+                if (pack_bulk) {
+                        if (msg->lm_bufcount < 2) {
+                                CERROR("bufcount %u: missing bulk sec desc\n",
+                                       msg->lm_bufcount);
                                 RETURN(-EPROTO);
                         }
 
                         /* bulk checksum is the last segment */
-                        if (bulk_sec_desc_unpack(req->rq_repbuf,
-                                                 req->rq_repbuf->lm_bufcount-1))
+                        if (bulk_sec_desc_unpack(msg, msg->lm_bufcount - 1,
+                                                 swabbed))
                                 RETURN(-EPROTO);
                 }
 
-                req->rq_repmsg = lustre_msg_buf(req->rq_repbuf, 0, 0);
-                req->rq_replen = req->rq_repbuf->lm_buflens[0];
+                req->rq_repmsg = lustre_msg_buf(msg, 0, 0);
+                req->rq_replen = msg->lm_buflens[0];
 
                 rc = 0;
                 break;
         case PTLRPC_GSS_PROC_ERR:
-                rc = gss_cli_ctx_handle_err_notify(ctx, req, ghdr);
+                if (req->rq_early) {
+                        CERROR("server returned error with early reply\n");
+                        rc = -EPROTO;
+                } else {
+                        rc = gss_cli_ctx_handle_err_notify(ctx, req, ghdr);
+                }
                 break;
         default:
                 CERROR("unexpected proc %d\n", ghdr->gh_proc);
@@ -1016,75 +1097,78 @@ int gss_install_rvs_svc_ctx(struct obd_import *imp,
 int gss_sec_create_common(struct gss_sec *gsec,
                           struct ptlrpc_sec_policy *policy,
                           struct obd_import *imp,
-                          struct ptlrpc_svc_ctx *ctx,
-                          __u32 flavor,
-                          unsigned long flags)
+                          struct ptlrpc_svc_ctx *svcctx,
+                          struct sptlrpc_flavor *sf)
 {
         struct ptlrpc_sec   *sec;
 
         LASSERT(imp);
-        LASSERT(SEC_FLAVOR_POLICY(flavor) == SPTLRPC_POLICY_GSS);
+        LASSERT(SPTLRPC_FLVR_POLICY(sf->sf_rpc) == SPTLRPC_POLICY_GSS);
 
-        gsec->gs_mech = lgss_subflavor_to_mech(SEC_FLAVOR_SUB(flavor));
+        gsec->gs_mech = lgss_subflavor_to_mech(
+                                SPTLRPC_FLVR_BASE_SUB(sf->sf_rpc));
         if (!gsec->gs_mech) {
-                CERROR("gss backend 0x%x not found\n", SEC_FLAVOR_SUB(flavor));
+                CERROR("gss backend 0x%x not found\n",
+                       SPTLRPC_FLVR_BASE_SUB(sf->sf_rpc));
                 return -EOPNOTSUPP;
         }
 
-        spin_lock_init(&gsec->gs_lock);
+       spin_lock_init(&gsec->gs_lock);
         gsec->gs_rvs_hdl = 0ULL;
 
-        /* initialize upper ptlrpc_sec */
-        sec = &gsec->gs_base;
-        sec->ps_policy = policy;
-        sec->ps_flavor = flavor;
-        sec->ps_flags = flags;
-        sec->ps_import = class_import_get(imp);
-        sec->ps_lock = SPIN_LOCK_UNLOCKED;
-        atomic_set(&sec->ps_busy, 0);
-        CFS_INIT_LIST_HEAD(&sec->ps_gc_list);
-
-        if (!ctx) {
+       /* initialize upper ptlrpc_sec */
+       sec = &gsec->gs_base;
+       sec->ps_policy = policy;
+       atomic_set(&sec->ps_refcount, 0);
+       atomic_set(&sec->ps_nctx, 0);
+       sec->ps_id = sptlrpc_get_next_secid();
+       sec->ps_flvr = *sf;
+       sec->ps_import = class_import_get(imp);
+       spin_lock_init(&sec->ps_lock);
+       INIT_LIST_HEAD(&sec->ps_gc_list);
+
+        if (!svcctx) {
                 sec->ps_gc_interval = GSS_GC_INTERVAL;
-                sec->ps_gc_next = cfs_time_current_sec() + sec->ps_gc_interval;
         } else {
                 LASSERT(sec_is_reverse(sec));
 
                 /* never do gc on reverse sec */
                 sec->ps_gc_interval = 0;
-                sec->ps_gc_next = 0;
         }
 
-        if (SEC_FLAVOR_SVC(flavor) == SPTLRPC_SVC_PRIV &&
-            flags & PTLRPC_SEC_FL_BULK)
+        if (SPTLRPC_FLVR_BULK_SVC(sec->ps_flvr.sf_rpc) == SPTLRPC_BULK_SVC_PRIV)
                 sptlrpc_enc_pool_add_user();
 
-        CDEBUG(D_SEC, "create %s%s@%p\n", (ctx ? "reverse " : ""),
+        CDEBUG(D_SEC, "create %s%s@%p\n", (svcctx ? "reverse " : ""),
                policy->sp_name, gsec);
         return 0;
 }
 
 void gss_sec_destroy_common(struct gss_sec *gsec)
 {
-        struct ptlrpc_sec      *sec = &gsec->gs_base;
-        ENTRY;
+       struct ptlrpc_sec       *sec = &gsec->gs_base;
+       ENTRY;
 
-        LASSERT(sec->ps_import);
-        LASSERT(atomic_read(&sec->ps_refcount) == 0);
-        LASSERT(atomic_read(&sec->ps_busy) == 0);
+       LASSERT(sec->ps_import);
+       LASSERT(atomic_read(&sec->ps_refcount) == 0);
+       LASSERT(atomic_read(&sec->ps_nctx) == 0);
 
-        if (gsec->gs_mech) {
-                lgss_mech_put(gsec->gs_mech);
-                gsec->gs_mech = NULL;
-        }
+       if (gsec->gs_mech) {
+               lgss_mech_put(gsec->gs_mech);
+               gsec->gs_mech = NULL;
+       }
 
-        class_import_put(sec->ps_import);
+       class_import_put(sec->ps_import);
 
-        if (SEC_FLAVOR_SVC(sec->ps_flavor) == SPTLRPC_SVC_PRIV &&
-            sec->ps_flags & PTLRPC_SEC_FL_BULK)
-                sptlrpc_enc_pool_del_user();
+       if (SPTLRPC_FLVR_BULK_SVC(sec->ps_flvr.sf_rpc) == SPTLRPC_BULK_SVC_PRIV)
+               sptlrpc_enc_pool_del_user();
 
-        EXIT;
+       EXIT;
+}
+
+void gss_sec_kill(struct ptlrpc_sec *sec)
+{
+       sec->ps_dying = 1;
 }
 
 int gss_cli_ctx_init_common(struct ptlrpc_sec *sec,
@@ -1092,74 +1176,79 @@ int gss_cli_ctx_init_common(struct ptlrpc_sec *sec,
                             struct ptlrpc_ctx_ops *ctxops,
                             struct vfs_cred *vcred)
 {
-        struct gss_cli_ctx    *gctx = ctx2gctx(ctx);
+       struct gss_cli_ctx      *gctx = ctx2gctx(ctx);
 
-        gctx->gc_win = 0;
-        atomic_set(&gctx->gc_seq, 0);
+       gctx->gc_win = 0;
+       atomic_set(&gctx->gc_seq, 0);
 
-        CFS_INIT_HLIST_NODE(&ctx->cc_cache);
-        atomic_set(&ctx->cc_refcount, 0);
-        ctx->cc_sec = sec;
-        ctx->cc_ops = ctxops;
-        ctx->cc_expire = 0;
-        ctx->cc_flags = PTLRPC_CTX_NEW;
-        ctx->cc_vcred = *vcred;
-        spin_lock_init(&ctx->cc_lock);
-        CFS_INIT_LIST_HEAD(&ctx->cc_req_list);
-        CFS_INIT_LIST_HEAD(&ctx->cc_gc_chain);
+       INIT_HLIST_NODE(&ctx->cc_cache);
+       atomic_set(&ctx->cc_refcount, 0);
+       ctx->cc_sec = sec;
+       ctx->cc_ops = ctxops;
+       ctx->cc_expire = 0;
+       ctx->cc_flags = PTLRPC_CTX_NEW;
+       ctx->cc_vcred = *vcred;
+       spin_lock_init(&ctx->cc_lock);
+       INIT_LIST_HEAD(&ctx->cc_req_list);
+       INIT_LIST_HEAD(&ctx->cc_gc_chain);
 
-        /* take a ref on belonging sec */
-        atomic_inc(&sec->ps_busy);
+       /* take a ref on the owning sec, balanced when the ctx is destroyed */
+       atomic_inc(&sec->ps_refcount);
+       /* statistic only */
+       atomic_inc(&sec->ps_nctx);
 
-        CDEBUG(D_SEC, "%s@%p: create ctx %p(%u->%s)\n",
-               sec->ps_policy->sp_name, ctx->cc_sec,
-               ctx, ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec));
-        return 0;
+       CDEBUG(D_SEC, "%s@%p: create ctx %p(%u->%s)\n",
+              sec->ps_policy->sp_name, ctx->cc_sec,
+              ctx, ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec));
+       return 0;
 }
 
 /*
- * return:
- *  -1: the destroy has been taken care of by someone else
- *   0: proceed to destroy the ctx
- *   1: busy count dropped to 0, proceed to destroy ctx and sec
+ * return value:
+ *   1: the context has been taken care of by someone else
+ *   0: proceed to really destroy the context locally
  */
 int gss_cli_ctx_fini_common(struct ptlrpc_sec *sec,
                             struct ptlrpc_cli_ctx *ctx)
 {
-        struct gss_cli_ctx *gctx = ctx2gctx(ctx);
+       struct gss_cli_ctx *gctx = ctx2gctx(ctx);
 
-        LASSERT(ctx->cc_sec == sec);
-        LASSERT(atomic_read(&ctx->cc_refcount) == 0);
-        LASSERT(atomic_read(&sec->ps_busy) > 0);
+       LASSERT(atomic_read(&sec->ps_nctx) > 0);
+       LASSERT(atomic_read(&ctx->cc_refcount) == 0);
+       LASSERT(ctx->cc_sec == sec);
 
-        if (gctx->gc_mechctx) {
-                /* the final context fini rpc will use this ctx too, and it's
-                 * asynchronous which finished by request_out_callback(). so
-                 * we add refcount, whoever drop finally drop the refcount to
-                 * 0 should responsible for the rest of destroy. */
-                atomic_inc(&ctx->cc_refcount);
+       /*
+        * remove the UPTODATE flag of a reverse ctx so we won't send a fini
+        * rpc. this avoids the client side reverse svc ctx being mis-destroyed
+        * in various recovery scenarios. anyway the client can manage its
+        * reverse ctx well by associating it with its buddy ctx.
+        */
+       if (sec_is_reverse(sec))
+               ctx->cc_flags &= ~PTLRPC_CTX_UPTODATE;
 
-                gss_do_ctx_fini_rpc(gctx);
-                gss_cli_ctx_finalize(gctx);
+       if (gctx->gc_mechctx) {
+               /* the final context fini rpc will use this ctx too, and it's
+                * asynchronous, finished by request_out_callback(). so we add
+                * a refcount: whoever finally drops the refcount to 0 is
+                * responsible for the rest of the destroy. */
+               atomic_inc(&ctx->cc_refcount);
 
-                if (!atomic_dec_and_test(&ctx->cc_refcount))
-                        return -1;
-        }
+               gss_do_ctx_fini_rpc(gctx);
+               gss_cli_ctx_finalize(gctx);
 
-        if (sec_is_reverse(sec))
-                CDEBUG(D_SEC, "reverse sec %p: destroy ctx %p\n",
-                       ctx->cc_sec, ctx);
-        else
-                CWARN("%s@%p: destroy ctx %p(%u->%s)\n",
-                      sec->ps_policy->sp_name, ctx->cc_sec,
-                      ctx, ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec));
+               if (!atomic_dec_and_test(&ctx->cc_refcount))
+                       return 1;
+       }
 
-        if (atomic_dec_and_test(&sec->ps_busy)) {
-                LASSERT(atomic_read(&sec->ps_refcount) == 0);
-                return 1;
-        }
+       if (sec_is_reverse(sec))
+               CWARN("reverse sec %p: destroy ctx %p\n",
+                     ctx->cc_sec, ctx);
+       else
+               CWARN("%s@%p: destroy ctx %p(%u->%s)\n",
+                     sec->ps_policy->sp_name, ctx->cc_sec,
+                     ctx, ctx->cc_vcred.vc_uid, sec2target_str(ctx->cc_sec));
 
-        return 0;
+       return 0;
 }
 
 static
@@ -1167,9 +1256,9 @@ int gss_alloc_reqbuf_intg(struct ptlrpc_sec *sec,
                           struct ptlrpc_request *req,
                           int svc, int msgsize)
 {
-        struct sec_flavor_config *conf;
         int                       bufsize, txtsize;
-        int                       buflens[5], bufcnt = 2;
+        int                       bufcnt = 2;
+        __u32                     buflens[5];
         ENTRY;
 
         /*
@@ -1194,17 +1283,17 @@ int gss_alloc_reqbuf_intg(struct ptlrpc_sec *sec,
         if (svc == SPTLRPC_SVC_INTG)
                 txtsize += buflens[1];
 
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor)) {
+        if (req->rq_pack_udesc) {
                 buflens[bufcnt] = sptlrpc_current_user_desc_size();
                 if (svc == SPTLRPC_SVC_INTG)
                         txtsize += buflens[bufcnt];
                 bufcnt++;
         }
 
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
-                conf = &req->rq_import->imp_obd->u.cli.cl_sec_conf;
-                buflens[bufcnt] = bulk_sec_desc_size(conf->sfc_bulk_csum, 1,
-                                                     req->rq_bulk_read);
+        if (req->rq_pack_bulk) {
+                buflens[bufcnt] = gss_cli_bulk_payload(req->rq_cli_ctx,
+                                                       &req->rq_flvr,
+                                                       0, req->rq_bulk_read);
                 if (svc == SPTLRPC_SVC_INTG)
                         txtsize += buflens[bufcnt];
                 bufcnt++;
@@ -1220,7 +1309,7 @@ int gss_alloc_reqbuf_intg(struct ptlrpc_sec *sec,
         if (!req->rq_reqbuf) {
                 bufsize = size_roundup_power2(bufsize);
 
-                OBD_ALLOC(req->rq_reqbuf, bufsize);
+                OBD_ALLOC_LARGE(req->rq_reqbuf, bufsize);
                 if (!req->rq_reqbuf)
                         RETURN(-ENOMEM);
 
@@ -1232,13 +1321,13 @@ int gss_alloc_reqbuf_intg(struct ptlrpc_sec *sec,
         }
 
         lustre_init_msg_v2(req->rq_reqbuf, bufcnt, buflens, NULL);
-        req->rq_reqbuf->lm_secflvr = req->rq_sec_flavor;
+        req->rq_reqbuf->lm_secflvr = req->rq_flvr.sf_rpc;
 
         req->rq_reqmsg = lustre_msg_buf(req->rq_reqbuf, 1, msgsize);
         LASSERT(req->rq_reqmsg);
 
         /* pack user desc here, later we might leave current user's process */
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor))
+        if (req->rq_pack_udesc)
                 sptlrpc_pack_user_desc(req->rq_reqbuf, 2);
 
         RETURN(0);
@@ -1249,9 +1338,8 @@ int gss_alloc_reqbuf_priv(struct ptlrpc_sec *sec,
                           struct ptlrpc_request *req,
                           int msgsize)
 {
-        struct sec_flavor_config *conf;
-        int                       ibuflens[3], ibufcnt;
-        int                       buflens[3];
+        __u32                     ibuflens[3], wbuflens[2];
+        int                       ibufcnt;
         int                       clearsize, wiresize;
         ENTRY;
 
@@ -1263,31 +1351,27 @@ int gss_alloc_reqbuf_priv(struct ptlrpc_sec *sec,
          *  - user descriptor (optional)
          *  - bulk checksum (optional)
          */
-
         ibufcnt = 1;
         ibuflens[0] = msgsize;
 
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor))
+        if (req->rq_pack_udesc)
                 ibuflens[ibufcnt++] = sptlrpc_current_user_desc_size();
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
-                conf = &req->rq_import->imp_obd->u.cli.cl_sec_conf;
-                ibuflens[ibufcnt++] = bulk_sec_desc_size(conf->sfc_bulk_csum, 1,
-                                                         req->rq_bulk_read);
-        }
+        if (req->rq_pack_bulk)
+                ibuflens[ibufcnt++] = gss_cli_bulk_payload(req->rq_cli_ctx,
+                                                           &req->rq_flvr, 0,
+                                                           req->rq_bulk_read);
+
         clearsize = lustre_msg_size_v2(ibufcnt, ibuflens);
         /* to allow append padding during encryption */
         clearsize += GSS_MAX_CIPHER_BLOCK;
 
         /* Wrapper (wire) buffers
          *  - gss header
-         *  - signature of gss header
          *  - cipher text
          */
-
-        buflens[0] = PTLRPC_GSS_HEADER_SIZE;
-        buflens[1] = gss_cli_payload(req->rq_cli_ctx, buflens[0], 0);
-        buflens[2] = gss_cli_payload(req->rq_cli_ctx, clearsize, 1);
-        wiresize = lustre_msg_size_v2(3, buflens);
+        wbuflens[0] = PTLRPC_GSS_HEADER_SIZE;
+        wbuflens[1] = gss_cli_payload(req->rq_cli_ctx, clearsize, 1);
+        wiresize = lustre_msg_size_v2(2, wbuflens);
 
         if (req->rq_pool) {
                 /* rq_reqbuf is preallocated */
@@ -1312,7 +1396,7 @@ int gss_alloc_reqbuf_priv(struct ptlrpc_sec *sec,
         if (!req->rq_clrbuf) {
                 clearsize = size_roundup_power2(clearsize);
 
-                OBD_ALLOC(req->rq_clrbuf, clearsize);
+                OBD_ALLOC_LARGE(req->rq_clrbuf, clearsize);
                 if (!req->rq_clrbuf)
                         RETURN(-ENOMEM);
         }
@@ -1321,7 +1405,7 @@ int gss_alloc_reqbuf_priv(struct ptlrpc_sec *sec,
         lustre_init_msg_v2(req->rq_clrbuf, ibufcnt, ibuflens, NULL);
         req->rq_reqmsg = lustre_msg_buf(req->rq_clrbuf, 0, msgsize);
 
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor))
+        if (req->rq_pack_udesc)
                 sptlrpc_pack_user_desc(req->rq_clrbuf, 1);
 
         RETURN(0);
@@ -1335,9 +1419,9 @@ int gss_alloc_reqbuf(struct ptlrpc_sec *sec,
                      struct ptlrpc_request *req,
                      int msgsize)
 {
-        int     svc = SEC_FLAVOR_SVC(req->rq_sec_flavor);
+        int     svc = SPTLRPC_FLVR_SVC(req->rq_flvr.sf_rpc);
 
-        LASSERT(!SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor) ||
+        LASSERT(!req->rq_pack_bulk ||
                 (req->rq_bulk_read || req->rq_bulk_write));
 
         switch (svc) {
@@ -1348,7 +1432,7 @@ int gss_alloc_reqbuf(struct ptlrpc_sec *sec,
         case SPTLRPC_SVC_PRIV:
                 return gss_alloc_reqbuf_priv(sec, req, msgsize);
         default:
-                LASSERTF(0, "bad flavor %x\n", req->rq_sec_flavor);
+                LASSERTF(0, "bad rpc flavor %x\n", req->rq_flvr.sf_rpc);
                 return 0;
         }
 }
@@ -1360,7 +1444,7 @@ void gss_free_reqbuf(struct ptlrpc_sec *sec,
         ENTRY;
 
         LASSERT(!req->rq_pool || req->rq_reqbuf);
-        privacy = SEC_FLAVOR_SVC(req->rq_sec_flavor) == SPTLRPC_SVC_PRIV;
+        privacy = SPTLRPC_FLVR_SVC(req->rq_flvr.sf_rpc) == SPTLRPC_SVC_PRIV;
 
         if (!req->rq_clrbuf)
                 goto release_reqbuf;
@@ -1369,19 +1453,20 @@ void gss_free_reqbuf(struct ptlrpc_sec *sec,
         LASSERT(privacy);
         LASSERT(req->rq_clrbuf_len);
 
-        if (req->rq_pool &&
-            req->rq_clrbuf >= req->rq_reqbuf &&
-            (char *) req->rq_clrbuf <
+        if (req->rq_pool == NULL ||
+            req->rq_clrbuf < req->rq_reqbuf ||
+            (char *) req->rq_clrbuf >=
             (char *) req->rq_reqbuf + req->rq_reqbuf_len)
-                goto release_reqbuf;
+                OBD_FREE_LARGE(req->rq_clrbuf, req->rq_clrbuf_len);
 
-        OBD_FREE(req->rq_clrbuf, req->rq_clrbuf_len);
         req->rq_clrbuf = NULL;
         req->rq_clrbuf_len = 0;
 
 release_reqbuf:
         if (!req->rq_pool && req->rq_reqbuf) {
-                OBD_FREE(req->rq_reqbuf, req->rq_reqbuf_len);
+                LASSERT(req->rq_reqbuf_len);
+
+                OBD_FREE_LARGE(req->rq_reqbuf, req->rq_reqbuf_len);
                 req->rq_reqbuf = NULL;
                 req->rq_reqbuf_len = 0;
         }
@@ -1393,7 +1478,7 @@ static int do_alloc_repbuf(struct ptlrpc_request *req, int bufsize)
 {
         bufsize = size_roundup_power2(bufsize);
 
-        OBD_ALLOC(req->rq_repbuf, bufsize);
+        OBD_ALLOC_LARGE(req->rq_repbuf, bufsize);
         if (!req->rq_repbuf)
                 return -ENOMEM;
 
@@ -1406,9 +1491,10 @@ int gss_alloc_repbuf_intg(struct ptlrpc_sec *sec,
                           struct ptlrpc_request *req,
                           int svc, int msgsize)
 {
-        struct sec_flavor_config *conf;
-        int                       txtsize;
-        int                       buflens[4], bufcnt = 2;
+        int             txtsize;
+        __u32           buflens[4];
+        int             bufcnt = 2;
+        int             alloc_size;
 
         /*
          * on-wire data layout:
@@ -1431,10 +1517,10 @@ int gss_alloc_repbuf_intg(struct ptlrpc_sec *sec,
         if (svc == SPTLRPC_SVC_INTG)
                 txtsize += buflens[1];
 
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
-                conf = &req->rq_import->imp_obd->u.cli.cl_sec_conf;
-                buflens[bufcnt] = bulk_sec_desc_size(conf->sfc_bulk_csum, 0,
-                                                     req->rq_bulk_read);
+        if (req->rq_pack_bulk) {
+                buflens[bufcnt] = gss_cli_bulk_payload(req->rq_cli_ctx,
+                                                       &req->rq_flvr,
+                                                       1, req->rq_bulk_read);
                 if (svc == SPTLRPC_SVC_INTG)
                         txtsize += buflens[bufcnt];
                 bufcnt++;
@@ -1445,7 +1531,12 @@ int gss_alloc_repbuf_intg(struct ptlrpc_sec *sec,
         else if (svc != SPTLRPC_SVC_NULL)
                 buflens[bufcnt++] = gss_cli_payload(req->rq_cli_ctx, txtsize,0);
 
-        return do_alloc_repbuf(req, lustre_msg_size_v2(bufcnt, buflens));
+        alloc_size = lustre_msg_size_v2(bufcnt, buflens);
+
+        /* add space for early reply */
+        alloc_size += gss_at_reply_off_integ;
+
+        return do_alloc_repbuf(req, alloc_size);
 }
 
 static
@@ -1453,49 +1544,42 @@ int gss_alloc_repbuf_priv(struct ptlrpc_sec *sec,
                           struct ptlrpc_request *req,
                           int msgsize)
 {
-        struct sec_flavor_config *conf;
-        int                       txtsize;
-        int                       buflens[3], bufcnt;
-
-        /* Inner (clear) buffers
-         *  - lustre message
-         *  - bulk checksum (optional)
-         */
+        int             txtsize;
+        __u32           buflens[2];
+        int             bufcnt;
+        int             alloc_size;
 
+        /* inner buffers */
         bufcnt = 1;
         buflens[0] = msgsize;
 
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
-                conf = &req->rq_import->imp_obd->u.cli.cl_sec_conf;
-                buflens[bufcnt++] = bulk_sec_desc_size(
-                                                conf->sfc_bulk_csum, 0,
-                                                req->rq_bulk_read);
-        }
+        if (req->rq_pack_bulk)
+                buflens[bufcnt++] = gss_cli_bulk_payload(req->rq_cli_ctx,
+                                                         &req->rq_flvr,
+                                                         1, req->rq_bulk_read);
         txtsize = lustre_msg_size_v2(bufcnt, buflens);
         txtsize += GSS_MAX_CIPHER_BLOCK;
 
-        /* Wrapper (wire) buffers
-         *  - gss header
-         *  - signature of gss header
-         *  - cipher text
-         */
-
-        bufcnt = 3;
+        /* wrapper buffers */
+        bufcnt = 2;
         buflens[0] = PTLRPC_GSS_HEADER_SIZE;
-        buflens[1] = gss_cli_payload(req->rq_cli_ctx, buflens[0], 0);
-        buflens[2] = gss_cli_payload(req->rq_cli_ctx, txtsize, 1);
+        buflens[1] = gss_cli_payload(req->rq_cli_ctx, txtsize, 1);
+
+        alloc_size = lustre_msg_size_v2(bufcnt, buflens);
+        /* add space for early reply */
+        alloc_size += gss_at_reply_off_priv;
 
-        return do_alloc_repbuf(req, lustre_msg_size_v2(bufcnt, buflens));
+        return do_alloc_repbuf(req, alloc_size);
 }
 
 int gss_alloc_repbuf(struct ptlrpc_sec *sec,
                      struct ptlrpc_request *req,
                      int msgsize)
 {
-        int     svc = SEC_FLAVOR_SVC(req->rq_sec_flavor);
+        int     svc = SPTLRPC_FLVR_SVC(req->rq_flvr.sf_rpc);
         ENTRY;
 
-        LASSERT(!SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor) ||
+        LASSERT(!req->rq_pack_bulk ||
                 (req->rq_bulk_read || req->rq_bulk_write));
 
         switch (svc) {
@@ -1506,7 +1590,7 @@ int gss_alloc_repbuf(struct ptlrpc_sec *sec,
         case SPTLRPC_SVC_PRIV:
                 return gss_alloc_repbuf_priv(sec, req, msgsize);
         default:
-                LASSERTF(0, "bad flavor %x\n", req->rq_sec_flavor);
+                LASSERTF(0, "bad rpc flavor %x\n", req->rq_flvr.sf_rpc);
                 return 0;
         }
 }
@@ -1514,9 +1598,11 @@ int gss_alloc_repbuf(struct ptlrpc_sec *sec,
 void gss_free_repbuf(struct ptlrpc_sec *sec,
                      struct ptlrpc_request *req)
 {
-        OBD_FREE(req->rq_repbuf, req->rq_repbuf_len);
+        OBD_FREE_LARGE(req->rq_repbuf, req->rq_repbuf_len);
         req->rq_repbuf = NULL;
         req->rq_repbuf_len = 0;
+        req->rq_repdata = NULL;
+        req->rq_repdata_len = 0;
 }
 
 static int get_enlarged_msgsize(struct lustre_msg *msg,
@@ -1608,16 +1694,28 @@ int gss_enlarge_reqbuf_intg(struct ptlrpc_sec *sec,
         if (req->rq_reqbuf_len < newbuf_size) {
                 newbuf_size = size_roundup_power2(newbuf_size);
 
-                OBD_ALLOC(newbuf, newbuf_size);
+                OBD_ALLOC_LARGE(newbuf, newbuf_size);
                 if (newbuf == NULL)
                         RETURN(-ENOMEM);
 
+               /* Must lock this, so that the otherwise unprotected change of
+                * rq_reqmsg does not race with parallel threads traversing
+                * imp_replay_list. See LU-3333.
+                * This is a band-aid at best; we really need to deal with this
+                * in the request enlarging code, before the unpacking that is
+                * already there */
+               if (req->rq_import)
+                       spin_lock(&req->rq_import->imp_lock);
+
                 memcpy(newbuf, req->rq_reqbuf, req->rq_reqbuf_len);
 
-                OBD_FREE(req->rq_reqbuf, req->rq_reqbuf_len);
+                OBD_FREE_LARGE(req->rq_reqbuf, req->rq_reqbuf_len);
                 req->rq_reqbuf = newbuf;
                 req->rq_reqbuf_len = newbuf_size;
                 req->rq_reqmsg = lustre_msg_buf(req->rq_reqbuf, 1, 0);
+
+               if (req->rq_import)
+                       spin_unlock(&req->rq_import->imp_lock);
         }
 
         /* do enlargement, from wrapper to embedded, from end to begin */
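
The spin_lock/spin_unlock pair added in this hunk is the LU-3333 band-aid
described in the comment above; condensed into one place, the pattern looks
like the sketch below (illustrative only, the real code keeps it inline):

/* Sketch of the LU-3333 band-aid: any code that frees and reassigns
 * rq_reqbuf/rq_reqmsg must do so under imp_lock, because threads walking
 * imp_replay_list may dereference rq_reqmsg concurrently.
 */
static void example_swap_reqbuf_locked(struct ptlrpc_request *req,
                                       struct lustre_msg *newbuf,
                                       int newbuf_size)
{
        if (req->rq_import)
                spin_lock(&req->rq_import->imp_lock);

        memcpy(newbuf, req->rq_reqbuf, req->rq_reqbuf_len);
        OBD_FREE_LARGE(req->rq_reqbuf, req->rq_reqbuf_len);

        req->rq_reqbuf = newbuf;
        req->rq_reqbuf_len = newbuf_size;
        req->rq_reqmsg = lustre_msg_buf(req->rq_reqbuf, 1, 0);

        if (req->rq_import)
                spin_unlock(&req->rq_import->imp_lock);
}
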
@@ -1640,7 +1738,7 @@ int gss_enlarge_reqbuf_priv(struct ptlrpc_sec *sec,
 {
         struct lustre_msg      *newclrbuf;
         int                     newmsg_size, newclrbuf_size, newcipbuf_size;
-        int                     buflens[3];
+        __u32                   buflens[3];
 
         /*
          * embedded msg is at seg 0 of clear buffer;
@@ -1678,6 +1776,8 @@ int gss_enlarge_reqbuf_priv(struct ptlrpc_sec *sec,
                 if (newclrbuf_size + newcipbuf_size <= req->rq_reqbuf_len) {
                         void *src, *dst;
 
+                       if (req->rq_import)
+                               spin_lock(&req->rq_import->imp_lock);
                         /* move clear text backward. */
                         src = req->rq_clrbuf;
                         dst = (char *) req->rq_reqbuf + newcipbuf_size;
@@ -1687,6 +1787,9 @@ int gss_enlarge_reqbuf_priv(struct ptlrpc_sec *sec,
                         req->rq_clrbuf = (struct lustre_msg *) dst;
                         req->rq_clrbuf_len = newclrbuf_size;
                         req->rq_reqmsg = lustre_msg_buf(req->rq_clrbuf, 0, 0);
+
+                       if (req->rq_import)
+                               spin_unlock(&req->rq_import->imp_lock);
                 } else {
                         /* sadly we have to split out the clear buffer */
                         LASSERT(req->rq_reqbuf_len >= newcipbuf_size);
@@ -1697,22 +1800,34 @@ int gss_enlarge_reqbuf_priv(struct ptlrpc_sec *sec,
         if (req->rq_clrbuf_len < newclrbuf_size) {
                 newclrbuf_size = size_roundup_power2(newclrbuf_size);
 
-                OBD_ALLOC(newclrbuf, newclrbuf_size);
+                OBD_ALLOC_LARGE(newclrbuf, newclrbuf_size);
                 if (newclrbuf == NULL)
                         RETURN(-ENOMEM);
 
+               /* Must lock this, so that the otherwise unprotected change of
+                * rq_reqmsg does not race with parallel threads traversing
+                * imp_replay_list. See LU-3333.
+                * This is a band-aid at best; we really need to deal with this
+                * in the request enlarging code, before the unpacking that is
+                * already there */
+               if (req->rq_import)
+                       spin_lock(&req->rq_import->imp_lock);
+
                 memcpy(newclrbuf, req->rq_clrbuf, req->rq_clrbuf_len);
 
                 if (req->rq_reqbuf == NULL ||
                     req->rq_clrbuf < req->rq_reqbuf ||
                     (char *) req->rq_clrbuf >=
                     (char *) req->rq_reqbuf + req->rq_reqbuf_len) {
-                        OBD_FREE(req->rq_clrbuf, req->rq_clrbuf_len);
+                        OBD_FREE_LARGE(req->rq_clrbuf, req->rq_clrbuf_len);
                 }
 
                 req->rq_clrbuf = newclrbuf;
                 req->rq_clrbuf_len = newclrbuf_size;
                 req->rq_reqmsg = lustre_msg_buf(req->rq_clrbuf, 0, 0);
+
+               if (req->rq_import)
+                       spin_unlock(&req->rq_import->imp_lock);
         }
 
         _sptlrpc_enlarge_msg_inplace(req->rq_clrbuf, 0, newmsg_size);
@@ -1726,7 +1841,7 @@ int gss_enlarge_reqbuf(struct ptlrpc_sec *sec,
                        struct ptlrpc_request *req,
                        int segment, int newsize)
 {
-        int     svc = SEC_FLAVOR_SVC(req->rq_sec_flavor);
+        int     svc = SPTLRPC_FLVR_SVC(req->rq_flvr.sf_rpc);
 
         LASSERT(!req->rq_ctx_init && !req->rq_ctx_fini);
 
@@ -1738,7 +1853,7 @@ int gss_enlarge_reqbuf(struct ptlrpc_sec *sec,
         case SPTLRPC_SVC_PRIV:
                 return gss_enlarge_reqbuf_priv(sec, req, segment, newsize);
         default:
-                LASSERTF(0, "bad flavor %x\n", req->rq_sec_flavor);
+                LASSERTF(0, "bad rpc flavor %x\n", req->rq_flvr.sf_rpc);
                 return 0;
         }
 }
@@ -1783,41 +1898,59 @@ void gss_svc_reqctx_free(struct gss_svc_reqctx *grctx)
 static inline
 void gss_svc_reqctx_addref(struct gss_svc_reqctx *grctx)
 {
-        LASSERT(atomic_read(&grctx->src_base.sc_refcount) > 0);
-        atomic_inc(&grctx->src_base.sc_refcount);
+       LASSERT(atomic_read(&grctx->src_base.sc_refcount) > 0);
+       atomic_inc(&grctx->src_base.sc_refcount);
 }
 
 static inline
 void gss_svc_reqctx_decref(struct gss_svc_reqctx *grctx)
 {
-        LASSERT(atomic_read(&grctx->src_base.sc_refcount) > 0);
+       LASSERT(atomic_read(&grctx->src_base.sc_refcount) > 0);
 
-        if (atomic_dec_and_test(&grctx->src_base.sc_refcount))
-                gss_svc_reqctx_free(grctx);
+       if (atomic_dec_and_test(&grctx->src_base.sc_refcount))
+               gss_svc_reqctx_free(grctx);
 }
 
 static
 int gss_svc_sign(struct ptlrpc_request *req,
                  struct ptlrpc_reply_state *rs,
                  struct gss_svc_reqctx *grctx,
-                 int svc)
+                 __u32 svc)
 {
+        __u32   flags = 0;
         int     rc;
         ENTRY;
 
         LASSERT(rs->rs_msg == lustre_msg_buf(rs->rs_repbuf, 1, 0));
 
-        /* embedded lustre_msg might have been shrinked */
+        /* embedded lustre_msg might have been shrunk */
         if (req->rq_replen != rs->rs_repbuf->lm_buflens[1])
                 lustre_shrink_msg(rs->rs_repbuf, 1, req->rq_replen, 1);
 
+        if (req->rq_pack_bulk)
+                flags |= LUSTRE_GSS_PACK_BULK;
+
         rc = gss_sign_msg(rs->rs_repbuf, grctx->src_ctx->gsc_mechctx,
-                          PTLRPC_GSS_PROC_DATA, grctx->src_wirectx.gw_seq,
-                          svc, NULL);
+                          LUSTRE_SP_ANY, flags, PTLRPC_GSS_PROC_DATA,
+                          grctx->src_wirectx.gw_seq, svc, NULL);
         if (rc < 0)
                 RETURN(rc);
 
         rs->rs_repdata_len = rc;
+
+        if (likely(req->rq_packed_final)) {
+                if (lustre_msghdr_get_flags(req->rq_reqmsg) & MSGHDR_AT_SUPPORT)
+                        req->rq_reply_off = gss_at_reply_off_integ;
+                else
+                        req->rq_reply_off = 0;
+        } else {
+                if (svc == SPTLRPC_SVC_NULL)
+                        rs->rs_repbuf->lm_cksum = crc32_le(!(__u32) 0,
+                                        lustre_msg_buf(rs->rs_repbuf, 1, 0),
+                                        lustre_msg_buflen(rs->rs_repbuf, 1));
+                req->rq_reply_off = 0;
+        }
+
         RETURN(0);
 }
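
For the non-final (early) reply case above with SPTLRPC_SVC_NULL, the reply
carries no signature, so the server stores a crc32 of the embedded message in
lm_cksum. A minimal sketch of recomputing that checksum on the receiving side
(illustrative only; the actual client-side verification is assumed to live in
the cli ctx code, not in this file):

/* Sketch: recompute the crc32 that gss_svc_sign() stores in lm_cksum for an
 * unsigned early reply. The checksum covers segment 1 of the reply buffer
 * and uses the same seed value as above.
 */
static int example_check_null_cksum(struct lustre_msg *repbuf)
{
        __u32 cksum;

        cksum = crc32_le(!(__u32) 0,
                         lustre_msg_buf(repbuf, 1, 0),
                         lustre_msg_buflen(repbuf, 1));

        return cksum == repbuf->lm_cksum ? 0 : -EINVAL;
}
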
 
@@ -1836,7 +1969,7 @@ int gss_pack_err_notify(struct ptlrpc_request *req, __u32 major, __u32 minor)
         grctx->src_err_notify = 1;
         grctx->src_reserve_len = 0;
 
-        rc = lustre_pack_reply_v2(req, 1, &replen, NULL);
+        rc = lustre_pack_reply_v2(req, 1, &replen, NULL, 0);
         if (rc) {
                 CERROR("could not pack reply, err %d\n", rc);
                 RETURN(rc);
@@ -1872,7 +2005,7 @@ int gss_svc_handle_init(struct ptlrpc_request *req,
         rawobj_t                   uuid_obj, rvs_hdl, in_token;
         __u32                      lustre_svc;
         __u32                     *secdata, seclen;
-        int                        rc;
+        int                        swabbed, rc;
         ENTRY;
 
         CDEBUG(D_SEC, "processing gss init(%d) request from %s\n", gw->gw_proc,
@@ -1880,6 +2013,11 @@ int gss_svc_handle_init(struct ptlrpc_request *req,
 
         req->rq_ctx_init = 1;
 
+        if (gw->gw_flags & LUSTRE_GSS_PACK_BULK) {
+                CERROR("unexpected bulk flag\n");
+                RETURN(SECSVC_DROP);
+        }
+
         if (gw->gw_proc == PTLRPC_GSS_PROC_INIT && gw->gw_handle.len != 0) {
                 CERROR("proc %u: invalid handle length %u\n",
                        gw->gw_proc, gw->gw_handle.len);
@@ -1891,6 +2029,8 @@ int gss_svc_handle_init(struct ptlrpc_request *req,
                 RETURN(SECSVC_DROP);
         }
 
+        swabbed = ptlrpc_req_need_swab(req);
+
         /* ctx initiate payload is in last segment */
         secdata = lustre_msg_buf(reqbuf, reqbuf->lm_bufcount - 1, 0);
         seclen = reqbuf->lm_buflens[reqbuf->lm_bufcount - 1];
@@ -1915,7 +2055,7 @@ int gss_svc_handle_init(struct ptlrpc_request *req,
         uuid = (struct obd_uuid *) uuid_obj.data;
         target = class_uuid2obd(uuid);
         if (!target || target->obd_stopping || !target->obd_set_up) {
-                CERROR("target '%s' is not available for context init (%s)",
+                CERROR("target '%s' is not available for context init (%s)\n",
                        uuid->uuid, target == NULL ? "no target" :
                        (target->obd_stopping ? "stopping" : "not set up"));
                 RETURN(SECSVC_DROP);
@@ -1938,23 +2078,28 @@ int gss_svc_handle_init(struct ptlrpc_request *req,
         if (rc != SECSVC_OK)
                 RETURN(rc);
 
-        if (grctx->src_ctx->gsc_usr_mds || grctx->src_ctx->gsc_usr_root)
-                CWARN("user from %s authenticated as %s\n",
-                      libcfs_nid2str(req->rq_peer.nid),
-                      grctx->src_ctx->gsc_usr_mds ? "mds" : "root");
+        if (grctx->src_ctx->gsc_usr_mds || grctx->src_ctx->gsc_usr_oss ||
+            grctx->src_ctx->gsc_usr_root)
+                CWARN("create svc ctx %p: user from %s authenticated as %s\n",
+                      grctx->src_ctx, libcfs_nid2str(req->rq_peer.nid),
+                      grctx->src_ctx->gsc_usr_mds ? "mds" :
+                        (grctx->src_ctx->gsc_usr_oss ? "oss" : "root"));
         else
-                CWARN("accept user %u from %s\n", grctx->src_ctx->gsc_uid,
+                CWARN("create svc ctx %p: accept user %u from %s\n",
+                      grctx->src_ctx, grctx->src_ctx->gsc_uid,
                       libcfs_nid2str(req->rq_peer.nid));
 
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor)) {
+        if (gw->gw_flags & LUSTRE_GSS_PACK_USER) {
                 if (reqbuf->lm_bufcount < 4) {
                         CERROR("missing user descriptor\n");
                         RETURN(SECSVC_DROP);
                 }
-                if (sptlrpc_unpack_user_desc(reqbuf, 2)) {
+                if (sptlrpc_unpack_user_desc(reqbuf, 2, swabbed)) {
                         CERROR("Mal-formed user descriptor\n");
                         RETURN(SECSVC_DROP);
                 }
+
+                req->rq_pack_udesc = 1;
                 req->rq_user_desc = lustre_msg_buf(reqbuf, 2, 0);
         }
 
@@ -1976,6 +2121,7 @@ int gss_svc_verify_request(struct ptlrpc_request *req,
         struct gss_svc_ctx *gctx = grctx->src_ctx;
         struct lustre_msg  *msg = req->rq_reqbuf;
         int                 offset = 2;
+        int                 swabbed;
         ENTRY;
 
         *major = GSS_S_COMPLETE;
@@ -1995,42 +2141,49 @@ int gss_svc_verify_request(struct ptlrpc_request *req,
         }
 
         *major = gss_verify_msg(msg, gctx->gsc_mechctx, gw->gw_svc);
-        if (*major != GSS_S_COMPLETE)
+        if (*major != GSS_S_COMPLETE) {
+                CERROR("failed to verify request: %x\n", *major);
                 RETURN(-EACCES);
+        }
 
-        if (gss_check_seq_num(&gctx->gsc_seqdata, gw->gw_seq, 1)) {
+        if (gctx->gsc_reverse == 0 &&
+            gss_check_seq_num(&gctx->gsc_seqdata, gw->gw_seq, 1)) {
                 CERROR("phase 1+: discard replayed req: seq %u\n", gw->gw_seq);
                 *major = GSS_S_DUPLICATE_TOKEN;
                 RETURN(-EACCES);
         }
 
 verified:
+        swabbed = ptlrpc_req_need_swab(req);
+
         /* user descriptor */
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor)) {
+        if (gw->gw_flags & LUSTRE_GSS_PACK_USER) {
                 if (msg->lm_bufcount < (offset + 1)) {
                         CERROR("no user desc included\n");
                         RETURN(-EINVAL);
                 }
 
-                if (sptlrpc_unpack_user_desc(msg, offset)) {
+                if (sptlrpc_unpack_user_desc(msg, offset, swabbed)) {
                         CERROR("Mal-formed user descriptor\n");
                         RETURN(-EINVAL);
                 }
 
+                req->rq_pack_udesc = 1;
                 req->rq_user_desc = lustre_msg_buf(msg, offset, 0);
                 offset++;
         }
 
-        /* check bulk cksum data */
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
+        /* check bulk_sec_desc data */
+        if (gw->gw_flags & LUSTRE_GSS_PACK_BULK) {
                 if (msg->lm_bufcount < (offset + 1)) {
-                        CERROR("no bulk checksum included\n");
+                        CERROR("missing bulk sec descriptor\n");
                         RETURN(-EINVAL);
                 }
 
-                if (bulk_sec_desc_unpack(msg, offset))
+                if (bulk_sec_desc_unpack(msg, offset, swabbed))
                         RETURN(-EINVAL);
 
+                req->rq_pack_bulk = 1;
                 grctx->src_reqbsd = lustre_msg_buf(msg, offset, 0);
                 grctx->src_reqbsd_size = lustre_msg_buflen(msg, offset);
         }
@@ -2048,7 +2201,7 @@ int gss_svc_unseal_request(struct ptlrpc_request *req,
 {
         struct gss_svc_ctx *gctx = grctx->src_ctx;
         struct lustre_msg  *msg = req->rq_reqbuf;
-        int                 msglen, offset = 1;
+        int                 swabbed, msglen, offset = 1;
         ENTRY;
 
         if (gss_check_seq_num(&gctx->gsc_seqdata, gw->gw_seq, 0)) {
@@ -2059,8 +2212,10 @@ int gss_svc_unseal_request(struct ptlrpc_request *req,
 
         *major = gss_unseal_msg(gctx->gsc_mechctx, msg,
                                &msglen, req->rq_reqdata_len);
-        if (*major != GSS_S_COMPLETE)
+        if (*major != GSS_S_COMPLETE) {
+                CERROR("failed to unwrap request: %x\n", *major);
                 RETURN(-EACCES);
+        }
 
         if (gss_check_seq_num(&gctx->gsc_seqdata, gw->gw_seq, 1)) {
                 CERROR("phase 1+: discard replayed req: seq %u\n", gw->gw_seq);
@@ -2068,7 +2223,8 @@ int gss_svc_unseal_request(struct ptlrpc_request *req,
                 RETURN(-EACCES);
         }
 
-        if (lustre_unpack_msg(msg, msglen)) {
+        swabbed = __lustre_unpack_msg(msg, msglen);
+        if (swabbed < 0) {
                 CERROR("Failed to unpack after decryption\n");
                 RETURN(-EINVAL);
         }
@@ -2079,30 +2235,32 @@ int gss_svc_unseal_request(struct ptlrpc_request *req,
                 RETURN(-EINVAL);
         }
 
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor)) {
+        if (gw->gw_flags & LUSTRE_GSS_PACK_USER) {
                 if (msg->lm_bufcount < offset + 1) {
                         CERROR("no user descriptor included\n");
                         RETURN(-EINVAL);
                 }
 
-                if (sptlrpc_unpack_user_desc(msg, offset)) {
+                if (sptlrpc_unpack_user_desc(msg, offset, swabbed)) {
                         CERROR("Mal-formed user descriptor\n");
                         RETURN(-EINVAL);
                 }
 
+                req->rq_pack_udesc = 1;
                 req->rq_user_desc = lustre_msg_buf(msg, offset, 0);
                 offset++;
         }
 
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
+        if (gw->gw_flags & LUSTRE_GSS_PACK_BULK) {
                 if (msg->lm_bufcount < offset + 1) {
                         CERROR("no bulk checksum included\n");
                         RETURN(-EINVAL);
                 }
 
-                if (bulk_sec_desc_unpack(msg, offset))
+                if (bulk_sec_desc_unpack(msg, offset, swabbed))
                         RETURN(-EINVAL);
 
+                req->rq_pack_bulk = 1;
                 grctx->src_reqbsd = lustre_msg_buf(msg, offset, 0);
                 grctx->src_reqbsd_size = lustre_msg_buflen(msg, offset);
         }
@@ -2144,9 +2302,10 @@ int gss_svc_handle_data(struct ptlrpc_request *req,
         if (rc == 0)
                 RETURN(SECSVC_OK);
 
-        CERROR("svc %u failed: major 0x%08x: ctx %p(%u->%s)\n",
-               gw->gw_svc, major, grctx->src_ctx, grctx->src_ctx->gsc_uid,
-               libcfs_nid2str(req->rq_peer.nid));
+        CERROR("svc %u failed: major 0x%08x: req xid "LPU64" ctx %p idx "
+               LPX64"(%u->%s)\n", gw->gw_svc, major, req->rq_xid,
+               grctx->src_ctx, gss_handle_to_u64(&gw->gw_handle),
+               grctx->src_ctx->gsc_uid, libcfs_nid2str(req->rq_peer.nid));
 error:
         /* we only notify client in case of NO_CONTEXT/BAD_SIG, which
          * might happen after server reboot, to allow recovery. */
@@ -2170,7 +2329,7 @@ int gss_svc_handle_destroy(struct ptlrpc_request *req,
 
         grctx->src_ctx = gss_svc_upcall_get_ctx(req, gw);
         if (!grctx->src_ctx) {
-                CWARN("invalid gss context handle for destroy.\n");
+                CDEBUG(D_SEC, "invalid gss context handle for destroy.\n");
                 RETURN(SECSVC_DROP);
         }
 
@@ -2182,20 +2341,24 @@ int gss_svc_handle_destroy(struct ptlrpc_request *req,
         if (gss_svc_verify_request(req, grctx, gw, &major))
                 RETURN(SECSVC_DROP);
 
-        CWARN("destroy svc ctx %p(%u->%s)\n", grctx->src_ctx,
-               grctx->src_ctx->gsc_uid, libcfs_nid2str(req->rq_peer.nid));
+        CWARN("destroy svc ctx %p idx "LPX64" (%u->%s)\n",
+              grctx->src_ctx, gss_handle_to_u64(&gw->gw_handle),
+              grctx->src_ctx->gsc_uid, libcfs_nid2str(req->rq_peer.nid));
 
         gss_svc_upcall_destroy_ctx(grctx->src_ctx);
 
-        if (SEC_FLAVOR_HAS_USER(req->rq_sec_flavor)) {
+        if (gw->gw_flags & LUSTRE_GSS_PACK_USER) {
                 if (req->rq_reqbuf->lm_bufcount < 4) {
                         CERROR("missing user descriptor, ignore it\n");
                         RETURN(SECSVC_OK);
                 }
-                if (sptlrpc_unpack_user_desc(req->rq_reqbuf, 2)) {
+                if (sptlrpc_unpack_user_desc(req->rq_reqbuf, 2,
+                                             ptlrpc_req_need_swab(req))) {
                         CERROR("Mal-formed user descriptor, ignore it\n");
                         RETURN(SECSVC_OK);
                 }
+
+                req->rq_pack_udesc = 1;
                 req->rq_user_desc = lustre_msg_buf(req->rq_reqbuf, 2, 0);
         }
 
@@ -2207,7 +2370,7 @@ int gss_svc_accept(struct ptlrpc_sec_policy *policy, struct ptlrpc_request *req)
         struct gss_header      *ghdr;
         struct gss_svc_reqctx  *grctx;
         struct gss_wire_ctx    *gw;
-        int                     rc;
+        int                     swabbed, rc;
         ENTRY;
 
         LASSERT(req->rq_reqbuf);
@@ -2218,7 +2381,9 @@ int gss_svc_accept(struct ptlrpc_sec_policy *policy, struct ptlrpc_request *req)
                 RETURN(SECSVC_DROP);
         }
 
-        ghdr = gss_swab_header(req->rq_reqbuf, 0);
+        swabbed = ptlrpc_req_need_swab(req);
+
+        ghdr = gss_swab_header(req->rq_reqbuf, 0, swabbed);
         if (ghdr == NULL) {
                 CERROR("can't decode gss header\n");
                 RETURN(SECSVC_DROP);
@@ -2231,25 +2396,27 @@ int gss_svc_accept(struct ptlrpc_sec_policy *policy, struct ptlrpc_request *req)
                 RETURN(SECSVC_DROP);
         }
 
+        req->rq_sp_from = ghdr->gh_sp;
+
         /* alloc grctx data */
         OBD_ALLOC_PTR(grctx);
-        if (!grctx) {
-                CERROR("fail to alloc svc reqctx\n");
+        if (!grctx)
                 RETURN(SECSVC_DROP);
-        }
-        grctx->src_base.sc_policy = sptlrpc_policy_get(policy);
-        atomic_set(&grctx->src_base.sc_refcount, 1);
-        req->rq_svc_ctx = &grctx->src_base;
-        gw = &grctx->src_wirectx;
+
+       grctx->src_base.sc_policy = sptlrpc_policy_get(policy);
+       atomic_set(&grctx->src_base.sc_refcount, 1);
+       req->rq_svc_ctx = &grctx->src_base;
+       gw = &grctx->src_wirectx;
 
         /* save wire context */
+        gw->gw_flags = ghdr->gh_flags;
         gw->gw_proc = ghdr->gh_proc;
         gw->gw_seq = ghdr->gh_seq;
         gw->gw_svc = ghdr->gh_svc;
         rawobj_from_netobj(&gw->gw_handle, &ghdr->gh_handle);
 
         /* keep original wire header which subject to checksum verification */
-        if (lustre_msg_swabbed(req->rq_reqbuf))
+        if (swabbed)
                 gss_header_swabber(ghdr);
 
         switch(ghdr->gh_proc) {
@@ -2276,6 +2443,7 @@ int gss_svc_accept(struct ptlrpc_sec_policy *policy, struct ptlrpc_request *req)
                 req->rq_auth_gss = 1;
                 req->rq_auth_remote = grctx->src_ctx->gsc_remote;
                 req->rq_auth_usr_mdt = grctx->src_ctx->gsc_usr_mds;
+                req->rq_auth_usr_ost = grctx->src_ctx->gsc_usr_oss;
                 req->rq_auth_usr_root = grctx->src_ctx->gsc_usr_root;
                 req->rq_auth_uid = grctx->src_ctx->gsc_uid;
                 req->rq_auth_mapped_uid = grctx->src_ctx->gsc_mapped_uid;
@@ -2311,62 +2479,91 @@ void gss_svc_invalidate_ctx(struct ptlrpc_svc_ctx *svc_ctx)
 }
 
 static inline
-int gss_svc_payload(struct gss_svc_reqctx *grctx, int msgsize, int privacy)
+int gss_svc_payload(struct gss_svc_reqctx *grctx, int early,
+                    int msgsize, int privacy)
 {
-        if (gss_svc_reqctx_is_special(grctx))
+        /* we should treat an early reply normally, but it actually shares
+         * the same ctx with the original request, so in this case we should
+         * ignore the special ctx's special flags */
+        if (early == 0 && gss_svc_reqctx_is_special(grctx))
                 return grctx->src_reserve_len;
 
-        return gss_estimate_payload(NULL, msgsize, privacy);
+        return gss_mech_payload(NULL, msgsize, privacy);
+}
+
+static int gss_svc_bulk_payload(struct gss_svc_ctx *gctx,
+                                struct sptlrpc_flavor *flvr,
+                                int read)
+{
+        int     payload = sizeof(struct ptlrpc_bulk_sec_desc);
+
+        if (read) {
+                switch (SPTLRPC_FLVR_BULK_SVC(flvr->sf_rpc)) {
+                case SPTLRPC_BULK_SVC_NULL:
+                        break;
+                case SPTLRPC_BULK_SVC_INTG:
+                        payload += gss_mech_payload(NULL, 0, 0);
+                        break;
+                case SPTLRPC_BULK_SVC_PRIV:
+                        payload += gss_mech_payload(NULL, 0, 1);
+                        break;
+                case SPTLRPC_BULK_SVC_AUTH:
+                default:
+                        LBUG();
+                }
+        }
+
+        return payload;
 }
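
The helper above yields three possible sizes for a bulk read, depending on the
bulk service level in the flavor; the small sketch below just spells them out
with the same helpers (illustrative only, not part of the patch):

/* Sketch: reply-side bulk sec descriptor sizes for a bulk read. For a bulk
 * write only the fixed descriptor is needed.
 */
static void example_bulk_read_bsd_sizes(void)
{
        __u32 bsd_null = sizeof(struct ptlrpc_bulk_sec_desc);     /* BULK_SVC_NULL */
        __u32 bsd_intg = bsd_null + gss_mech_payload(NULL, 0, 0); /* plus MIC */
        __u32 bsd_priv = bsd_null + gss_mech_payload(NULL, 0, 1); /* plus priv token */

        CDEBUG(D_SEC, "bulk read bsd sizes: null %u intg %u priv %u\n",
               bsd_null, bsd_intg, bsd_priv);
}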
 
 int gss_svc_alloc_rs(struct ptlrpc_request *req, int msglen)
 {
         struct gss_svc_reqctx       *grctx;
         struct ptlrpc_reply_state   *rs;
-        int                          privacy, svc, bsd_off = 0;
-        int                          ibuflens[2], ibufcnt = 0;
-        int                          buflens[4], bufcnt;
+        int                          early, privacy, svc, bsd_off = 0;
+        __u32                        ibuflens[2], buflens[4];
+        int                          ibufcnt = 0, bufcnt;
         int                          txtsize, wmsg_size, rs_size;
         ENTRY;
 
         LASSERT(msglen % 8 == 0);
 
-        if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor) &&
-            !req->rq_bulk_read && !req->rq_bulk_write) {
+        if (req->rq_pack_bulk && !req->rq_bulk_read && !req->rq_bulk_write) {
                 CERROR("client request bulk sec on non-bulk rpc\n");
                 RETURN(-EPROTO);
         }
 
-        svc = SEC_FLAVOR_SVC(req->rq_sec_flavor);
+        svc = SPTLRPC_FLVR_SVC(req->rq_flvr.sf_rpc);
+        early = (req->rq_packed_final == 0);
 
         grctx = gss_svc_ctx2reqctx(req->rq_svc_ctx);
-        if (gss_svc_reqctx_is_special(grctx))
+        if (!early && gss_svc_reqctx_is_special(grctx))
                 privacy = 0;
         else
                 privacy = (svc == SPTLRPC_SVC_PRIV);
 
         if (privacy) {
-                /* Inner buffer */
+                /* inner clear buffers */
                 ibufcnt = 1;
                 ibuflens[0] = msglen;
 
-                if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
+                if (req->rq_pack_bulk) {
                         LASSERT(grctx->src_reqbsd);
 
                         bsd_off = ibufcnt;
-                        ibuflens[ibufcnt++] = bulk_sec_desc_size(
-                                                grctx->src_reqbsd->bsd_csum_alg,
-                                                0, req->rq_bulk_read);
+                        ibuflens[ibufcnt++] = gss_svc_bulk_payload(
+                                                        grctx->src_ctx,
+                                                        &req->rq_flvr,
+                                                        req->rq_bulk_read);
                 }
 
                 txtsize = lustre_msg_size_v2(ibufcnt, ibuflens);
                 txtsize += GSS_MAX_CIPHER_BLOCK;
 
                 /* wrapper buffer */
-                bufcnt = 3;
+                bufcnt = 2;
                 buflens[0] = PTLRPC_GSS_HEADER_SIZE;
-                buflens[1] = gss_svc_payload(grctx, buflens[0], 0);
-                buflens[2] = gss_svc_payload(grctx, txtsize, 1);
+                buflens[1] = gss_svc_payload(grctx, early, txtsize, 1);
         } else {
                 bufcnt = 2;
                 buflens[0] = PTLRPC_GSS_HEADER_SIZE;
@@ -2376,21 +2573,23 @@ int gss_svc_alloc_rs(struct ptlrpc_request *req, int msglen)
                 if (svc == SPTLRPC_SVC_INTG)
                         txtsize += buflens[1];
 
-                if (SEC_FLAVOR_HAS_BULK(req->rq_sec_flavor)) {
+                if (req->rq_pack_bulk) {
                         LASSERT(grctx->src_reqbsd);
 
                         bsd_off = bufcnt;
-                        buflens[bufcnt] = bulk_sec_desc_size(
-                                                grctx->src_reqbsd->bsd_csum_alg,
-                                                0, req->rq_bulk_read);
+                        buflens[bufcnt] = gss_svc_bulk_payload(
+                                                        grctx->src_ctx,
+                                                        &req->rq_flvr,
+                                                        req->rq_bulk_read);
                         if (svc == SPTLRPC_SVC_INTG)
                                 txtsize += buflens[bufcnt];
                         bufcnt++;
                 }
 
-                if (gss_svc_reqctx_is_special(grctx) ||
+                if ((!early && gss_svc_reqctx_is_special(grctx)) ||
                     svc != SPTLRPC_SVC_NULL)
-                        buflens[bufcnt++] = gss_svc_payload(grctx, txtsize, 0);
+                        buflens[bufcnt++] = gss_svc_payload(grctx, early,
+                                                            txtsize, 0);
         }
 
         wmsg_size = lustre_msg_size_v2(bufcnt, buflens);
@@ -2402,7 +2601,7 @@ int gss_svc_alloc_rs(struct ptlrpc_request *req, int msglen)
                 /* pre-allocated */
                 LASSERT(rs->rs_size >= rs_size);
         } else {
-                OBD_ALLOC(rs, rs_size);
+                OBD_ALLOC_LARGE(rs, rs_size);
                 if (rs == NULL)
                         RETURN(-ENOMEM);
 
@@ -2418,7 +2617,7 @@ int gss_svc_alloc_rs(struct ptlrpc_request *req, int msglen)
                 rs->rs_msg = lustre_msg_buf(rs->rs_repbuf, 0, msglen);
         } else {
                 lustre_init_msg_v2(rs->rs_repbuf, bufcnt, buflens, NULL);
-                rs->rs_repbuf->lm_secflvr = req->rq_sec_flavor;
+                rs->rs_repbuf->lm_secflvr = req->rq_flvr.sf_rpc;
 
                 rs->rs_msg = lustre_msg_buf(rs->rs_repbuf, 1, 0);
         }
@@ -2437,91 +2636,92 @@ int gss_svc_alloc_rs(struct ptlrpc_request *req, int msglen)
         RETURN(0);
 }
 
-static
-int gss_svc_seal(struct ptlrpc_request *req,
-                 struct ptlrpc_reply_state *rs,
-                 struct gss_svc_reqctx *grctx)
+static int gss_svc_seal(struct ptlrpc_request *req,
+                        struct ptlrpc_reply_state *rs,
+                        struct gss_svc_reqctx *grctx)
 {
         struct gss_svc_ctx      *gctx = grctx->src_ctx;
-        rawobj_t                 msgobj, cipher_obj, micobj;
+        rawobj_t                 hdrobj, msgobj, token;
         struct gss_header       *ghdr;
-        __u8                    *cipher_buf;
-        int                      cipher_buflen, buflens[3];
+        __u8                    *token_buf;
+        int                      token_buflen;
+        __u32                    buflens[2], major;
         int                      msglen, rc;
-        __u32                    major;
         ENTRY;
 
-        /* embedded lustre_msg might have been shrinked */
-        if (req->rq_replen != rs->rs_repbuf->lm_buflens[0])
-                lustre_shrink_msg(rs->rs_repbuf, 0, req->rq_replen, 1);
-
-        /* clear data length */
-        msglen = lustre_msg_size_v2(rs->rs_repbuf->lm_bufcount,
-                                    rs->rs_repbuf->lm_buflens);
-
-        /* clear text */
-        msgobj.len = msglen;
-        msgobj.data = (__u8 *) rs->rs_repbuf;
+        /* get clear data length. note embedded lustre_msg might
+         * have been shrunk */
+        if (req->rq_replen != lustre_msg_buflen(rs->rs_repbuf, 0))
+                msglen = lustre_shrink_msg(rs->rs_repbuf, 0, req->rq_replen, 1);
+        else
+                msglen = lustre_msg_size_v2(rs->rs_repbuf->lm_bufcount,
+                                            rs->rs_repbuf->lm_buflens);
+
+        /* temporarily use tail of buffer to hold gss header data */
+        LASSERT(msglen + PTLRPC_GSS_HEADER_SIZE <= rs->rs_repbuf_len);
+        ghdr = (struct gss_header *) ((char *) rs->rs_repbuf +
+                                rs->rs_repbuf_len - PTLRPC_GSS_HEADER_SIZE);
+        ghdr->gh_version = PTLRPC_GSS_VERSION;
+        ghdr->gh_sp = LUSTRE_SP_ANY;
+        ghdr->gh_flags = 0;
+        ghdr->gh_proc = PTLRPC_GSS_PROC_DATA;
+        ghdr->gh_seq = grctx->src_wirectx.gw_seq;
+        ghdr->gh_svc = SPTLRPC_SVC_PRIV;
+        ghdr->gh_handle.len = 0;
+        if (req->rq_pack_bulk)
+                ghdr->gh_flags |= LUSTRE_GSS_PACK_BULK;
 
         /* allocate temporary cipher buffer */
-        cipher_buflen = gss_estimate_payload(gctx->gsc_mechctx, msglen, 1);
-        OBD_ALLOC(cipher_buf, cipher_buflen);
-        if (!cipher_buf)
+        token_buflen = gss_mech_payload(gctx->gsc_mechctx, msglen, 1);
+        OBD_ALLOC_LARGE(token_buf, token_buflen);
+        if (token_buf == NULL)
                 RETURN(-ENOMEM);
 
-        cipher_obj.len = cipher_buflen;
-        cipher_obj.data = cipher_buf;
+        hdrobj.len = PTLRPC_GSS_HEADER_SIZE;
+        hdrobj.data = (__u8 *) ghdr;
+        msgobj.len = msglen;
+        msgobj.data = (__u8 *) rs->rs_repbuf;
+        token.len = token_buflen;
+        token.data = token_buf;
 
-        major = lgss_wrap(gctx->gsc_mechctx, &msgobj, rs->rs_repbuf_len,
-                          &cipher_obj);
+        major = lgss_wrap(gctx->gsc_mechctx, &hdrobj, &msgobj,
+                          rs->rs_repbuf_len - PTLRPC_GSS_HEADER_SIZE, &token);
         if (major != GSS_S_COMPLETE) {
-                CERROR("priv: wrap message error: %08x\n", major);
+                CERROR("wrap message error: %08x\n", major);
                 GOTO(out_free, rc = -EPERM);
         }
-        LASSERT(cipher_obj.len <= cipher_buflen);
+        LASSERT(token.len <= token_buflen);
 
         /* we are about to override data at rs->rs_repbuf, nullify pointers
          * to it, to catch further illegal usage. */
-        grctx->src_repbsd = NULL;
-        grctx->src_repbsd_size = 0;
+        if (req->rq_pack_bulk) {
+                grctx->src_repbsd = NULL;
+                grctx->src_repbsd_size = 0;
+        }
 
-        /* now the real wire data */
+        /* now fill the actual wire data
+         * - gss header
+         * - gss token
+         */
         buflens[0] = PTLRPC_GSS_HEADER_SIZE;
-        buflens[1] = gss_estimate_payload(gctx->gsc_mechctx, buflens[0], 0);
-        buflens[2] = cipher_obj.len;
+        buflens[1] = token.len;
 
-        LASSERT(lustre_msg_size_v2(3, buflens) <= rs->rs_repbuf_len);
-        lustre_init_msg_v2(rs->rs_repbuf, 3, buflens, NULL);
-        rs->rs_repbuf->lm_secflvr = req->rq_sec_flavor;
+        rs->rs_repdata_len = lustre_msg_size_v2(2, buflens);
+        LASSERT(rs->rs_repdata_len <= rs->rs_repbuf_len);
 
-        /* gss header */
-        ghdr = lustre_msg_buf(rs->rs_repbuf, 0, 0);
-        ghdr->gh_version = PTLRPC_GSS_VERSION;
-        ghdr->gh_flags = 0;
-        ghdr->gh_proc = PTLRPC_GSS_PROC_DATA;
-        ghdr->gh_seq = grctx->src_wirectx.gw_seq;
-        ghdr->gh_svc = SPTLRPC_SVC_PRIV;
-        ghdr->gh_handle.len = 0;
+        lustre_init_msg_v2(rs->rs_repbuf, 2, buflens, NULL);
+        rs->rs_repbuf->lm_secflvr = req->rq_flvr.sf_rpc;
 
-        /* header signature */
-        msgobj.len = rs->rs_repbuf->lm_buflens[0];
-        msgobj.data = lustre_msg_buf(rs->rs_repbuf, 0, 0);
-        micobj.len = rs->rs_repbuf->lm_buflens[1];
-        micobj.data = lustre_msg_buf(rs->rs_repbuf, 1, 0);
+        memcpy(lustre_msg_buf(rs->rs_repbuf, 0, 0), ghdr,
+               PTLRPC_GSS_HEADER_SIZE);
+        memcpy(lustre_msg_buf(rs->rs_repbuf, 1, 0), token.data, token.len);
 
-        major = lgss_get_mic(gctx->gsc_mechctx, 1, &msgobj, &micobj);
-        if (major != GSS_S_COMPLETE) {
-                CERROR("priv: sign message error: %08x\n", major);
-                GOTO(out_free, rc = -EPERM);
-        }
-        lustre_shrink_msg(rs->rs_repbuf, 1, micobj.len, 0);
-
-        /* cipher token */
-        memcpy(lustre_msg_buf(rs->rs_repbuf, 2, 0),
-               cipher_obj.data, cipher_obj.len);
-
-        rs->rs_repdata_len = lustre_shrink_msg(rs->rs_repbuf, 2,
-                                               cipher_obj.len, 0);
+        /* reply offset */
+        if (req->rq_packed_final &&
+            (lustre_msghdr_get_flags(req->rq_reqmsg) & MSGHDR_AT_SUPPORT))
+                req->rq_reply_off = gss_at_reply_off_priv;
+        else
+                req->rq_reply_off = 0;
 
         /* to catch upper layer's further access */
         rs->rs_msg = NULL;
@@ -2530,7 +2730,7 @@ int gss_svc_seal(struct ptlrpc_request *req,
 
         rc = 0;
 out_free:
-        OBD_FREE(cipher_buf, cipher_buflen);
+        OBD_FREE_LARGE(token_buf, token_buflen);
         RETURN(rc);
 }
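
After gss_svc_seal() the reply buffer carries exactly two segments, the gss
header and the wrapped token. A minimal sanity check of that layout is
sketched below (illustrative only; the real unwrap is done by the client-side
gss code, which is assumed here and not shown in this file):

/* Sketch: verify the shape of a privacy-mode reply as produced above. */
static int example_check_priv_reply(struct lustre_msg *repbuf)
{
        if (repbuf->lm_bufcount != 2)
                return -EPROTO;
        if (lustre_msg_buflen(repbuf, 0) < PTLRPC_GSS_HEADER_SIZE)
                return -EPROTO;
        if (lustre_msg_buflen(repbuf, 1) == 0)
                return -EPROTO;
        return 0;
}
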
 
@@ -2538,15 +2738,22 @@ int gss_svc_authorize(struct ptlrpc_request *req)
 {
         struct ptlrpc_reply_state *rs = req->rq_reply_state;
         struct gss_svc_reqctx     *grctx = gss_svc_ctx2reqctx(req->rq_svc_ctx);
-        struct gss_wire_ctx       *gw;
-        int                        rc;
+        struct gss_wire_ctx       *gw = &grctx->src_wirectx;
+        int                        early, rc;
         ENTRY;
 
-        if (gss_svc_reqctx_is_special(grctx))
+        early = (req->rq_packed_final == 0);
+
+        if (!early && gss_svc_reqctx_is_special(grctx)) {
+                LASSERT(rs->rs_repdata_len != 0);
+
+                req->rq_reply_off = gss_at_reply_off_integ;
                 RETURN(0);
+        }
 
-        gw = &grctx->src_wirectx;
-        if (gw->gw_proc != PTLRPC_GSS_PROC_DATA &&
+        /* early reply could happen in many cases */
+        if (!early &&
+            gw->gw_proc != PTLRPC_GSS_PROC_DATA &&
             gw->gw_proc != PTLRPC_GSS_PROC_DESTROY) {
                 CERROR("proc %d not support\n", gw->gw_proc);
                 RETURN(-EINVAL);
@@ -2580,57 +2787,91 @@ void gss_svc_free_rs(struct ptlrpc_reply_state *rs)
         LASSERT(rs->rs_svc_ctx);
         grctx = container_of(rs->rs_svc_ctx, struct gss_svc_reqctx, src_base);
 
-        /* paranoid, maybe not necessary */
-        grctx->src_reqbsd = NULL;
-        grctx->src_repbsd = NULL;
-
         gss_svc_reqctx_decref(grctx);
         rs->rs_svc_ctx = NULL;
 
         if (!rs->rs_prealloc)
-                OBD_FREE(rs, rs->rs_size);
+                OBD_FREE_LARGE(rs, rs->rs_size);
 }
 
 void gss_svc_free_ctx(struct ptlrpc_svc_ctx *ctx)
 {
-        LASSERT(atomic_read(&ctx->sc_refcount) == 0);
-        gss_svc_reqctx_free(gss_svc_ctx2reqctx(ctx));
+       LASSERT(atomic_read(&ctx->sc_refcount) == 0);
+       gss_svc_reqctx_free(gss_svc_ctx2reqctx(ctx));
 }
 
 int gss_copy_rvc_cli_ctx(struct ptlrpc_cli_ctx *cli_ctx,
                          struct ptlrpc_svc_ctx *svc_ctx)
 {
         struct gss_cli_ctx     *cli_gctx = ctx2gctx(cli_ctx);
-        struct gss_svc_reqctx  *grctx;
+        struct gss_svc_ctx     *svc_gctx = gss_svc_ctx2gssctx(svc_ctx);
         struct gss_ctx         *mechctx = NULL;
 
+        LASSERT(cli_gctx);
+        LASSERT(svc_gctx && svc_gctx->gsc_mechctx);
+
         cli_gctx->gc_proc = PTLRPC_GSS_PROC_DATA;
         cli_gctx->gc_win = GSS_SEQ_WIN;
-        atomic_set(&cli_gctx->gc_seq, 0);
 
-        grctx = container_of(svc_ctx, struct gss_svc_reqctx, src_base);
-        LASSERT(grctx->src_ctx);
-        LASSERT(grctx->src_ctx->gsc_mechctx);
-
-        if (lgss_copy_reverse_context(grctx->src_ctx->gsc_mechctx, &mechctx) !=
+       /* The problem is that the reverse ctx might get lost in some recovery
+        * situations, and the same svc_ctx will be used to re-create it.
+        * If a callback is sent out before that, a new reverse ctx starting
+        * with sequence 0 will lead to future callback RPCs being treated as
+        * replays.
+        *
+        * Each reverse root ctx will record its latest sequence number on its
+        * buddy svcctx before being destroyed, so here we continue to use it.
+        */
+       atomic_set(&cli_gctx->gc_seq, svc_gctx->gsc_rvs_seq);
+
+       if (gss_svc_upcall_dup_handle(&cli_gctx->gc_svc_handle, svc_gctx)) {
+               CERROR("failed to dup svc handle\n");
+               goto err_out;
+       }
+
+        if (lgss_copy_reverse_context(svc_gctx->gsc_mechctx, &mechctx) !=
             GSS_S_COMPLETE) {
                 CERROR("failed to copy mech context\n");
-                return -ENOMEM;
+                goto err_svc_handle;
         }
 
-        if (rawobj_dup(&cli_gctx->gc_handle, &grctx->src_ctx->gsc_rvs_hdl)) {
+        if (rawobj_dup(&cli_gctx->gc_handle, &svc_gctx->gsc_rvs_hdl)) {
                 CERROR("failed to dup reverse handle\n");
-                lgss_delete_sec_context(&mechctx);
-                return -ENOMEM;
+                goto err_ctx;
         }
 
         cli_gctx->gc_mechctx = mechctx;
         gss_cli_ctx_uptodate(cli_gctx);
 
         return 0;
+
+err_ctx:
+        lgss_delete_sec_context(&mechctx);
+err_svc_handle:
+        rawobj_free(&cli_gctx->gc_svc_handle);
+err_out:
+        return -ENOMEM;
+}
+
+static void gss_init_at_reply_offset(void)
+{
+        __u32 buflens[3];
+        int clearsize;
+
+        buflens[0] = PTLRPC_GSS_HEADER_SIZE;
+        buflens[1] = lustre_msg_early_size();
+        buflens[2] = gss_cli_payload(NULL, buflens[1], 0);
+        gss_at_reply_off_integ = lustre_msg_size_v2(3, buflens);
+
+        buflens[0] = lustre_msg_early_size();
+        clearsize = lustre_msg_size_v2(1, buflens);
+        buflens[0] = PTLRPC_GSS_HEADER_SIZE;
+        buflens[1] = gss_cli_payload(NULL, clearsize, 0);
+        buflens[2] = gss_cli_payload(NULL, clearsize, 1);
+        gss_at_reply_off_priv = lustre_msg_size_v2(3, buflens);
 }
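
The two offsets above are plain lustre_msg_size_v2() results over fixed
segment lists. Assuming (this is not shown in this file) that
lustre_msg_size_v2() amounts to a rounded message header plus each segment
rounded up to 8 bytes, the arithmetic reduces to a sketch like:

/* Sketch only: approximate reimplementation of the size arithmetic behind
 * the fixed early-reply offsets; the real helper is lustre_msg_size_v2().
 */
static inline int example_size_round8(int val)
{
        return (val + 7) & ~7;
}

static int example_msg_size(int count, const __u32 *lens)
{
        /* header: fixed lustre_msg_v2 fields plus one __u32 length per seg */
        int size = example_size_round8(offsetof(struct lustre_msg_v2,
                                                lm_buflens[count]));
        int i;

        for (i = 0; i < count; i++)
                size += example_size_round8(lens[i]);

        return size;
}
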
 
-int __init sptlrpc_gss_init(void)
+static int __init sptlrpc_gss_init(void)
 {
         int rc;
 
@@ -2646,55 +2887,63 @@ int __init sptlrpc_gss_init(void)
         if (rc)
                 goto out_cli_upcall;
 
-        rc = init_kerberos_module();
-        if (rc)
-                goto out_svc_upcall;
+       rc = init_null_module();
+       if (rc)
+               goto out_svc_upcall;
 
-        /* register policy after all other stuff be intialized, because it
-         * might be in used immediately after the registration. */
+       rc = init_kerberos_module();
+       if (rc)
+               goto out_null;
 
-        rc = gss_init_keyring();
-        if (rc)
-                goto out_kerberos;
+       rc = init_sk_module();
+       if (rc)
+               goto out_kerberos;
 
-#ifdef HAVE_GSS_PIPEFS
-        rc = gss_init_pipefs();
-        if (rc)
-                goto out_keyring;
-#endif
+       /* register policy after all other stuff is initialized, because it
+        * might be in use immediately after the registration. */
 
-        return 0;
+       rc = gss_init_keyring();
+       if (rc)
+               goto out_sk;
 
-#ifdef HAVE_GSS_PIPEFS
-out_keyring:
-        gss_exit_keyring();
-#endif
+       rc = gss_init_pipefs();
+       if (rc)
+               goto out_keyring;
+
+       gss_init_at_reply_offset();
 
+       return 0;
+
+out_keyring:
+       gss_exit_keyring();
+out_sk:
+       cleanup_sk_module();
 out_kerberos:
-        cleanup_kerberos_module();
+       cleanup_kerberos_module();
+out_null:
+       cleanup_null_module();
 out_svc_upcall:
-        gss_exit_svc_upcall();
+       gss_exit_svc_upcall();
 out_cli_upcall:
-        gss_exit_cli_upcall();
+       gss_exit_cli_upcall();
 out_lproc:
-        gss_exit_lproc();
-        return rc;
+       gss_exit_lproc();
+       return rc;
 }
 
 static void __exit sptlrpc_gss_exit(void)
 {
         gss_exit_keyring();
-#ifdef HAVE_GSS_PIPEFS
         gss_exit_pipefs();
-#endif
         cleanup_kerberos_module();
         gss_exit_svc_upcall();
         gss_exit_cli_upcall();
         gss_exit_lproc();
 }
 
-MODULE_AUTHOR("Cluster File Systems, Inc. <info@clusterfs.com>");
-MODULE_DESCRIPTION("GSS security policy for Lustre");
+MODULE_AUTHOR("OpenSFS, Inc. <http://www.lustre.org/>");
+MODULE_DESCRIPTION("Lustre GSS security policy");
+MODULE_VERSION(LUSTRE_VERSION_STRING);
 MODULE_LICENSE("GPL");
 
 module_init(sptlrpc_gss_init);