* Copyright (c) 2009, 2010, Oracle and/or its affiliates. All rights reserved.
* Use is subject to license terms.
*
- * Copyright (c) 2011, 2012, Intel Corporation.
+ * Copyright (c) 2011, 2014, Intel Corporation.
*/
/*
* This file is part of Lustre, http://www.lustre.org/
#include <lustre_export.h>
#include <lustre_update.h>
#include <lustre_disk.h>
+#include <lustre_lfsck.h>
+
+/* One distribute transaction replay request. Each instance represents
+ * a single distribute transaction replay operation, and the updates for
+ * each MDT involved are linked on dtrq_sub_list. */
+struct distribute_txn_replay_req {
+ /* update record; dtrq_lur_size is presumably the size of that
+ * record (TODO confirm the unit) */
+ struct llog_update_record *dtrq_lur;
+ int dtrq_lur_size;
+
+ /* linkage into the distribute transaction replay
+ * list (tdtd_replay_list) */
+ struct list_head dtrq_list;
+
+ /* all sub updates are linked here; dtrq_sub_list_lock presumably
+ * protects this list (TODO confirm) */
+ struct list_head dtrq_sub_list;
+ spinlock_t dtrq_sub_list_lock;
+};
+
+/* One sub replay item under a distribute transaction. A distribute
+ * transaction operates on two or more MDTs, and the updates on each
+ * MDT are represented by one instance of this structure. */
+struct distribute_txn_replay_req_sub {
+ __u32 dtrqs_mdt_index;
+
+ /* All cookies for the update are linked on dtrqs_cookie_list.
+ * NOTE(review): dtrqs_cookie_list_lock presumably guards that list
+ * and dtrqs_list presumably links this item into the parent's
+ * dtrq_sub_list - confirm both against the users. */
+ spinlock_t dtrqs_cookie_list_lock;
+ struct list_head dtrqs_cookie_list;
+ struct list_head dtrqs_list;
+};
+
+struct target_distribute_txn_data; /* forward declaration, needed by the
+ * handler typedef that follows: distribute_txn_replay_handler_t is the
+ * type of the tdtd_replay_handler callback; it takes the env, the
+ * target_distribute_txn_data and one replay request and returns int */
+typedef int (*distribute_txn_replay_handler_t)(struct lu_env *env,
+ struct target_distribute_txn_data *tdtd,
+ struct distribute_txn_replay_req *dtrq);
+struct target_distribute_txn_data {
+ /* tdtd_batchid is the distribution ID used to identify the update
+ * logs that different MDTs hold for one operation.
+ * NOTE(review): tdtd_batchid_lock presumably serializes access to
+ * it - confirm. */
+ spinlock_t tdtd_batchid_lock;
+ __u64 tdtd_batchid;
+ struct lu_target *tdtd_lut;
+ struct dt_object *tdtd_batchid_obj;
+ struct dt_device *tdtd_dt;
+
+ /* Committed batchid for distribute transaction */
+ __u64 tdtd_committed_batchid;
+
+ /* List for distribute transaction */
+ struct list_head tdtd_list;
+
+ /* Threads to manage distribute transaction: wait queue of the
+ * commit thread, plus a reference counter */
+ wait_queue_head_t tdtd_commit_thread_waitq;
+ atomic_t tdtd_refcount;
+
+ /* recovery update: the replay callback and the list of pending
+ * struct distribute_txn_replay_req (linked through dtrq_list) */
+ distribute_txn_replay_handler_t tdtd_replay_handler;
+ struct list_head tdtd_replay_list;
+ spinlock_t tdtd_replay_list_lock;
+ /* last replay update transno */
+ __u64 tdtd_last_update_transno;
+ __u32 tdtd_replay_ready:1;
+
+};
struct lu_target {
struct obd_device *lut_obd;
struct dt_device *lut_bottom;
+ struct target_distribute_txn_data *lut_tdtd;
+ struct ptlrpc_thread lut_tdtd_commit_thread;
+
/* supported opcodes and handlers for this target */
struct tgt_opc_slice *lut_slice;
__u32 lut_reply_fail_id;
/* sptlrpc rules */
rwlock_t lut_sptlrpc_lock;
struct sptlrpc_rule_set lut_sptlrpc_rset;
+ spinlock_t lut_flags_lock;
int lut_sec_level;
- unsigned int lut_mds_capa:1,
- lut_oss_capa:1;
-
- /* LAST_RCVD parameters */
+ unsigned int lut_syncjournal:1,
+ lut_sync_lock_cancel:2,
+ /* e.g. OST node - NOTE(review): presumably set on
+ * targets that do not reconstruct replies; confirm */
+ lut_no_reconstruct:1;
/** last_rcvd file */
struct dt_object *lut_last_rcvd;
/* transaction callbacks */
spinlock_t lut_client_bitmap_lock;
/** Bitmap of known clients */
unsigned long *lut_client_bitmap;
+ /* Number of clients supporting multiple modify RPCs
+ * recorded in the bitmap (presumably lut_client_bitmap) */
+ atomic_t lut_num_clients;
+ /* Client generation to identify client slot reuse */
+ atomic_t lut_client_generation;
+ /** reply_data file */
+ struct dt_object *lut_reply_data;
+ /** Bitmap of used slots in the reply data file; a pointer to
+ * pointers, presumably one per chunk of slots (TODO confirm) */
+ unsigned long **lut_reply_bitmap;
+};
+
+/* Reply bitmap sizing: number of slots per chunk (1<<20 = 1048576) and
+ * the maximum number of chunks (16) */
+#define LUT_REPLY_SLOTS_PER_CHUNK (1<<20)
+#define LUT_REPLY_SLOTS_MAX_CHUNKS 16
+
+/**
+ * Target reply data: one reply record, holding a copy of the on-disk
+ * reply data together with its list linkage, the pre-operation versions,
+ * its slot index in the reply_data file and the tag the client used.
+ */
+struct tg_reply_data {
+ /** chain of reply data anchored in tg_export_data */
+ struct list_head trd_list;
+ /** copy of on-disk reply data */
+ struct lsd_reply_data trd_reply;
+ /** versions for Version Based Recovery (four entries) */
+ __u64 trd_pre_versions[4];
+ /** slot index in reply_data file */
+ int trd_index;
+ /** tag the client used */
+ __u16 trd_tag;
};
extern struct lu_context_key tgt_session_key;
struct obd_export *tsi_exp;
const struct lu_env *tsi_env;
struct lu_target *tsi_tgt;
+
+ const struct mdt_body *tsi_mdt_body;
+ struct ost_body *tsi_ost_body;
+ struct lu_object *tsi_corpus;
+
+ struct lu_fid tsi_fid;
+ struct ldlm_res_id tsi_resid;
+
+ /* object affected by VBR, for last_rcvd_update */
+ struct dt_object *tsi_vbr_obj;
+ /* opdata for mdt_reint_open(), has the same value as
+ * ldlm_reply:lock_policy_res1. The tgt_update_last_rcvd() stores
+ * this value onto disk for recovery when tgt_txn_stop_cb() is called.
+ */
+ __u64 tsi_opdata;
+
/*
* Additional fail id that can be set by handler.
*/
int tsi_reply_fail_id;
- int tsi_request_fail_id;
-
- __u32 tsi_has_trans:1; /* has txn already? */
+ bool tsi_preprocessed;
+ /* request JobID */
+ char *tsi_jobid;
};
static inline struct tgt_session_info *tgt_ses_info(const struct lu_env *env)
return tsi;
}
+/* Record obj as tsi_vbr_obj in the session info attached to env.
+ * Does nothing when env carries no session (le_ses is NULL). */
+static inline void tgt_vbr_obj_set(const struct lu_env *env,
+				   struct dt_object *obj)
+{
+	if (env->le_ses == NULL)
+		return;
+
+	tgt_ses_info(env)->tsi_vbr_obj = obj;
+}
+
+/* OR flags into tsi_opdata of the session info attached to env.
+ * Does nothing when env carries no session (le_ses is NULL). */
+static inline void tgt_opdata_set(const struct lu_env *env, __u64 flags)
+{
+	if (env->le_ses == NULL)
+		return;
+
+	tgt_ses_info(env)->tsi_opdata |= flags;
+}
+
+/* Clear flags from tsi_opdata of the session info attached to env.
+ * Does nothing when env carries no session (le_ses is NULL). */
+static inline void tgt_opdata_clear(const struct lu_env *env, __u64 flags)
+{
+	if (env->le_ses == NULL)
+		return;
+
+	tgt_ses_info(env)->tsi_opdata &= ~flags;
+}
+
/*
* Generic unified target support.
*/
/* Request version for this opcode */
int th_version;
/* Handler function */
- int (*th_act)(struct tgt_session_info *tti);
+ int (*th_act)(struct tgt_session_info *tsi);
+ /* Handler function for high priority requests */
+ void (*th_hp)(struct tgt_session_info *tsi);
/* Request format for this request */
const struct req_format *th_fmt;
};
return !!(lustre_msg_get_flags(req->rq_reqmsg) & MSG_REPLAY);
}
+/* Tell whether the export's connect flags include
+ * OBD_CONNECT_MULTIMODRPCS. */
+static inline bool tgt_is_multimodrpcs_client(struct obd_export *exp)
+{
+	return (exp_connect_flags(exp) & OBD_CONNECT_MULTIMODRPCS) != 0;
+}
+
+
/* target/tgt_handler.c
*
* Request entry points (tgt_request_handle, tgt_hpreq_handler), the
* handlers that take a struct tgt_session_info (always named tsi), the
* tgt_extent_lock/tgt_brw_lock helper families, LFSCK callback
* registration and the exported handler tables. */
int tgt_request_handle(struct ptlrpc_request *req);
char *tgt_name(struct lu_target *tgt);
void tgt_counter_incr(struct obd_export *exp, int opcode);
int tgt_connect_check_sptlrpc(struct ptlrpc_request *req,
struct obd_export *exp);
+int tgt_adapt_sptlrpc_conf(struct lu_target *tgt, int initial);
int tgt_connect(struct tgt_session_info *tsi);
int tgt_disconnect(struct tgt_session_info *tsi);
int tgt_obd_ping(struct tgt_session_info *tsi);
int tgt_sec_ctx_init(struct tgt_session_info *tsi);
int tgt_sec_ctx_init_cont(struct tgt_session_info *tsi);
int tgt_sec_ctx_fini(struct tgt_session_info *tsi);
-
-extern struct tgt_handler tgt_sec_ctx_handlers[];
+int tgt_sendpage(struct tgt_session_info *tsi, struct lu_rdpg *rdpg, int nob);
+int tgt_validate_obdo(struct tgt_session_info *tsi, struct obdo *oa);
+int tgt_sync(const struct lu_env *env, struct lu_target *tgt,
+ struct dt_object *obj, __u64 start, __u64 end);
+
+int tgt_io_thread_init(struct ptlrpc_thread *thread);
+void tgt_io_thread_done(struct ptlrpc_thread *thread);
+
+int tgt_extent_lock(struct ldlm_namespace *ns, struct ldlm_res_id *res_id,
+ __u64 start, __u64 end, struct lustre_handle *lh,
+ int mode, __u64 *flags);
+void tgt_extent_unlock(struct lustre_handle *lh, ldlm_mode_t mode);
+int tgt_brw_lock(struct ldlm_namespace *ns, struct ldlm_res_id *res_id,
+ struct obd_ioobj *obj, struct niobuf_remote *nb,
+ struct lustre_handle *lh, int mode);
+void tgt_brw_unlock(struct obd_ioobj *obj, struct niobuf_remote *niob,
+ struct lustre_handle *lh, int mode);
+int tgt_brw_read(struct tgt_session_info *tsi);
+int tgt_brw_write(struct tgt_session_info *tsi);
+int tgt_hpreq_handler(struct ptlrpc_request *req);
+void tgt_register_lfsck_in_notify(int (*notify)(const struct lu_env *,
+ struct dt_device *,
+ struct lfsck_request *,
+ struct thandle *));
+void tgt_register_lfsck_query(int (*query)(const struct lu_env *,
+ struct dt_device *,
+ struct lfsck_request *));
+bool req_can_reconstruct(struct ptlrpc_request *req, struct tg_reply_data *trd);
+
+extern struct tgt_handler tgt_lfsck_handlers[];
extern struct tgt_handler tgt_obd_handlers[];
extern struct tgt_handler tgt_dlm_handlers[];
extern struct tgt_handler tgt_llog_handlers[];
void *tgt_cb_data;
};
+
/* target/tgt_main.c */
void tgt_boot_epoch_update(struct lu_target *lut);
int tgt_last_commit_cb_add(struct thandle *th, struct lu_target *lut,
int sync);
int tgt_truncate_last_rcvd(const struct lu_env *env, struct lu_target *tg,
loff_t off);
-int tgt_last_rcvd_update(const struct lu_env *env, struct lu_target *tgt,
- struct dt_object *obj, __u64 opdata,
- struct thandle *th, struct ptlrpc_request *req);
+int tgt_reply_data_init(const struct lu_env *env, struct lu_target *tgt);
+bool tgt_lookup_reply(struct ptlrpc_request *req, struct tg_reply_data *trd);
+
+/* target/update_trans.c: set-up and tear-down of the per-target
+ * distribute transaction data */
+int distribute_txn_init(const struct lu_env *env,
+ struct lu_target *lut,
+ struct target_distribute_txn_data *tdtd,
+ __u32 index);
+void distribute_txn_fini(const struct lu_env *env,
+ struct target_distribute_txn_data *tdtd);
+
+/* target/update_recovery.c: handling of distribute transaction replay
+ * requests (dtrq, struct distribute_txn_replay_req) and their per-MDT
+ * sub items */
+int insert_update_records_to_replay_list(
+ struct target_distribute_txn_data *tdtd,
+ struct llog_update_record *lur,
+ struct llog_cookie *cookie, __u32 index);
+void dtrq_list_dump(struct target_distribute_txn_data *tdtd,
+ unsigned int mask);
+void dtrq_list_destroy(struct target_distribute_txn_data *tdtd);
+int distribute_txn_replay_handle(struct lu_env *env,
+ struct target_distribute_txn_data *tdtd,
+ struct distribute_txn_replay_req *dtrq);
+__u64 distribute_txn_get_next_transno(struct target_distribute_txn_data *tdtd);
+struct distribute_txn_replay_req *
+distribute_txn_get_next_req(struct target_distribute_txn_data *tdtd);
+void dtrq_destroy(struct distribute_txn_replay_req *dtrq);
+struct distribute_txn_replay_req_sub *
+dtrq_sub_lookup(struct distribute_txn_replay_req *dtrq, __u32 mdt_index);
+
+
/* ESERIOUS is a flag bit (0x0001000); the check that follows this enum
* tests it against a negated negative return code (-rc & ESERIOUS). */
enum {
ESERIOUS = 0x0001000
};
return (rc < 0 && -rc & ESERIOUS);
}
+/**
+ * Keep server-side uid/gid away from a remote client: when
+ * exp_connect_rmtclient() reports true for the export, overwrite the
+ * obdo uid and gid with -1 and clear OBD_MD_FLUID and OBD_MD_FLGID
+ * from o_valid. Otherwise the obdo is left untouched.
+ */
+static inline void tgt_drop_id(struct obd_export *exp, struct obdo *oa)
+{
+	if (!unlikely(exp_connect_rmtclient(exp)))
+		return;
+
+	oa->o_valid &= ~(OBD_MD_FLUID | OBD_MD_FLGID);
+	oa->o_gid = -1;
+	oa->o_uid = -1;
+}
+
/*
* Unified target generic handlers macros and generic functions.
*
* TGT_RPC_HANDLER_HP() expands to a designated initializer for slot
* [opc - base] of a handler array: th_name is the stringified opcode,
* th_fail_id is OBD_FAIL_<opc>_NET, and th_flags, th_act, th_fmt,
* th_version and th_hp are taken directly from the arguments.
* TGT_RPC_HANDLER() produces the same entry with th_hp set to NULL.
*/
-#define TGT_RPC_HANDLER(base, flags, opc, fn, fmt, version) \
+#define TGT_RPC_HANDLER_HP(base, flags, opc, fn, hp, fmt, version) \
[opc - base] = { \
.th_name = #opc, \
.th_fail_id = OBD_FAIL_ ## opc ## _NET, \
.th_flags = flags, \
.th_act = fn, \
.th_fmt = fmt, \
- .th_version = version \
+ .th_version = version, \
+ .th_hp = hp, \
}
+#define TGT_RPC_HANDLER(base, flags, opc, fn, fmt, version) \
+ TGT_RPC_HANDLER_HP(base, flags, opc, fn, NULL, fmt, version)
/* MDT Request with a format known in advance; entries are indexed from
* MDS_FIRST_OPC and carry LUSTRE_MDS_VERSION.
* NOTE(review): as shown here the request format argument is NULL, not
* &RQF_<name> - confirm this matches "known in advance". */
#define TGT_MDT_HDL(flags, name, fn) \
TGT_RPC_HANDLER(MDS_FIRST_OPC, flags, name, fn, NULL, \
LUSTRE_MDS_VERSION)
+/* OST Request with a format known in advance (&RQF_<name>); entries
+ * are indexed from OST_FIRST_OPC and carry LUSTRE_OST_VERSION.
+ * TGT_OST_HDL_HP additionally sets the high-priority handler hp. */
+#define TGT_OST_HDL(flags, name, fn) \
+ TGT_RPC_HANDLER(OST_FIRST_OPC, flags, name, fn, &RQF_ ## name, \
+ LUSTRE_OST_VERSION)
+#define TGT_OST_HDL_HP(flags, name, fn, hp) \
+ TGT_RPC_HANDLER_HP(OST_FIRST_OPC, flags, name, fn, hp, \
+ &RQF_ ## name, LUSTRE_OST_VERSION)
+
/* MGS request with a format known in advance (&RQF_<name>); entries are
* indexed from MGS_FIRST_OPC and carry LUSTRE_MDS_VERSION */
#define TGT_MGS_HDL(flags, name, fn) \
TGT_RPC_HANDLER(MGS_FIRST_OPC, flags, name, fn, &RQF_ ## name, \
LUSTRE_MDS_VERSION)
/* FID Location Database handlers; entries are indexed from FLD_QUERY,
* carry LUSTRE_MDS_VERSION, and the _VAR form passes NULL as the
* request format */
-#define TGT_FLD_HDL(flags, name, fn) \
- TGT_RPC_HANDLER(FLD_QUERY, flags, name, fn, &RQF_ ## name, \
+#define TGT_FLD_HDL_VAR(flags, name, fn) \
+ TGT_RPC_HANDLER(FLD_QUERY, flags, name, fn, NULL, \
LUSTRE_MDS_VERSION)
+/* LFSCK handlers: format &RQF_<name>, entries indexed from
+ * LFSCK_FIRST_OPC and carrying LUSTRE_OBD_VERSION */
+#define TGT_LFSCK_HDL(flags, name, fn) \
+ TGT_RPC_HANDLER(LFSCK_FIRST_OPC, flags, name, fn, \
+ &RQF_ ## name, LUSTRE_OBD_VERSION)
+
/* Update request with a format known in advance (&RQF_<name>); entries
* are indexed from OUT_UPDATE and carry LUSTRE_MDS_VERSION */
#define TGT_UPDATE_HDL(flags, name, fn) \
- TGT_RPC_HANDLER(UPDATE_OBJ, flags, name, fn, &RQF_ ## name, \
+ TGT_RPC_HANDLER(OUT_UPDATE, flags, name, fn, &RQF_ ## name, \
LUSTRE_MDS_VERSION)
#endif /* __LUSTRE_LU_TARGET_H */