X-Git-Url: https://git.whamcloud.com/?p=fs%2Flustre-release.git;a=blobdiff_plain;f=lustre%2Fmdt%2Fmdt_internal.h;h=5bf811f4fbe008894618daf2079a2ce6fdf64eaf;hp=d0b9d8c4fae9e293faf36bbc321307ac0000add5;hb=640ed6104453e912a5c7766d265a36a30a31761d;hpb=d185bf805b71079343b42521fafdd734d52d052b;ds=sidebyside diff --git a/lustre/mdt/mdt_internal.h b/lustre/mdt/mdt_internal.h index d0b9d8c..5bf811f 100644 --- a/lustre/mdt/mdt_internal.h +++ b/lustre/mdt/mdt_internal.h @@ -23,7 +23,7 @@ * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved. * Use is subject to license terms. * - * Copyright (c) 2011, 2016, Intel Corporation. + * Copyright (c) 2011, 2017, Intel Corporation. */ /* * This file is part of Lustre, http://www.lustre.org/ @@ -47,7 +47,6 @@ #include #include #include -#include #include #include #include @@ -66,15 +65,15 @@ struct mdt_object; /* file data for open files on MDS */ struct mdt_file_data { /** portals handle must be first */ - struct portals_handle mfd_handle; + struct portals_handle mfd_open_handle; /** open mode provided by client */ - __u64 mfd_mode; + u64 mfd_open_flags; /** protected by med_open_lock */ struct list_head mfd_list; /** xid of the open request */ __u64 mfd_xid; /** old handle in replay case */ - struct lustre_handle mfd_old_handle; + struct lustre_handle mfd_open_handle_old; /** point to opened object */ struct mdt_object *mfd_object; }; @@ -129,35 +128,38 @@ static inline char *cdt_mdt_state2str(int state) struct coordinator { wait_queue_head_t cdt_waitq; /**< cdt wait queue */ bool cdt_event; /**< coordinator event */ + struct task_struct *cdt_task; /**< cdt thread handle */ struct lu_env cdt_env; /**< coordinator lustre * env */ struct lu_context cdt_session; /** session for lu_ucred */ struct proc_dir_entry *cdt_proc_dir; /**< cdt /proc directory */ __u64 cdt_policy; /**< policy flags */ enum cdt_states cdt_state; /**< state */ - spinlock_t cdt_state_lock; /**< cdt_state lock */ - atomic_t cdt_compound_id; /**< compound id - * counter */ + struct mutex cdt_state_lock; /**< cdt_state lock */ __u64 cdt_last_cookie; /**< last cookie * allocated */ - struct mutex cdt_llog_lock; /**< protect llog + struct rw_semaphore cdt_llog_lock; /**< protect llog * access */ struct rw_semaphore cdt_agent_lock; /**< protect agent list */ struct rw_semaphore cdt_request_lock; /**< protect request * list */ struct mutex cdt_restore_lock; /**< protect restore * list */ - cfs_time_t cdt_loop_period; /**< llog scan period */ - cfs_time_t cdt_grace_delay; /**< request grace + time64_t cdt_loop_period; /**< llog scan period */ + time64_t cdt_grace_delay; /**< request grace * delay */ - cfs_time_t cdt_active_req_timeout; /**< request timeout */ + time64_t cdt_active_req_timeout; /**< request timeout */ __u32 cdt_default_archive_id; /**< archive id used * when none are * specified */ __u64 cdt_max_requests; /**< max count of started * requests */ - atomic_t cdt_request_count; /**< current count of - * started requests */ + /** Current count of active requests */ + atomic_t cdt_request_count; /** total */ + atomic_t cdt_archive_count; + atomic_t cdt_restore_count; + atomic_t cdt_remove_count; + /* started requests (struct cdt_agent_req:car_cookie_hash) * indexed by cookie */ struct cfs_hash *cdt_request_cookie_hash; @@ -165,18 +167,40 @@ struct coordinator { struct list_head cdt_request_list; struct list_head cdt_agents; /**< list of register * agents */ - struct list_head cdt_restore_hdl; /**< list of restore lock - * handles */ + struct list_head cdt_restore_handle_list; + + /* Hash of cookies to locations of record locations in agent + * request log. */ + struct cfs_hash *cdt_agent_record_hash; + /* Bitmasks indexed by the HSMA_XXX constants. */ __u64 cdt_user_request_mask; __u64 cdt_group_request_mask; __u64 cdt_other_request_mask; + + /* Remove archive on last unlink policy */ + bool cdt_remove_archive_on_last_unlink; + + bool cdt_wakeup_coordinator; }; /* mdt state flag bits */ #define MDT_FL_CFGLOG 0 #define MDT_FL_SYNCED 1 +/* possible values for mo_dom_lock */ +enum { + NO_DOM_LOCK_ON_OPEN = 0, + TRYLOCK_DOM_ON_OPEN = 1, + ALWAYS_DOM_LOCK_ON_OPEN = 2, + NUM_DOM_LOCK_ON_OPEN_MODES +}; + +struct mdt_statfs_cache { + struct obd_statfs msf_osfs; + __u64 msf_age; +}; + struct mdt_device { /* super-class */ struct lu_device mdt_lu_dev; @@ -190,6 +214,7 @@ struct mdt_device { struct md_device *mdt_child; struct dt_device *mdt_bottom; struct obd_export *mdt_bottom_exp; + struct local_oid_storage *mdt_los; /** target device */ struct lu_target mdt_lut; /* @@ -199,7 +224,10 @@ struct mdt_device { unsigned int mo_user_xattr:1, mo_acl:1, mo_cos:1, - mo_evict_tgt_nids:1; + mo_evict_tgt_nids:1, + mo_dom_read_open:1, + mo_migrate_hsm_allowed:1; + unsigned int mo_dom_lock; } mdt_opts; /* mdt state flags */ unsigned long mdt_state; @@ -213,21 +241,28 @@ struct mdt_device { int mdt_max_ea_size; + /* preferred BRW size, decided by storage type and capability */ + __u32 mdt_brw_size; + struct upcall_cache *mdt_identity_cache; unsigned int mdt_capa_conf:1, /* Enable remote dir on non-MDT0 */ mdt_enable_remote_dir:1, + mdt_enable_striped_dir:1, + mdt_enable_dir_migration:1, mdt_skip_lfsck:1; + /* user with gid can create remote/striped + * dir, and set default dir stripe */ gid_t mdt_enable_remote_dir_gid; /* lock for osfs and md_root */ spinlock_t mdt_lock; /* statfs optimization: we cache a bit */ - struct obd_statfs mdt_osfs; - __u64 mdt_osfs_age; + struct mdt_statfs_cache mdt_sum_osfs; + struct mdt_statfs_cache mdt_osfs; /* root squash */ struct root_squash_info mdt_squash; @@ -254,6 +289,8 @@ struct mdt_device { #define MDT_SERVICE_WATCHDOG_FACTOR (2) #define MDT_COS_DEFAULT (0) +#define ENOENT_VERSION 1 /** 'virtual' version of non-existent object */ + struct mdt_object { struct lu_object_header mot_header; struct lu_object mot_obj; @@ -262,8 +299,12 @@ struct mdt_object { * attribute cache */ int mot_write_count; spinlock_t mot_write_lock; + /* Lock to protect object's SOM update. */ + struct mutex mot_som_mutex; /* Lock to protect create_data */ struct mutex mot_lov_mutex; + /* lock to protect read/write stages for Data-on-MDT files */ + struct rw_semaphore mot_dom_sem; /* Lock to protect lease open. * Lease open acquires write lock; normal open acquires read lock */ struct rw_semaphore mot_open_sem; @@ -313,8 +354,9 @@ enum { #define MDT_EREMOTE_OPEN (EREMOTE + 1024) struct mdt_reint_record { - mdt_reint_t rr_opcode; - const struct lustre_handle *rr_handle; + enum mds_reint_op rr_opcode; + const struct lustre_handle *rr_open_handle; + const struct lustre_handle *rr_lease_handle; const struct lu_fid *rr_fid1; const struct lu_fid *rr_fid2; struct lu_name rr_name; @@ -322,6 +364,7 @@ struct mdt_reint_record { void *rr_eadata; int rr_eadatalen; __u32 rr_flags; + __u16 rr_mirror_id; }; enum mdt_reint_flag { @@ -368,7 +411,8 @@ struct mdt_thread_info { /* * Object attributes. */ - struct md_attr mti_attr; + struct md_attr mti_attr; + struct md_attr mti_attr2; /* mdt_lvb.c */ /* * Body for "habeo corpus" operations. */ @@ -386,7 +430,8 @@ struct mdt_thread_info { mti_cross_ref:1, /* big_lmm buffer was used and must be used in reply */ mti_big_lmm_used:1, - mti_big_acl_used:1; + mti_big_acl_used:1, + mti_som_valid:1; /* opdata for mdt_reint_open(), has the same as * ldlm_reply:lock_policy_res1. mdt_update_last_rcvd() stores this @@ -438,15 +483,19 @@ struct mdt_thread_info { struct { struct md_attr attr; } hsm; - } mti_u; + struct { + struct md_attr attr; + } som; + } mti_u; - struct lustre_handle mti_close_handle; - loff_t mti_off; - struct lu_buf mti_buf; - struct lu_buf mti_big_buf; + struct lustre_handle mti_open_handle; + loff_t mti_off; + struct lu_buf mti_buf; + struct lu_buf mti_big_buf; /* Ops object filename */ struct lu_name mti_name; + char mti_filename[NAME_MAX + 1]; /* per-thread values, can be re-used, may be vmalloc'd */ void *mti_big_lmm; void *mti_big_acl; @@ -454,8 +503,13 @@ struct mdt_thread_info { int mti_big_aclsize; /* should be enough to fit lustre_mdt_attrs */ char mti_xattr_buf[128]; - struct ldlm_enqueue_info mti_einfo; + struct ldlm_enqueue_info mti_einfo[2]; + /* einfo used by mdt_remote_object_lock_try() */ + struct ldlm_enqueue_info mti_remote_einfo; struct tg_reply_data *mti_reply_data; + + /* FLR: layout change API */ + struct md_layout_change mti_layout; }; extern struct lu_context_key mdt_thread_key; @@ -485,13 +539,12 @@ struct cdt_agent_req { struct hlist_node car_cookie_hash; /**< find req by cookie */ struct list_head car_request_list; /**< to chain all the req. */ atomic_t car_refcount; /**< reference counter */ - __u64 car_compound_id; /**< compound id */ __u64 car_flags; /**< request original flags */ struct obd_uuid car_uuid; /**< agent doing the req. */ __u32 car_archive_id; /**< archive id */ int car_canceled; /**< request was canceled */ - cfs_time_t car_req_start; /**< start time */ - cfs_time_t car_req_update; /**< last update time */ + time64_t car_req_start; /**< start time */ + time64_t car_req_update; /**< last update time */ struct hsm_action_item *car_hai; /**< req. to the agent */ struct cdt_req_progress car_progress; /**< track data mvt * progress */ @@ -518,6 +571,11 @@ struct cdt_restore_handle { }; extern struct kmem_cache *mdt_hsm_cdt_kmem; /** restore handle slab cache */ +struct hsm_record_update { + __u64 cookie; + enum agent_req_status status; +}; + static inline const struct md_device_operations * mdt_child_ops(struct mdt_device * m) { @@ -600,6 +658,61 @@ static inline bool mdt_is_striped_client(struct obd_export *exp) return exp_connect_flags(exp) & OBD_CONNECT_DIR_STRIPE; } +enum { + LMM_NO_DOM, + LMM_DOM_ONLY, + LMM_DOM_OST +}; + +/* XXX Look into layout in MDT layer. This must be done in LOD. */ +static inline int mdt_lmm_dom_entry(struct lov_mds_md *lmm) +{ + struct lov_comp_md_v1 *comp_v1; + struct lov_mds_md *v1; + __u32 off; + int i; + + if (le32_to_cpu(lmm->lmm_magic) != LOV_MAGIC_COMP_V1) + return LMM_NO_DOM; + + comp_v1 = (struct lov_comp_md_v1 *)lmm; + off = le32_to_cpu(comp_v1->lcm_entries[0].lcme_offset); + v1 = (struct lov_mds_md *)((char *)comp_v1 + off); + + /* DoM entry is the first entry always */ + if (lov_pattern(le32_to_cpu(v1->lmm_pattern)) != LOV_PATTERN_MDT) + return LMM_NO_DOM; + + for (i = 1; i < le16_to_cpu(comp_v1->lcm_entry_count); i++) { + int j; + + off = le32_to_cpu(comp_v1->lcm_entries[i].lcme_offset); + v1 = (struct lov_mds_md *)((char *)comp_v1 + off); + + for (j = 0; j < le16_to_cpu(v1->lmm_stripe_count); j++) { + /* if there is any object on OST */ + if (le32_to_cpu(v1->lmm_objects[j].l_ost_idx) != + (__u32)-1UL) + return LMM_DOM_OST; + } + } + return LMM_DOM_ONLY; +} + +static inline bool mdt_lmm_is_flr(struct lov_mds_md *lmm) +{ + struct lov_comp_md_v1 *lcm = (typeof(lcm))lmm; + + return le32_to_cpu(lmm->lmm_magic) == LOV_MAGIC_COMP_V1 && + le16_to_cpu(lcm->lcm_mirror_count) > 0; +} + +static inline bool mdt_is_sum_statfs_client(struct obd_export *exp) +{ + return exp_connect_flags(exp) & OBD_CONNECT_FLAGS2 && + exp_connect_flags2(exp) & OBD_CONNECT2_SUM_STATFS; +} + __u64 mdt_get_disposition(struct ldlm_reply *rep, __u64 op_flag); void mdt_set_disposition(struct mdt_thread_info *info, struct ldlm_reply *rep, __u64 op_flag); @@ -625,14 +738,13 @@ int mdt_reint_object_lock(struct mdt_thread_info *info, struct mdt_object *o, bool cos_incompat); int mdt_object_lock_try(struct mdt_thread_info *info, struct mdt_object *mo, - struct mdt_lock_handle *lh, __u64 ibits); - -int mdt_reint_object_lock_try(struct mdt_thread_info *info, - struct mdt_object *o, struct mdt_lock_handle *lh, - __u64 ibits, bool cos_incompat); + struct mdt_lock_handle *lh, __u64 *ibits, + __u64 trybits, bool cos_incompat); void mdt_object_unlock(struct mdt_thread_info *info, struct mdt_object *mo, struct mdt_lock_handle *lh, int decref); +void mdt_save_lock(struct mdt_thread_info *info, struct lustre_handle *h, + enum ldlm_mode mode, int decref); struct mdt_object *mdt_object_new(const struct lu_env *env, struct mdt_device *, @@ -654,8 +766,17 @@ void mdt_client_compatibility(struct mdt_thread_info *info); int mdt_remote_object_lock(struct mdt_thread_info *mti, struct mdt_object *o, const struct lu_fid *fid, struct lustre_handle *lh, - enum ldlm_mode mode, __u64 ibits, bool nonblock, - bool cache); + enum ldlm_mode mode, __u64 ibits, bool cache); +int mdt_reint_striped_lock(struct mdt_thread_info *info, + struct mdt_object *o, + struct mdt_lock_handle *lh, + __u64 ibits, + struct ldlm_enqueue_info *einfo, + bool cos_incompat); +void mdt_reint_striped_unlock(struct mdt_thread_info *info, + struct mdt_object *o, + struct mdt_lock_handle *lh, + struct ldlm_enqueue_info *einfo, int decref); enum mdt_name_flags { MNF_FIX_ANON = 1, @@ -674,8 +795,9 @@ int mdt_pack_acl2body(struct mdt_thread_info *info, struct mdt_body *repbody, struct mdt_object *o, struct lu_nodemap *nodemap); #endif void mdt_pack_attr2body(struct mdt_thread_info *info, struct mdt_body *b, - const struct lu_attr *attr, const struct lu_fid *fid); - + const struct lu_attr *attr, const struct lu_fid *fid); +int mdt_pack_size2body(struct mdt_thread_info *info, + const struct lu_fid *fid, struct lustre_handle *lh); int mdt_getxattr(struct mdt_thread_info *info); int mdt_reint_setxattr(struct mdt_thread_info *info, struct mdt_lock_handle *lh); @@ -699,18 +821,16 @@ int mdt_export_stats_init(struct obd_device *obd, void *client_nid); int mdt_lock_new_child(struct mdt_thread_info *info, - struct mdt_object *o, - struct mdt_lock_handle *child_lockh); - -void mdt_mfd_set_mode(struct mdt_file_data *mfd, - __u64 mode); - -int mdt_reint_open(struct mdt_thread_info *info, - struct mdt_lock_handle *lhc); - -struct mdt_file_data *mdt_handle2mfd(struct mdt_export_data *med, - const struct lustre_handle *handle, - bool is_replay); + struct mdt_object *o, + struct mdt_lock_handle *child_lockh); +void mdt_mfd_set_mode(struct mdt_file_data *mfd, u64 open_flags); +int mdt_reint_open(struct mdt_thread_info *info, struct mdt_lock_handle *lhc); +struct mdt_file_data *mdt_open_handle2mfd(struct mdt_export_data *med, + const struct lustre_handle *open_handle, + bool is_replay); +int mdt_revoke_remote_lookup_lock(struct mdt_thread_info *info, + struct mdt_object *pobj, + struct mdt_object *obj); int mdt_get_info(struct tgt_session_info *tsi); int mdt_attr_get_complex(struct mdt_thread_info *info, @@ -719,6 +839,8 @@ int mdt_big_xattr_get(struct mdt_thread_info *info, struct mdt_object *o, const char *name); int mdt_stripe_get(struct mdt_thread_info *info, struct mdt_object *o, struct md_attr *ma, const char *name); +int mdt_attr_get_pfid(struct mdt_thread_info *info, struct mdt_object *o, + struct lu_fid *pfid); int mdt_write_get(struct mdt_object *o); void mdt_write_put(struct mdt_object *o); int mdt_write_read(struct mdt_object *o); @@ -730,8 +852,11 @@ int mdt_add_dirty_flag(struct mdt_thread_info *info, struct mdt_object *mo, struct md_attr *ma); int mdt_fix_reply(struct mdt_thread_info *info); int mdt_handle_last_unlink(struct mdt_thread_info *, struct mdt_object *, - const struct md_attr *); + struct md_attr *); void mdt_reconstruct_open(struct mdt_thread_info *, struct mdt_lock_handle *); +int mdt_layout_change(struct mdt_thread_info *info, struct mdt_object *obj, + struct md_layout_change *spec); +int mdt_device_sync(const struct lu_env *env, struct mdt_device *mdt); struct lu_buf *mdt_buf(const struct lu_env *env, void *area, ssize_t len); const struct lu_buf *mdt_buf_const(const struct lu_env *env, @@ -754,6 +879,13 @@ void mdt_thread_info_init(struct ptlrpc_request *req, struct mdt_thread_info *mti); void mdt_thread_info_fini(struct mdt_thread_info *mti); struct mdt_thread_info *tsi2mdt_info(struct tgt_session_info *tsi); +void mdt_intent_fixup_resent(struct mdt_thread_info *info, + struct ldlm_lock *new_lock, + struct mdt_lock_handle *lh, __u64 flags); +int mdt_intent_lock_replace(struct mdt_thread_info *info, + struct ldlm_lock **lockp, + struct mdt_lock_handle *lh, + __u64 flags, int result); int mdt_hsm_attr_set(struct mdt_thread_info *info, struct mdt_object *obj, const struct md_hsm *mh); @@ -823,13 +955,19 @@ extern const struct file_operations mdt_hsm_actions_fops; void dump_llog_agent_req_rec(const char *prefix, const struct llog_agent_req_rec *larr); int cdt_llog_process(const struct lu_env *env, struct mdt_device *mdt, - llog_cb_t cb, void *data); + llog_cb_t cb, void *data, u32 start_cat_idx, + u32 start_rec_idx, int rw); int mdt_agent_record_add(const struct lu_env *env, struct mdt_device *mdt, - __u64 compound_id, __u32 archive_id, - __u64 flags, struct hsm_action_item *hai); -int mdt_agent_record_update(const struct lu_env *env, - struct mdt_device *mdt, __u64 *cookies, - int cookies_count, enum agent_req_status status); + __u32 archive_id, __u64 flags, + struct hsm_action_item *hai); +int mdt_agent_record_update(const struct lu_env *env, struct mdt_device *mdt, + struct hsm_record_update *updates, + unsigned int updates_count); +void cdt_agent_record_hash_add(struct coordinator *cdt, u64 cookie, u32 cat_idt, + u32 rec_idx); +void cdt_agent_record_hash_lookup(struct coordinator *cdt, u64 cookie, + u32 *cat_idt, u32 *rec_idx); +void cdt_agent_record_hash_del(struct coordinator *cdt, u64 cookie); /* mdt/mdt_hsm_cdt_agent.c */ extern const struct file_operations mdt_hsm_agent_fops; @@ -848,21 +986,23 @@ int mdt_hsm_find_best_agent(struct coordinator *cdt, __u32 archive, struct obd_uuid *uuid); int mdt_hsm_agent_send(struct mdt_thread_info *mti, struct hsm_action_list *hal, bool purge); -int mdt_hsm_coordinator_update(struct mdt_thread_info *mti, - struct hsm_progress_kernel *pgs); /* mdt/mdt_hsm_cdt_client.c */ int mdt_hsm_add_actions(struct mdt_thread_info *info, struct hsm_action_list *hal); -int mdt_hsm_get_actions(struct mdt_thread_info *mti, - struct hsm_action_list *hal); +int mdt_hsm_get_action(struct mdt_thread_info *mti, + const struct lu_fid *fid, + enum hsm_copytool_action *action, + enum agent_req_status *status, + struct hsm_extent *extent); bool mdt_hsm_restore_is_running(struct mdt_thread_info *mti, const struct lu_fid *fid); /* mdt/mdt_hsm_cdt_requests.c */ extern struct cfs_hash_ops cdt_request_cookie_hash_ops; +extern struct cfs_hash_ops cdt_agent_record_hash_ops; extern const struct file_operations mdt_hsm_active_requests_fops; void dump_requests(char *prefix, struct coordinator *cdt); -struct cdt_agent_req *mdt_cdt_alloc_request(__u64 compound_id, __u32 archive_id, - __u64 flags, struct obd_uuid *uuid, +struct cdt_agent_req *mdt_cdt_alloc_request(__u32 archive_id, __u64 flags, + struct obd_uuid *uuid, struct hsm_action_item *hai); void mdt_cdt_free_request(struct cdt_agent_req *car); int mdt_cdt_add_request(struct coordinator *cdt, struct cdt_agent_req *new_car); @@ -876,13 +1016,26 @@ int mdt_cdt_remove_request(struct coordinator *cdt, __u64 cookie); /* mdt/mdt_coordinator.c */ void mdt_hsm_dump_hal(int level, const char *prefix, struct hsm_action_list *hal); -struct cdt_restore_handle *mdt_hsm_restore_hdl_find(struct coordinator *cdt, - const struct lu_fid *fid); +int cdt_restore_handle_add(struct mdt_thread_info *mti, struct coordinator *cdt, + const struct lu_fid *fid, + const struct hsm_extent *he); +struct cdt_restore_handle *cdt_restore_handle_find(struct coordinator *cdt, + const struct lu_fid *fid); +void cdt_restore_handle_del(struct mdt_thread_info *mti, + struct coordinator *cdt, const struct lu_fid *fid); /* coordinator management */ int mdt_hsm_cdt_init(struct mdt_device *mdt); int mdt_hsm_cdt_stop(struct mdt_device *mdt); int mdt_hsm_cdt_fini(struct mdt_device *mdt); -int mdt_hsm_cdt_wakeup(struct mdt_device *mdt); + +/* + * Signal the coordinator has work to do + * \param cdt [IN] coordinator + */ +static inline void mdt_hsm_cdt_event(struct coordinator *cdt) +{ + cdt->cdt_event = true; +} /* coordinator control /proc interface */ ssize_t mdt_hsm_cdt_control_seq_write(struct file *file, @@ -903,8 +1056,7 @@ bool mdt_hsm_is_action_compat(const struct hsm_action_item *hai, u32 archive_id, u64 rq_flags, const struct md_hsm *hsm); int mdt_hsm_update_request_state(struct mdt_thread_info *mti, - struct hsm_progress_kernel *pgs, - const int update_record); + struct hsm_progress_kernel *pgs); int mdt_close_swap_layouts(struct mdt_thread_info *info, struct mdt_object *o, struct md_attr *ma); @@ -982,22 +1134,30 @@ static inline int is_identity_get_disabled(struct upcall_cache *cache) int mdt_blocking_ast(struct ldlm_lock*, struct ldlm_lock_desc*, void*, int); +static int mdt_dom_glimpse_ast(struct ldlm_lock *lock, void *reqp) +{ + return -ELDLM_NO_LOCK_DATA; +} + /* Issues dlm lock on passed @ns, @f stores it lock handle into @lh. */ -static inline int mdt_fid_lock(struct ldlm_namespace *ns, +static inline int mdt_fid_lock(const struct lu_env *env, + struct ldlm_namespace *ns, struct lustre_handle *lh, enum ldlm_mode mode, union ldlm_policy_data *policy, const struct ldlm_res_id *res_id, __u64 flags, const __u64 *client_cookie) { int rc; + bool glimpse = policy->l_inodebits.bits & MDS_INODELOCK_DOM; LASSERT(ns != NULL); LASSERT(lh != NULL); - rc = ldlm_cli_enqueue_local(ns, res_id, LDLM_IBITS, policy, + rc = ldlm_cli_enqueue_local(env, ns, res_id, LDLM_IBITS, policy, mode, &flags, mdt_blocking_ast, - ldlm_completion_ast, NULL, NULL, 0, - LVB_T_NONE, client_cookie, lh); + ldlm_completion_ast, + glimpse ? mdt_dom_glimpse_ast : NULL, + NULL, 0, LVB_T_NONE, client_cookie, lh); return rc == ELDLM_OK ? 0 : -EIO; } @@ -1028,15 +1188,28 @@ static inline enum ldlm_mode mdt_mdl_mode2dlm_mode(mdl_mode_t mode) return mdt_dlm_lock_modes[mode]; } +/* mdt_som.c */ +int mdt_set_som(struct mdt_thread_info *info, struct mdt_object *obj, + enum lustre_som_flags flag, __u64 size, __u64 blocks); +int mdt_get_som(struct mdt_thread_info *info, struct mdt_object *obj, + struct md_attr *ma); +int mdt_lsom_downgrade(struct mdt_thread_info *info, struct mdt_object *obj); +int mdt_lsom_update(struct mdt_thread_info *info, struct mdt_object *obj, + bool truncate); + /* mdt_lvb.c */ extern struct ldlm_valblock_ops mdt_lvbo; +int mdt_dom_lvb_is_valid(struct ldlm_resource *res); +int mdt_dom_lvbo_update(const struct lu_env *env, struct ldlm_resource *res, + struct ldlm_lock *lock, struct ptlrpc_request *req, + bool increase_only); -void mdt_enable_cos(struct mdt_device *, int); +void mdt_enable_cos(struct mdt_device *dev, bool enable); int mdt_cos_is_enabled(struct mdt_device *); /* lprocfs stuff */ -enum { - LPROC_MDT_OPEN = 0, +enum mdt_stat_idx { + LPROC_MDT_OPEN, LPROC_MDT_CLOSE, LPROC_MDT_MKNOD, LPROC_MDT_LINK, @@ -1050,10 +1223,14 @@ enum { LPROC_MDT_SETXATTR, LPROC_MDT_STATFS, LPROC_MDT_SYNC, - LPROC_MDT_SAMEDIR_RENAME, - LPROC_MDT_CROSSDIR_RENAME, - LPROC_MDT_LAST, + LPROC_MDT_SAMEDIR_RENAME, + LPROC_MDT_CROSSDIR_RENAME, + LPROC_MDT_IO_READ, + LPROC_MDT_IO_WRITE, + LPROC_MDT_IO_PUNCH, + LPROC_MDT_LAST, }; + void mdt_counter_incr(struct ptlrpc_request *req, int opcode); void mdt_stats_counter_init(struct lprocfs_stats *stats); int mdt_procfs_init(struct mdt_device *mdt, const char *name); @@ -1093,4 +1270,54 @@ static inline char *mdt_req_get_jobid(struct ptlrpc_request *req) return jobid; } +/* MDT IO */ + +#define VALID_FLAGS (LA_TYPE | LA_MODE | LA_SIZE | LA_BLOCKS | \ + LA_BLKSIZE | LA_ATIME | LA_MTIME | LA_CTIME) + +int mdt_obd_preprw(const struct lu_env *env, int cmd, struct obd_export *exp, + struct obdo *oa, int objcount, struct obd_ioobj *obj, + struct niobuf_remote *rnb, int *nr_local, + struct niobuf_local *lnb); + +int mdt_obd_commitrw(const struct lu_env *env, int cmd, struct obd_export *exp, + struct obdo *oa, int objcount, struct obd_ioobj *obj, + struct niobuf_remote *rnb, int npages, + struct niobuf_local *lnb, int old_rc); +int mdt_punch_hdl(struct tgt_session_info *tsi); +int mdt_glimpse_enqueue(struct mdt_thread_info *mti, struct ldlm_namespace *ns, + struct ldlm_lock **lockp, __u64 flags); +int mdt_brw_enqueue(struct mdt_thread_info *info, struct ldlm_namespace *ns, + struct ldlm_lock **lockp, __u64 flags); +int mdt_dom_read_on_open(struct mdt_thread_info *mti, struct mdt_device *mdt, + struct lustre_handle *lh); +void mdt_dom_discard_data(struct mdt_thread_info *info, + const struct lu_fid *fid); +int mdt_dom_disk_lvbo_update(const struct lu_env *env, struct mdt_object *mo, + struct ldlm_resource *res, bool increase_only); +void mdt_dom_obj_lvb_update(const struct lu_env *env, struct mdt_object *mo, + bool increase_only); +int mdt_dom_lvb_alloc(struct ldlm_resource *res); + +static inline bool mdt_dom_check_for_discard(struct mdt_thread_info *mti, + struct mdt_object *mo) +{ + return lu_object_is_dying(&mo->mot_header) && + S_ISREG(lu_object_attr(&mo->mot_obj)); +} + +int mdt_dom_object_size(const struct lu_env *env, struct mdt_device *mdt, + const struct lu_fid *fid, struct mdt_body *mb, + bool dom_lock); +bool mdt_dom_client_has_lock(struct mdt_thread_info *info, + const struct lu_fid *fid); +void mdt_hp_brw(struct tgt_session_info *tsi); +void mdt_hp_punch(struct tgt_session_info *tsi); +int mdt_data_version_get(struct tgt_session_info *tsi); + +/* grants */ +long mdt_grant_connect(const struct lu_env *env, struct obd_export *exp, + u64 want, bool conservative); +extern struct kmem_cache *ldlm_glimpse_work_kmem; + #endif /* _MDT_INTERNAL_H */