4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; If not, see
18 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
20 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
21 * CA 95054 USA or visit www.sun.com if you need additional information or
27 * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
28 * Use is subject to license terms.
30 * Copyright (c) 2011, 2013, Intel Corporation.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
37 #ifndef __LUSTRE_DT_OBJECT_H
38 #define __LUSTRE_DT_OBJECT_H
41 * Sub-class of lu_object with methods common for "data" objects in OST stack.
43 * Data objects behave like regular files: you can read/write them, get and
44 * set their attributes. Implementation of dt interface is supposed to
45 * implement some form of garbage collection, normally reference counting
48 * Examples: osd (lustre/osd) is an implementation of dt interface.
52 #include <obd_support.h>
54 * super-class definitions.
56 #include <lu_object.h>
58 #include <libcfs/libcfs.h>
61 struct proc_dir_entry;
67 struct dt_index_features;
70 struct ldlm_enqueue_info;
73 MNTOPT_USERXATTR = 0x00000001,
74 MNTOPT_ACL = 0x00000002,
77 struct dt_device_param {
78 unsigned ddp_max_name_len;
79 unsigned ddp_max_nlink;
80 unsigned ddp_block_shift;
82 unsigned ddp_max_ea_size;
84 unsigned long long ddp_maxbytes;
85 /* percentage of available space to reserve for grant error margin */
86 int ddp_grant_reserved;
87 /* per-inode space consumption */
89 /* per-fragment grant overhead to be used by client for grant
95 * Per-transaction commit callback function
97 struct dt_txn_commit_cb;
98 typedef void (*dt_cb_t)(struct lu_env *env, struct thandle *th,
99 struct dt_txn_commit_cb *cb, int err);
101 * Special per-transaction callback for cases when just commit callback
102 * is needed and per-device callback are not convenient to use
104 #define TRANS_COMMIT_CB_MAGIC 0xa0a00a0a
105 #define MAX_COMMIT_CB_STR_LEN 32
107 struct dt_txn_commit_cb {
108 cfs_list_t dcb_linkage;
111 char dcb_name[MAX_COMMIT_CB_STR_LEN];
115 * Operations on dt device.
117 struct dt_device_operations {
119 * Return device-wide statistics.
121 int (*dt_statfs)(const struct lu_env *env,
122 struct dt_device *dev, struct obd_statfs *osfs);
124 * Create transaction, described by \a param.
126 struct thandle *(*dt_trans_create)(const struct lu_env *env,
127 struct dt_device *dev);
129 * Start transaction, described by \a param.
131 int (*dt_trans_start)(const struct lu_env *env,
132 struct dt_device *dev, struct thandle *th);
134 * Finish previously started transaction.
136 int (*dt_trans_stop)(const struct lu_env *env, struct dt_device *dev,
139 * Add commit callback to the transaction.
141 int (*dt_trans_cb_add)(struct thandle *th,
142 struct dt_txn_commit_cb *dcb);
144 * Return fid of root index object.
146 int (*dt_root_get)(const struct lu_env *env,
147 struct dt_device *dev, struct lu_fid *f);
149 * Return device configuration data.
151 void (*dt_conf_get)(const struct lu_env *env,
152 const struct dt_device *dev,
153 struct dt_device_param *param);
155 * handling device state, mostly for tests
157 int (*dt_sync)(const struct lu_env *env, struct dt_device *dev);
158 int (*dt_ro)(const struct lu_env *env, struct dt_device *dev);
160 * Start a transaction commit asynchronously
162 * \param env environment
163 * \param dev dt_device to start commit on
165 * \return 0 success, negative value if error
167 int (*dt_commit_async)(const struct lu_env *env,
168 struct dt_device *dev);
170 * Initialize capability context.
172 int (*dt_init_capa_ctxt)(const struct lu_env *env,
173 struct dt_device *dev,
174 int mode, unsigned long timeout,
175 __u32 alg, struct lustre_capa_key *keys);
178 struct dt_index_features {
179 /** required feature flags from enum dt_index_flags */
181 /** minimal required key size */
182 size_t dif_keysize_min;
183 /** maximal required key size, 0 if no limit */
184 size_t dif_keysize_max;
185 /** minimal required record size */
186 size_t dif_recsize_min;
187 /** maximal required record size, 0 if no limit */
188 size_t dif_recsize_max;
189 /** pointer size for record */
/**
 * Feature bits describing what an index supports; each constant occupies
 * its own bit so that several can be OR-ed together.
 */
enum dt_index_flags {
	/** keys of variable size are supported */
	DT_IND_VARKEY	= 0x01,
	/** records of variable size are supported */
	DT_IND_VARREC	= 0x02,
	/** the index can be modified */
	DT_IND_UPDATE	= 0x04,
	/** records with non-unique (duplicate) keys are supported */
	DT_IND_NONUNQ	= 0x08,
	/**
	 * the index supports fixed-size keys sorted in natural numerical
	 * order and is able to return the left-side value when no exact
	 * match is found
	 */
	DT_IND_RANGE	= 0x10,
};
210 * Features, required from index to support file system directories (mapping
213 extern const struct dt_index_features dt_directory_features;
214 extern const struct dt_index_features dt_otable_features;
215 extern const struct dt_index_features dt_lfsck_features;
217 /* index features supported by the accounting objects */
218 extern const struct dt_index_features dt_acct_features;
220 /* index features supported by the quota global indexes */
221 extern const struct dt_index_features dt_quota_glb_features;
223 /* index features supported by the quota slave indexes */
224 extern const struct dt_index_features dt_quota_slv_features;
227 * This is a general purpose dt allocation hint.
228 * It now contains the parent object.
229 * It can contain any allocation hint in the future.
231 struct dt_allocation_hint {
232 struct dt_object *dah_parent;
233 const void *dah_eadata;
239 * object type specifier.
242 enum dt_format_type {
247 /** for special index */
249 /** for symbolic link */
254 * object format specifier.
256 struct dt_object_format {
257 /** type for dt object */
258 enum dt_format_type dof_type;
268 * special index need feature as parameter to create
272 const struct dt_index_features *di_feat;
277 enum dt_format_type dt_mode_to_dft(__u32 mode);
279 typedef __u64 dt_obj_version_t;
281 union ldlm_policy_data;
284 * Per-dt-object operations.
286 struct dt_object_operations {
287 void (*do_read_lock)(const struct lu_env *env,
288 struct dt_object *dt, unsigned role);
289 void (*do_write_lock)(const struct lu_env *env,
290 struct dt_object *dt, unsigned role);
291 void (*do_read_unlock)(const struct lu_env *env,
292 struct dt_object *dt);
293 void (*do_write_unlock)(const struct lu_env *env,
294 struct dt_object *dt);
295 int (*do_write_locked)(const struct lu_env *env,
296 struct dt_object *dt);
298 * Note: following ->do_{x,}attr_{set,get}() operations are very
299 * similar to ->moo_{x,}attr_{set,get}() operations in struct
300 * md_object_operations (see md_object.h). These operations are not in
301 * lu_object_operations, because ->do_{x,}attr_set() versions take
302 * transaction handle as an argument (this transaction is started by
303 * caller). We might factor ->do_{x,}attr_get() into
304 * lu_object_operations, but that would break existing symmetry.
307 int (*do_declare_attr_get)(const struct lu_env *env,
308 struct dt_object *dt,
309 struct lustre_capa *capa);
311 * Return standard attributes.
313 * precondition: lu_object_exists(&dt->do_lu);
315 int (*do_attr_get)(const struct lu_env *env,
316 struct dt_object *dt, struct lu_attr *attr,
317 struct lustre_capa *capa);
319 * Set standard attributes.
321 * precondition: dt_object_exists(dt);
323 int (*do_declare_attr_set)(const struct lu_env *env,
324 struct dt_object *dt,
325 const struct lu_attr *attr,
326 struct thandle *handle);
327 int (*do_attr_set)(const struct lu_env *env,
328 struct dt_object *dt,
329 const struct lu_attr *attr,
330 struct thandle *handle,
331 struct lustre_capa *capa);
333 int (*do_declare_xattr_get)(const struct lu_env *env,
334 struct dt_object *dt,
337 struct lustre_capa *capa);
340 * Return a value of an extended attribute.
342 * precondition: dt_object_exists(dt);
344 int (*do_xattr_get)(const struct lu_env *env, struct dt_object *dt,
345 struct lu_buf *buf, const char *name,
346 struct lustre_capa *capa);
348 * Set value of an extended attribute.
350 * \a fl - flags from enum lu_xattr_flags
352 * precondition: dt_object_exists(dt);
354 int (*do_declare_xattr_set)(const struct lu_env *env,
355 struct dt_object *dt,
356 const struct lu_buf *buf,
357 const char *name, int fl,
358 struct thandle *handle);
359 int (*do_xattr_set)(const struct lu_env *env,
360 struct dt_object *dt, const struct lu_buf *buf,
361 const char *name, int fl, struct thandle *handle,
362 struct lustre_capa *capa);
364 * Delete existing extended attribute.
366 * precondition: dt_object_exists(dt);
368 int (*do_declare_xattr_del)(const struct lu_env *env,
369 struct dt_object *dt,
370 const char *name, struct thandle *handle);
371 int (*do_xattr_del)(const struct lu_env *env,
372 struct dt_object *dt,
373 const char *name, struct thandle *handle,
374 struct lustre_capa *capa);
376 * Place list of existing extended attributes into \a buf (which has
379 * precondition: dt_object_exists(dt);
381 int (*do_xattr_list)(const struct lu_env *env,
382 struct dt_object *dt, struct lu_buf *buf,
383 struct lustre_capa *capa);
385 * Init allocation hint using parent object and child mode.
386 * (1) The \a parent might be NULL if this is a partial creation for
388 * (2) The type of child is in \a child_mode.
389 * (3) The result hint is stored in \a ah;
391 void (*do_ah_init)(const struct lu_env *env,
392 struct dt_allocation_hint *ah,
393 struct dt_object *parent,
394 struct dt_object *child,
397 * Create new object on this device.
399 * precondition: !dt_object_exists(dt);
400 * postcondition: ergo(result == 0, dt_object_exists(dt));
402 int (*do_declare_create)(const struct lu_env *env,
403 struct dt_object *dt,
404 struct lu_attr *attr,
405 struct dt_allocation_hint *hint,
406 struct dt_object_format *dof,
408 int (*do_create)(const struct lu_env *env, struct dt_object *dt,
409 struct lu_attr *attr,
410 struct dt_allocation_hint *hint,
411 struct dt_object_format *dof,
415 * Destroy object on this device
416 * precondition: dt_object_exists(dt);
417 * postcondition: ergo(result == 0, dt_object_exists(dt));
419 int (*do_declare_destroy)(const struct lu_env *env,
420 struct dt_object *dt,
422 int (*do_destroy)(const struct lu_env *env, struct dt_object *dt,
426 * Announce that this object is going to be used as an index. This
427 * operation checks that the object supports indexing operations and
428 * installs appropriate dt_index_operations vector on success.
430 * Also probes for features. Operation is successful if all required
431 * features are supported.
433 int (*do_index_try)(const struct lu_env *env,
434 struct dt_object *dt,
435 const struct dt_index_features *feat);
437 * Add nlink of the object
438 * precondition: dt_object_exists(dt);
440 int (*do_declare_ref_add)(const struct lu_env *env,
441 struct dt_object *dt, struct thandle *th);
442 int (*do_ref_add)(const struct lu_env *env,
443 struct dt_object *dt, struct thandle *th);
445 * Del nlink of the object
446 * precondition: dt_object_exists(dt);
448 int (*do_declare_ref_del)(const struct lu_env *env,
449 struct dt_object *dt, struct thandle *th);
450 int (*do_ref_del)(const struct lu_env *env,
451 struct dt_object *dt, struct thandle *th);
453 struct obd_capa *(*do_capa_get)(const struct lu_env *env,
454 struct dt_object *dt,
455 struct lustre_capa *old,
457 int (*do_object_sync)(const struct lu_env *, struct dt_object *);
459 * Get object info of next level. Currently, only get inode from osd.
460 * This is only used by quota b=16542
461 * precondition: dt_object_exists(dt);
463 int (*do_data_get)(const struct lu_env *env, struct dt_object *dt,
469 int (*do_object_lock)(const struct lu_env *env, struct dt_object *dt,
470 struct lustre_handle *lh,
471 struct ldlm_enqueue_info *einfo,
472 union ldlm_policy_data *policy);
474 int (*do_object_unlock)(const struct lu_env *env, struct dt_object *dt,
475 struct ldlm_enqueue_info *einfo,
476 union ldlm_policy_data *policy);
480 * Per-dt-object operations on "file body".
482 struct dt_body_operations {
484 * precondition: dt_object_exists(dt);
486 ssize_t (*dbo_read)(const struct lu_env *env, struct dt_object *dt,
487 struct lu_buf *buf, loff_t *pos,
488 struct lustre_capa *capa);
490 * precondition: dt_object_exists(dt);
492 ssize_t (*dbo_declare_write)(const struct lu_env *env,
493 struct dt_object *dt,
494 const loff_t size, loff_t pos,
495 struct thandle *handle);
496 ssize_t (*dbo_write)(const struct lu_env *env, struct dt_object *dt,
497 const struct lu_buf *buf, loff_t *pos,
498 struct thandle *handle, struct lustre_capa *capa,
501 * methods for zero-copy IO
505 * precondition: dt_object_exists(dt);
509 * > 0 - number of local buffers prepared
511 int (*dbo_bufs_get)(const struct lu_env *env, struct dt_object *dt,
512 loff_t pos, ssize_t len, struct niobuf_local *lb,
513 int rw, struct lustre_capa *capa);
515 * precondition: dt_object_exists(dt);
517 int (*dbo_bufs_put)(const struct lu_env *env, struct dt_object *dt,
518 struct niobuf_local *lb, int nr);
520 * precondition: dt_object_exists(dt);
522 int (*dbo_write_prep)(const struct lu_env *env, struct dt_object *dt,
523 struct niobuf_local *lb, int nr);
525 * precondition: dt_object_exists(dt);
527 int (*dbo_declare_write_commit)(const struct lu_env *env,
528 struct dt_object *dt,
529 struct niobuf_local *,
530 int, struct thandle *);
532 * precondition: dt_object_exists(dt);
534 int (*dbo_write_commit)(const struct lu_env *env, struct dt_object *dt,
535 struct niobuf_local *, int, struct thandle *);
537 * precondition: dt_object_exists(dt);
539 int (*dbo_read_prep)(const struct lu_env *env, struct dt_object *dt,
540 struct niobuf_local *lnb, int nr);
541 int (*dbo_fiemap_get)(const struct lu_env *env, struct dt_object *dt,
542 struct ll_user_fiemap *fm);
544 * Punch object's content
545 * precondition: regular object, not index
547 int (*dbo_declare_punch)(const struct lu_env *, struct dt_object *,
548 __u64, __u64, struct thandle *th);
549 int (*dbo_punch)(const struct lu_env *env, struct dt_object *dt,
550 __u64 start, __u64 end, struct thandle *th,
551 struct lustre_capa *capa);
555 * Incomplete type of index record.
560 * Incomplete type of index key.
565 * Incomplete type of dt iterator.
570 * Per-dt-object operations on object as index.
572 struct dt_index_operations {
574 * precondition: dt_object_exists(dt);
576 int (*dio_lookup)(const struct lu_env *env, struct dt_object *dt,
577 struct dt_rec *rec, const struct dt_key *key,
578 struct lustre_capa *capa);
580 * precondition: dt_object_exists(dt);
582 int (*dio_declare_insert)(const struct lu_env *env,
583 struct dt_object *dt,
584 const struct dt_rec *rec,
585 const struct dt_key *key,
586 struct thandle *handle);
587 int (*dio_insert)(const struct lu_env *env, struct dt_object *dt,
588 const struct dt_rec *rec, const struct dt_key *key,
589 struct thandle *handle, struct lustre_capa *capa,
592 * precondition: dt_object_exists(dt);
594 int (*dio_declare_delete)(const struct lu_env *env,
595 struct dt_object *dt,
596 const struct dt_key *key,
597 struct thandle *handle);
598 int (*dio_delete)(const struct lu_env *env, struct dt_object *dt,
599 const struct dt_key *key, struct thandle *handle,
600 struct lustre_capa *capa);
606 * Allocate and initialize new iterator.
608 * precondition: dt_object_exists(dt);
610 struct dt_it *(*init)(const struct lu_env *env,
611 struct dt_object *dt,
613 struct lustre_capa *capa);
614 void (*fini)(const struct lu_env *env,
616 int (*get)(const struct lu_env *env,
618 const struct dt_key *key);
619 void (*put)(const struct lu_env *env,
621 int (*next)(const struct lu_env *env,
623 struct dt_key *(*key)(const struct lu_env *env,
624 const struct dt_it *di);
625 int (*key_size)(const struct lu_env *env,
626 const struct dt_it *di);
627 int (*rec)(const struct lu_env *env,
628 const struct dt_it *di,
631 __u64 (*store)(const struct lu_env *env,
632 const struct dt_it *di);
633 int (*load)(const struct lu_env *env,
634 const struct dt_it *di, __u64 hash);
635 int (*key_rec)(const struct lu_env *env,
636 const struct dt_it *di, void* key_rec);
/*
 * "Valid" bits for otable based iteration.
 * NOTE(review): presumably these fill the low 16 bits of the 'attr' word
 * given to the iterator init method -- confirm against the callers.
 */
enum dt_otable_it_valid {
	DOIV_ERROR_HANDLE	= 1 << 0,
	DOIV_DRYRUN		= 1 << 1,
};
645 enum dt_otable_it_flags {
646 /* Exit when fail. */
647 DOIF_FAILOUT = 0x0001,
649 /* Reset iteration position to the device beginning. */
652 /* An upper-layer component uses the iteration. */
653 DOIF_OUTUSED = 0x0004,
655 /* Check only without repairing. */
656 DOIF_DRYRUN = 0x0008,
659 /* otable based iteration needs to use the common DT iteration APIs.
660 * To initialize the iteration, it needs to call dio_it::init() first.
661 * Here is how the otable based iteration should prepare arguments to
662 * call dt_it_ops::init().
664 * For otable based iteration, the 32-bits 'attr' for dt_it_ops::init()
665 * is composed of two parts:
666 * low 16-bits is for valid bits, high 16-bits is for flags bits. */
667 #define DT_OTABLE_IT_FLAGS_SHIFT 16
668 #define DT_OTABLE_IT_FLAGS_MASK 0xffff0000
671 struct lu_device dd_lu_dev;
672 const struct dt_device_operations *dd_ops;
675 * List of dt_txn_callback (see below). This is not protected in any
676 * way, because callbacks are supposed to be added/deleted only during
677 * single-threaded start-up shut-down procedures.
679 cfs_list_t dd_txn_callbacks;
680 unsigned int dd_record_fid_accessed:1;
683 int dt_device_init(struct dt_device *dev, struct lu_device_type *t);
684 void dt_device_fini(struct dt_device *dev);
686 static inline int lu_device_is_dt(const struct lu_device *d)
688 return ergo(d != NULL, d->ld_type->ldt_tags & LU_DEVICE_DT);
691 static inline struct dt_device * lu2dt_dev(struct lu_device *l)
693 LASSERT(lu_device_is_dt(l));
694 return container_of0(l, struct dt_device, dd_lu_dev);
698 struct lu_object do_lu;
699 const struct dt_object_operations *do_ops;
700 const struct dt_body_operations *do_body_ops;
701 const struct dt_index_operations *do_index_ops;
705 * In-core representation of per-device local object OID storage
707 struct local_oid_storage {
708 /* all initialized llog systems on this node linked by this */
711 /* how many handles reference this los */
712 atomic_t los_refcount;
713 struct dt_device *los_dev;
714 struct dt_object *los_obj;
716 /* data used to generate new fids */
717 struct mutex los_id_lock;
722 static inline struct lu_device *dt2lu_dev(struct dt_device *d)
724 return &d->dd_lu_dev;
727 static inline struct dt_object *lu2dt(struct lu_object *l)
729 LASSERT(l == NULL || IS_ERR(l) || lu_device_is_dt(l->lo_dev));
730 return container_of0(l, struct dt_object, do_lu);
733 int dt_object_init(struct dt_object *obj,
734 struct lu_object_header *h, struct lu_device *d);
736 void dt_object_fini(struct dt_object *obj);
738 static inline int dt_object_exists(const struct dt_object *dt)
740 return lu_object_exists(&dt->do_lu);
743 static inline int dt_object_remote(const struct dt_object *dt)
745 return lu_object_remote(&dt->do_lu);
748 static inline struct dt_object *lu2dt_obj(struct lu_object *o)
750 LASSERT(ergo(o != NULL, lu_device_is_dt(o->lo_dev)));
751 return container_of0(o, struct dt_object, do_lu);
754 struct thandle_update {
755 /* In DNE, one transaction can be disassembled into
756 * updates on several different MDTs, and these updates
757 * will be attached to tu_remote_update_list per target.
758 * Only single thread will access the list, no need lock
760 struct list_head tu_remote_update_list;
762 /* sent after or before local transaction */
763 unsigned int tu_sent_after_local_trans:1,
764 tu_only_remote_trans:1;
768 * This is the general purpose transaction handle.
769 * 1. Transaction Life Cycle
770 * This transaction handle is allocated upon starting a new transaction,
771 * and deallocated after this transaction is committed.
772 * 2. Transaction Nesting
773 * We do _NOT_ support nested transaction. So, every thread should only
774 * have one active transaction, and a transaction only belongs to one
775 * thread. The handle is still reference counted via th_refc (see thandle_put()).
776 * 3. Transaction & dt_object locking
777 * dt_object locks should be taken inside transaction.
778 * 4. Transaction & RPC
779 * No RPC request should be issued inside transaction.
782 /** the dt device on which the transactions are executed */
783 struct dt_device *th_dev;
786 /* the size of transaction */
789 /** context for this transaction, tag is LCT_TX_HANDLE */
790 struct lu_context th_ctx;
792 /** additional tags (layers can add in declare) */
795 /** the last operation result in this transaction.
796 * this value is used in recovery */
799 /** whether we need sync commit */
800 unsigned int th_sync:1;
802 /* local transaction, no need to inform other layers */
803 unsigned int th_local:1;
805 struct thandle_update *th_update;
808 static inline void thandle_get(struct thandle *thandle)
810 atomic_inc(&thandle->th_refc);
813 static inline void thandle_put(struct thandle *thandle)
815 if (atomic_dec_and_test(&thandle->th_refc)) {
816 if (thandle->th_update != NULL)
817 OBD_FREE_PTR(thandle->th_update);
818 OBD_FREE(thandle, thandle->th_alloc_size);
822 * Transaction call-backs.
824 * These are invoked by osd (or underlying transaction engine) when
825 * transaction changes state.
827 * Call-backs are used by upper layers to modify transaction parameters and to
828 * perform some actions on each transaction state transition. Typical
829 * example is mdt registering call-back to write into last-received file
830 * before each transaction commit.
832 struct dt_txn_callback {
833 int (*dtc_txn_start)(const struct lu_env *env,
834 struct thandle *txn, void *cookie);
835 int (*dtc_txn_stop)(const struct lu_env *env,
836 struct thandle *txn, void *cookie);
837 void (*dtc_txn_commit)(struct thandle *txn, void *cookie);
840 cfs_list_t dtc_linkage;
843 void dt_txn_callback_add(struct dt_device *dev, struct dt_txn_callback *cb);
844 void dt_txn_callback_del(struct dt_device *dev, struct dt_txn_callback *cb);
846 int dt_txn_hook_start(const struct lu_env *env,
847 struct dt_device *dev, struct thandle *txn);
848 int dt_txn_hook_stop(const struct lu_env *env, struct thandle *txn);
849 void dt_txn_hook_commit(struct thandle *txn);
851 int dt_try_as_dir(const struct lu_env *env, struct dt_object *obj);
854 * Callback function used for parsing path.
855 * \see llo_store_resolve
857 typedef int (*dt_entry_func_t)(const struct lu_env *env,
861 #define DT_MAX_PATH 1024
863 int dt_path_parser(const struct lu_env *env,
864 char *local, dt_entry_func_t entry_func,
868 dt_store_resolve(const struct lu_env *env, struct dt_device *dt,
869 const char *path, struct lu_fid *fid);
871 struct dt_object *dt_store_open(const struct lu_env *env,
872 struct dt_device *dt,
874 const char *filename,
877 struct dt_object *dt_find_or_create(const struct lu_env *env,
878 struct dt_device *dt,
879 const struct lu_fid *fid,
880 struct dt_object_format *dof,
881 struct lu_attr *attr);
883 struct dt_object *dt_locate_at(const struct lu_env *env,
884 struct dt_device *dev,
885 const struct lu_fid *fid,
886 struct lu_device *top_dev,
887 const struct lu_object_conf *conf);
889 static inline struct dt_object *
890 dt_locate(const struct lu_env *env, struct dt_device *dev,
891 const struct lu_fid *fid)
893 return dt_locate_at(env, dev, fid,
894 dev->dd_lu_dev.ld_site->ls_top_dev, NULL);
897 int local_oid_storage_init(const struct lu_env *env, struct dt_device *dev,
898 const struct lu_fid *first_fid,
899 struct local_oid_storage **los);
900 void local_oid_storage_fini(const struct lu_env *env,
901 struct local_oid_storage *los);
902 int local_object_fid_generate(const struct lu_env *env,
903 struct local_oid_storage *los,
905 int local_object_declare_create(const struct lu_env *env,
906 struct local_oid_storage *los,
908 struct lu_attr *attr,
909 struct dt_object_format *dof,
911 int local_object_create(const struct lu_env *env,
912 struct local_oid_storage *los,
914 struct lu_attr *attr, struct dt_object_format *dof,
916 struct dt_object *local_file_find_or_create(const struct lu_env *env,
917 struct local_oid_storage *los,
918 struct dt_object *parent,
919 const char *name, __u32 mode);
920 struct dt_object *local_file_find_or_create_with_fid(const struct lu_env *env,
921 struct dt_device *dt,
922 const struct lu_fid *fid,
923 struct dt_object *parent,
927 local_index_find_or_create(const struct lu_env *env,
928 struct local_oid_storage *los,
929 struct dt_object *parent,
930 const char *name, __u32 mode,
931 const struct dt_index_features *ft);
933 local_index_find_or_create_with_fid(const struct lu_env *env,
934 struct dt_device *dt,
935 const struct lu_fid *fid,
936 struct dt_object *parent,
937 const char *name, __u32 mode,
938 const struct dt_index_features *ft);
939 int local_object_unlink(const struct lu_env *env, struct dt_device *dt,
940 struct dt_object *parent, const char *name);
942 static inline int dt_object_lock(const struct lu_env *env,
943 struct dt_object *o, struct lustre_handle *lh,
944 struct ldlm_enqueue_info *einfo,
945 union ldlm_policy_data *policy)
948 LASSERT(o->do_ops != NULL);
949 LASSERT(o->do_ops->do_object_lock != NULL);
950 return o->do_ops->do_object_lock(env, o, lh, einfo, policy);
953 static inline int dt_object_unlock(const struct lu_env *env,
955 struct ldlm_enqueue_info *einfo,
956 union ldlm_policy_data *policy)
959 LASSERT(o->do_ops != NULL);
960 LASSERT(o->do_ops->do_object_unlock != NULL);
961 return o->do_ops->do_object_unlock(env, o, einfo, policy);
964 int dt_lookup_dir(const struct lu_env *env, struct dt_object *dir,
965 const char *name, struct lu_fid *fid);
967 static inline int dt_object_sync(const struct lu_env *env,
972 LASSERT(o->do_ops->do_object_sync);
973 return o->do_ops->do_object_sync(env, o);
976 int dt_declare_version_set(const struct lu_env *env, struct dt_object *o,
978 void dt_version_set(const struct lu_env *env, struct dt_object *o,
979 dt_obj_version_t version, struct thandle *th);
980 dt_obj_version_t dt_version_get(const struct lu_env *env, struct dt_object *o);
983 int dt_read(const struct lu_env *env, struct dt_object *dt,
984 struct lu_buf *buf, loff_t *pos);
985 int dt_record_read(const struct lu_env *env, struct dt_object *dt,
986 struct lu_buf *buf, loff_t *pos);
987 int dt_record_write(const struct lu_env *env, struct dt_object *dt,
988 const struct lu_buf *buf, loff_t *pos, struct thandle *th);
989 typedef int (*dt_index_page_build_t)(const struct lu_env *env,
990 union lu_page *lp, int nob,
991 const struct dt_it_ops *iops,
992 struct dt_it *it, __u32 attr, void *arg);
993 int dt_index_walk(const struct lu_env *env, struct dt_object *obj,
994 const struct lu_rdpg *rdpg, dt_index_page_build_t filler,
996 int dt_index_read(const struct lu_env *env, struct dt_device *dev,
997 struct idx_info *ii, const struct lu_rdpg *rdpg);
999 static inline struct thandle *dt_trans_create(const struct lu_env *env,
1000 struct dt_device *d)
1002 LASSERT(d->dd_ops->dt_trans_create);
1003 return d->dd_ops->dt_trans_create(env, d);
1006 static inline int dt_trans_start(const struct lu_env *env,
1007 struct dt_device *d, struct thandle *th)
1009 LASSERT(d->dd_ops->dt_trans_start);
1010 return d->dd_ops->dt_trans_start(env, d, th);
1013 /* for this transaction hooks shouldn't be called */
1014 static inline int dt_trans_start_local(const struct lu_env *env,
1015 struct dt_device *d, struct thandle *th)
1017 LASSERT(d->dd_ops->dt_trans_start);
1019 return d->dd_ops->dt_trans_start(env, d, th);
1022 static inline int dt_trans_stop(const struct lu_env *env,
1023 struct dt_device *d, struct thandle *th)
1025 LASSERT(d->dd_ops->dt_trans_stop);
1026 return d->dd_ops->dt_trans_stop(env, d, th);
1029 static inline int dt_trans_cb_add(struct thandle *th,
1030 struct dt_txn_commit_cb *dcb)
1032 LASSERT(th->th_dev->dd_ops->dt_trans_cb_add);
1033 dcb->dcb_magic = TRANS_COMMIT_CB_MAGIC;
1034 return th->th_dev->dd_ops->dt_trans_cb_add(th, dcb);
1039 static inline int dt_declare_record_write(const struct lu_env *env,
1040 struct dt_object *dt,
1041 int size, loff_t pos,
1046 LASSERTF(dt != NULL, "dt is NULL when we want to write record\n");
1047 LASSERT(th != NULL);
1048 LASSERT(dt->do_body_ops);
1049 LASSERT(dt->do_body_ops->dbo_declare_write);
1050 rc = dt->do_body_ops->dbo_declare_write(env, dt, size, pos, th);
1054 static inline int dt_declare_create(const struct lu_env *env,
1055 struct dt_object *dt,
1056 struct lu_attr *attr,
1057 struct dt_allocation_hint *hint,
1058 struct dt_object_format *dof,
1062 LASSERT(dt->do_ops);
1063 LASSERT(dt->do_ops->do_declare_create);
1064 return dt->do_ops->do_declare_create(env, dt, attr, hint, dof, th);
1067 static inline int dt_create(const struct lu_env *env,
1068 struct dt_object *dt,
1069 struct lu_attr *attr,
1070 struct dt_allocation_hint *hint,
1071 struct dt_object_format *dof,
1075 LASSERT(dt->do_ops);
1076 LASSERT(dt->do_ops->do_create);
1077 return dt->do_ops->do_create(env, dt, attr, hint, dof, th);
1080 static inline int dt_declare_destroy(const struct lu_env *env,
1081 struct dt_object *dt,
1085 LASSERT(dt->do_ops);
1086 LASSERT(dt->do_ops->do_declare_destroy);
1087 return dt->do_ops->do_declare_destroy(env, dt, th);
1090 static inline int dt_destroy(const struct lu_env *env,
1091 struct dt_object *dt,
1095 LASSERT(dt->do_ops);
1096 LASSERT(dt->do_ops->do_destroy);
1097 return dt->do_ops->do_destroy(env, dt, th);
1100 static inline void dt_read_lock(const struct lu_env *env,
1101 struct dt_object *dt,
1105 LASSERT(dt->do_ops);
1106 LASSERT(dt->do_ops->do_read_lock);
1107 dt->do_ops->do_read_lock(env, dt, role);
1110 static inline void dt_write_lock(const struct lu_env *env,
1111 struct dt_object *dt,
1115 LASSERT(dt->do_ops);
1116 LASSERT(dt->do_ops->do_write_lock);
1117 dt->do_ops->do_write_lock(env, dt, role);
1120 static inline void dt_read_unlock(const struct lu_env *env,
1121 struct dt_object *dt)
1124 LASSERT(dt->do_ops);
1125 LASSERT(dt->do_ops->do_read_unlock);
1126 dt->do_ops->do_read_unlock(env, dt);
1129 static inline void dt_write_unlock(const struct lu_env *env,
1130 struct dt_object *dt)
1133 LASSERT(dt->do_ops);
1134 LASSERT(dt->do_ops->do_write_unlock);
1135 dt->do_ops->do_write_unlock(env, dt);
1138 static inline int dt_write_locked(const struct lu_env *env,
1139 struct dt_object *dt)
1142 LASSERT(dt->do_ops);
1143 LASSERT(dt->do_ops->do_write_locked);
1144 return dt->do_ops->do_write_locked(env, dt);
1147 static inline int dt_declare_attr_get(const struct lu_env *env,
1148 struct dt_object *dt,
1149 struct lustre_capa *capa)
1152 LASSERT(dt->do_ops);
1153 LASSERT(dt->do_ops->do_declare_attr_get);
1154 return dt->do_ops->do_declare_attr_get(env, dt, capa);
1157 static inline int dt_attr_get(const struct lu_env *env, struct dt_object *dt,
1158 struct lu_attr *la, void *arg)
1161 LASSERT(dt->do_ops);
1162 LASSERT(dt->do_ops->do_attr_get);
1163 return dt->do_ops->do_attr_get(env, dt, la, arg);
1166 static inline int dt_declare_attr_set(const struct lu_env *env,
1167 struct dt_object *dt,
1168 const struct lu_attr *la,
1172 LASSERT(dt->do_ops);
1173 LASSERT(dt->do_ops->do_declare_attr_set);
1174 return dt->do_ops->do_declare_attr_set(env, dt, la, th);
/**
 * Forward to the object's do_attr_set method with \a env, \a dt, \a la,
 * \a th and \a capa, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1177 static inline int dt_attr_set(const struct lu_env *env, struct dt_object *dt,
1178 const struct lu_attr *la, struct thandle *th,
1179 struct lustre_capa *capa)
1182 LASSERT(dt->do_ops);
1183 LASSERT(dt->do_ops->do_attr_set);
1184 return dt->do_ops->do_attr_set(env, dt, la, th, capa);
/**
 * Forward to the object's do_declare_ref_add method with \a env, \a dt and
 * \a th, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1187 static inline int dt_declare_ref_add(const struct lu_env *env,
1188 struct dt_object *dt, struct thandle *th)
1191 LASSERT(dt->do_ops);
1192 LASSERT(dt->do_ops->do_declare_ref_add);
1193 return dt->do_ops->do_declare_ref_add(env, dt, th);
/**
 * Forward to the object's do_ref_add method with \a env, \a dt and \a th,
 * and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1196 static inline int dt_ref_add(const struct lu_env *env,
1197 struct dt_object *dt, struct thandle *th)
1200 LASSERT(dt->do_ops);
1201 LASSERT(dt->do_ops->do_ref_add);
1202 return dt->do_ops->do_ref_add(env, dt, th);
/**
 * Forward to the object's do_declare_ref_del method with \a env, \a dt and
 * \a th, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1205 static inline int dt_declare_ref_del(const struct lu_env *env,
1206 struct dt_object *dt, struct thandle *th)
1209 LASSERT(dt->do_ops);
1210 LASSERT(dt->do_ops->do_declare_ref_del);
1211 return dt->do_ops->do_declare_ref_del(env, dt, th);
/**
 * Forward to the object's do_ref_del method with \a env, \a dt and \a th,
 * and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1214 static inline int dt_ref_del(const struct lu_env *env,
1215 struct dt_object *dt, struct thandle *th)
1218 LASSERT(dt->do_ops);
1219 LASSERT(dt->do_ops->do_ref_del);
1220 return dt->do_ops->do_ref_del(env, dt, th);
/**
 * Forward to the object's do_capa_get method with \a env, \a dt, \a old
 * and \a opc, and return the struct obd_capa pointer it yields.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1223 static inline struct obd_capa *dt_capa_get(const struct lu_env *env,
1224 struct dt_object *dt,
1225 struct lustre_capa *old, __u64 opc)
1228 LASSERT(dt->do_ops);
1229 LASSERT(dt->do_ops->do_capa_get);
1230 return dt->do_ops->do_capa_get(env, dt, old, opc);
/**
 * Forward to the object's dbo_bufs_get body method and return its int
 * result unchanged.
 *
 * Only the offset and len fields of \a rnb are handed to the method; the
 * remaining arguments (\a lnb, \a rw, \a capa) are passed through as-is.
 * d->do_body_ops and the method pointer are asserted to be set first.
 */
1233 static inline int dt_bufs_get(const struct lu_env *env, struct dt_object *d,
1234 struct niobuf_remote *rnb,
1235 struct niobuf_local *lnb, int rw,
1236 struct lustre_capa *capa)
1239 LASSERT(d->do_body_ops);
1240 LASSERT(d->do_body_ops->dbo_bufs_get);
1241 return d->do_body_ops->dbo_bufs_get(env, d, rnb->offset,
1242 rnb->len, lnb, rw, capa);
/**
 * Forward to the object's dbo_bufs_put body method with \a env, \a d,
 * \a lnb and \a n, and return its int result unchanged.
 *
 * d->do_body_ops and the method pointer are asserted to be set first.
 */
1245 static inline int dt_bufs_put(const struct lu_env *env, struct dt_object *d,
1246 struct niobuf_local *lnb, int n)
1249 LASSERT(d->do_body_ops);
1250 LASSERT(d->do_body_ops->dbo_bufs_put);
1251 return d->do_body_ops->dbo_bufs_put(env, d, lnb, n);
/**
 * Forward to the object's dbo_write_prep body method with \a env, \a d,
 * \a lnb and \a n, and return its int result unchanged.
 *
 * d->do_body_ops and the method pointer are asserted to be set first.
 */
1254 static inline int dt_write_prep(const struct lu_env *env, struct dt_object *d,
1255 struct niobuf_local *lnb, int n)
1258 LASSERT(d->do_body_ops);
1259 LASSERT(d->do_body_ops->dbo_write_prep);
1260 return d->do_body_ops->dbo_write_prep(env, d, lnb, n);
1263 static inline int dt_declare_write_commit(const struct lu_env *env,
1264 struct dt_object *d,
1265 struct niobuf_local *lnb,
1266 int n, struct thandle *th)
1268 LASSERTF(d != NULL, "dt is NULL when we want to declare write\n");
1269 LASSERT(th != NULL);
1270 return d->do_body_ops->dbo_declare_write_commit(env, d, lnb, n, th);
/**
 * Forward to the object's dbo_write_commit body method with \a env, \a d,
 * \a lnb, \a n and \a th, and return its int result unchanged.
 *
 * d->do_body_ops and the method pointer are asserted to be set first.
 */
1274 static inline int dt_write_commit(const struct lu_env *env,
1275 struct dt_object *d, struct niobuf_local *lnb,
1276 int n, struct thandle *th)
1279 LASSERT(d->do_body_ops);
1280 LASSERT(d->do_body_ops->dbo_write_commit);
1281 return d->do_body_ops->dbo_write_commit(env, d, lnb, n, th);
/**
 * Forward to the object's dbo_read_prep body method with \a env, \a d,
 * \a lnb and \a n, and return its int result unchanged.
 *
 * d->do_body_ops and the method pointer are asserted to be set first.
 */
1284 static inline int dt_read_prep(const struct lu_env *env, struct dt_object *d,
1285 struct niobuf_local *lnb, int n)
1288 LASSERT(d->do_body_ops);
1289 LASSERT(d->do_body_ops->dbo_read_prep);
1290 return d->do_body_ops->dbo_read_prep(env, d, lnb, n);
/**
 * Forward to the object's dbo_declare_punch body method with \a env,
 * \a dt, \a start, \a end and \a th, and return its int result unchanged.
 *
 * dt->do_body_ops and the method pointer are asserted to be set first.
 */
1293 static inline int dt_declare_punch(const struct lu_env *env,
1294 struct dt_object *dt, __u64 start,
1295 __u64 end, struct thandle *th)
1298 LASSERT(dt->do_body_ops);
1299 LASSERT(dt->do_body_ops->dbo_declare_punch);
1300 return dt->do_body_ops->dbo_declare_punch(env, dt, start, end, th);
/**
 * Forward to the object's dbo_punch body method with \a env, \a dt,
 * \a start, \a end, \a th and \a capa, and return its int result unchanged.
 *
 * dt->do_body_ops and the method pointer are asserted to be set first.
 * NOTE(review): \a start and \a end presumably delimit the byte range to
 * punch -- confirm units and inclusivity against the implementations.
 */
1303 static inline int dt_punch(const struct lu_env *env, struct dt_object *dt,
1304 __u64 start, __u64 end, struct thandle *th,
1305 struct lustre_capa *capa)
1308 LASSERT(dt->do_body_ops);
1309 LASSERT(dt->do_body_ops->dbo_punch);
1310 return dt->do_body_ops->dbo_punch(env, dt, start, end, th, capa);
/**
 * Forward to the object's dbo_fiemap_get body method with \a env, \a d and
 * \a fm, and return its int result unchanged.
 *
 * Unlike most wrappers in this header, a missing body-ops table or a
 * missing dbo_fiemap_get entry is tested with a plain conditional rather
 * than an assertion, so both cases are handled at run time.
 * NOTE(review): the statements taken on those two branches are presumably
 * error returns -- confirm the exact codes.
 */
1313 static inline int dt_fiemap_get(const struct lu_env *env, struct dt_object *d,
1314 struct ll_user_fiemap *fm)
1317 if (d->do_body_ops == NULL)
1319 if (d->do_body_ops->dbo_fiemap_get == NULL)
1321 return d->do_body_ops->dbo_fiemap_get(env, d, fm);
/**
 * Forward to the device's dt_statfs method with \a env, \a dev and
 * \a osfs, and return its int result unchanged.
 *
 * dev->dd_ops and the method pointer are asserted to be set first.
 */
1324 static inline int dt_statfs(const struct lu_env *env, struct dt_device *dev,
1325 struct obd_statfs *osfs)
1328 LASSERT(dev->dd_ops);
1329 LASSERT(dev->dd_ops->dt_statfs);
1330 return dev->dd_ops->dt_statfs(env, dev, osfs);
/**
 * Forward to the device's dt_root_get method with \a env, \a dev and \a f,
 * and return its int result unchanged.
 *
 * dev->dd_ops and the method pointer are asserted to be set first.
 */
1333 static inline int dt_root_get(const struct lu_env *env, struct dt_device *dev,
1337 LASSERT(dev->dd_ops);
1338 LASSERT(dev->dd_ops->dt_root_get);
1339 return dev->dd_ops->dt_root_get(env, dev, f);
1342 static inline void dt_conf_get(const struct lu_env *env,
1343 const struct dt_device *dev,
1344 struct dt_device_param *param)
1347 LASSERT(dev->dd_ops);
1348 LASSERT(dev->dd_ops->dt_conf_get);
1349 return dev->dd_ops->dt_conf_get(env, dev, param);
/**
 * Forward to the device's dt_sync method with \a env and \a dev, and
 * return its int result unchanged.
 *
 * dev->dd_ops and the method pointer are asserted to be set first.
 */
1352 static inline int dt_sync(const struct lu_env *env, struct dt_device *dev)
1355 LASSERT(dev->dd_ops);
1356 LASSERT(dev->dd_ops->dt_sync);
1357 return dev->dd_ops->dt_sync(env, dev);
/**
 * Forward to the device's dt_ro method with \a env and \a dev, and return
 * its int result unchanged.
 *
 * dev->dd_ops and the method pointer are asserted to be set first.
 * NOTE(review): the name suggests switching the device to read-only --
 * confirm against the dt_ro implementations.
 */
1360 static inline int dt_ro(const struct lu_env *env, struct dt_device *dev)
1363 LASSERT(dev->dd_ops);
1364 LASSERT(dev->dd_ops->dt_ro);
1365 return dev->dd_ops->dt_ro(env, dev);
/**
 * Forward to the object's dio_declare_insert index method with \a env,
 * \a dt, \a rec, \a key and \a th, and return its int result unchanged.
 *
 * dt->do_index_ops and the method pointer are asserted to be set first.
 */
1368 static inline int dt_declare_insert(const struct lu_env *env,
1369 struct dt_object *dt,
1370 const struct dt_rec *rec,
1371 const struct dt_key *key,
1375 LASSERT(dt->do_index_ops);
1376 LASSERT(dt->do_index_ops->dio_declare_insert);
1377 return dt->do_index_ops->dio_declare_insert(env, dt, rec, key, th);
/**
 * Forward to the object's dio_insert index method and return its int
 * result unchanged.
 *
 * \a env, \a dt, \a rec, \a key and \a th lead the argument list of the
 * call; the remaining arguments follow on the continuation of the call.
 * dt->do_index_ops and the method pointer are asserted to be set first.
 */
1380 static inline int dt_insert(const struct lu_env *env,
1381 struct dt_object *dt,
1382 const struct dt_rec *rec,
1383 const struct dt_key *key,
1385 struct lustre_capa *capa,
1389 LASSERT(dt->do_index_ops);
1390 LASSERT(dt->do_index_ops->dio_insert);
1391 return dt->do_index_ops->dio_insert(env, dt, rec, key, th,
/**
 * Forward to the object's do_declare_xattr_del method with \a env, \a dt,
 * \a name and \a th, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1395 static inline int dt_declare_xattr_del(const struct lu_env *env,
1396 struct dt_object *dt,
1401 LASSERT(dt->do_ops);
1402 LASSERT(dt->do_ops->do_declare_xattr_del);
1403 return dt->do_ops->do_declare_xattr_del(env, dt, name, th);
/**
 * Forward to the object's do_xattr_del method with \a env, \a dt, \a name,
 * \a th and \a capa, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1406 static inline int dt_xattr_del(const struct lu_env *env,
1407 struct dt_object *dt, const char *name,
1409 struct lustre_capa *capa)
1412 LASSERT(dt->do_ops);
1413 LASSERT(dt->do_ops->do_xattr_del);
1414 return dt->do_ops->do_xattr_del(env, dt, name, th, capa);
/**
 * Forward to the object's do_declare_xattr_set method with \a env, \a dt,
 * \a buf, \a name, \a fl and \a th, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1417 static inline int dt_declare_xattr_set(const struct lu_env *env,
1418 struct dt_object *dt,
1419 const struct lu_buf *buf,
1420 const char *name, int fl,
1424 LASSERT(dt->do_ops);
1425 LASSERT(dt->do_ops->do_declare_xattr_set);
1426 return dt->do_ops->do_declare_xattr_set(env, dt, buf, name, fl, th);
/**
 * Forward to the object's do_xattr_set method with \a env, \a dt, \a buf,
 * \a name, \a fl, \a th and \a capa, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 * \a buf is const here, i.e. this wrapper treats it as input only.
 */
1429 static inline int dt_xattr_set(const struct lu_env *env,
1430 struct dt_object *dt, const struct lu_buf *buf,
1431 const char *name, int fl, struct thandle *th,
1432 struct lustre_capa *capa)
1435 LASSERT(dt->do_ops);
1436 LASSERT(dt->do_ops->do_xattr_set);
1437 return dt->do_ops->do_xattr_set(env, dt, buf, name, fl, th, capa);
/**
 * Forward to the object's do_declare_xattr_get method with \a env, \a dt,
 * \a buf, \a name and \a capa, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1440 static inline int dt_declare_xattr_get(const struct lu_env *env,
1441 struct dt_object *dt,
1444 struct lustre_capa *capa)
1447 LASSERT(dt->do_ops);
1448 LASSERT(dt->do_ops->do_declare_xattr_get);
1449 return dt->do_ops->do_declare_xattr_get(env, dt, buf, name, capa);
/**
 * Forward to the object's do_xattr_get method with \a env, \a dt, \a buf,
 * \a name and \a capa, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 * \a buf is non-const, so it is presumably where the attribute value is
 * delivered -- confirm against the do_xattr_get implementations.
 */
1452 static inline int dt_xattr_get(const struct lu_env *env,
1453 struct dt_object *dt, struct lu_buf *buf,
1454 const char *name, struct lustre_capa *capa)
1457 LASSERT(dt->do_ops);
1458 LASSERT(dt->do_ops->do_xattr_get);
1459 return dt->do_ops->do_xattr_get(env, dt, buf, name, capa);
/**
 * Forward to the object's do_xattr_list method with \a env, \a dt, \a buf
 * and \a capa, and return its int result unchanged.
 *
 * dt->do_ops and the method pointer are asserted to be set first.
 */
1462 static inline int dt_xattr_list(const struct lu_env *env,
1463 struct dt_object *dt, struct lu_buf *buf,
1464 struct lustre_capa *capa)
1467 LASSERT(dt->do_ops);
1468 LASSERT(dt->do_ops->do_xattr_list);
1469 return dt->do_ops->do_xattr_list(env, dt, buf, capa);
/**
 * Forward to the object's dio_declare_delete index method with \a env,
 * \a dt, \a key and \a th, and return its int result unchanged.
 *
 * dt->do_index_ops and the method pointer are asserted to be set first.
 */
1472 static inline int dt_declare_delete(const struct lu_env *env,
1473 struct dt_object *dt,
1474 const struct dt_key *key,
1478 LASSERT(dt->do_index_ops);
1479 LASSERT(dt->do_index_ops->dio_declare_delete);
1480 return dt->do_index_ops->dio_declare_delete(env, dt, key, th);
/**
 * Forward to the object's dio_delete index method with \a env, \a dt,
 * \a key, \a th and \a capa, and return its int result unchanged.
 *
 * dt->do_index_ops and the method pointer are asserted to be set first.
 */
1483 static inline int dt_delete(const struct lu_env *env,
1484 struct dt_object *dt,
1485 const struct dt_key *key,
1487 struct lustre_capa *capa)
1490 LASSERT(dt->do_index_ops);
1491 LASSERT(dt->do_index_ops->dio_delete);
1492 return dt->do_index_ops->dio_delete(env, dt, key, th, capa);
/**
 * Forward to the device's dt_commit_async method with \a env and \a dev,
 * and return its int result unchanged.
 *
 * dev->dd_ops and the method pointer are asserted to be set first.
 */
1495 static inline int dt_commit_async(const struct lu_env *env,
1496 struct dt_device *dev)
1499 LASSERT(dev->dd_ops);
1500 LASSERT(dev->dd_ops->dt_commit_async);
1501 return dev->dd_ops->dt_commit_async(env, dev);
/**
 * Forward to the device's dt_init_capa_ctxt method with \a env, \a dev,
 * \a mode, \a timeout, \a alg and \a keys, and return its int result
 * unchanged.
 *
 * dev->dd_ops and the method pointer are asserted to be set first.
 */
1504 static inline int dt_init_capa_ctxt(const struct lu_env *env,
1505 struct dt_device *dev,
1506 int mode, unsigned long timeout,
1507 __u32 alg, struct lustre_capa_key *keys)
1510 LASSERT(dev->dd_ops);
1511 LASSERT(dev->dd_ops->dt_init_capa_ctxt);
1512 return dev->dd_ops->dt_init_capa_ctxt(env, dev, mode,
1513 timeout, alg, keys);
/**
 * Look \a key up through the object's dio_lookup index method.
 *
 * dt->do_index_ops and the method pointer are asserted to be set first.
 * The method is called with \a env, \a dt, \a rec, \a key and \a capa and
 * its result is stored in the local ret rather than returned directly.
 * NOTE(review): ret is presumably post-processed before being returned --
 * confirm the mapping callers can rely on.
 */
1516 static inline int dt_lookup(const struct lu_env *env,
1517 struct dt_object *dt,
1519 const struct dt_key *key,
1520 struct lustre_capa *capa)
1525 LASSERT(dt->do_index_ops);
1526 LASSERT(dt->do_index_ops->dio_lookup);
1528 ret = dt->do_index_ops->dio_lookup(env, dt, rec, key, capa);
/*
 * Unsigned constant: 0x80000000 plus one day in seconds (24 * 3600),
 * i.e. 0x80015180.
 * NOTE(review): the name suggests a sentinel timestamp tied to ticket
 * LU-221 -- confirm the intended use against its callers.
 */
1536 #define LU221_BAD_TIME (0x80000000U + 24 * 3600)
/**
 * Bundle of three pointers: a FID, a dt device and a dt object.
 * Embedded in struct dt_thread_info as dti_dfh.
 * NOTE(review): presumably used as the hint argument of an object lookup
 * helper -- confirm which side fills in each member.
 */
1538 struct dt_find_hint {
1539 struct lu_fid *dfh_fid;
1540 struct dt_device *dfh_dt;
1541 struct dt_object *dfh_o;
/**
 * Data block that dt_info() retrieves from an environment's context
 * through dt_key.
 *
 * It holds one instance each of a DT_MAX_PATH-sized character buffer, a
 * find hint, an attribute set, a FID, an object format, LMA attributes, a
 * buffer descriptor and an object configuration.
 * NOTE(review): these look like preallocated temporaries that keep large
 * objects off the stack -- confirm against the users of dt_info().
 */
1544 struct dt_thread_info {
1545 char dti_buf[DT_MAX_PATH];
1546 struct dt_find_hint dti_dfh;
1547 struct lu_attr dti_attr;
1548 struct lu_fid dti_fid;
1549 struct dt_object_format dti_dof;
1550 struct lustre_mdt_attrs dti_lma;
1551 struct lu_buf dti_lb;
1552 struct lu_object_conf dti_conf;
/* Context key that dt_info() passes to lu_context_key_get(); defined elsewhere. */
1556 extern struct lu_context_key dt_key;
/**
 * Fetch the struct dt_thread_info registered under dt_key in the context
 * of \a env (env->le_ctx), using lu_context_key_get().
 *
 * NOTE(review): the fetched pointer is presumably validated and then
 * returned -- confirm whether callers may ever see NULL.
 */
1558 static inline struct dt_thread_info *dt_info(const struct lu_env *env)
1560 struct dt_thread_info *dti;
1562 dti = lu_context_key_get(&env->le_ctx, &dt_key);
/*
 * Global init/fini entry points, defined elsewhere.
 * dt_global_init() reports a status as int; dt_global_fini() returns
 * nothing.
 * NOTE(review): presumably 0 on success and a negative errno on failure --
 * confirm against the definition.
 */
1567 int dt_global_init(void);
1568 void dt_global_fini(void);
/*
 * Read handlers with the (page, start, off, count, eof, data) signature,
 * declared only when HAVE_ONLY_PROCFS_SEQ is not defined.
 * One handler per value: blksize, kbytestotal, kbytesfree, kbytesavail,
 * filestotal and filesfree.
 * NOTE(review): \a data is presumably the dt device whose statistics are
 * reported -- confirm against the definitions.
 */
1571 #ifndef HAVE_ONLY_PROCFS_SEQ
1572 int lprocfs_dt_rd_blksize(char *page, char **start, off_t off,
1573 int count, int *eof, void *data);
1574 int lprocfs_dt_rd_kbytestotal(char *page, char **start, off_t off,
1575 int count, int *eof, void *data);
1576 int lprocfs_dt_rd_kbytesfree(char *page, char **start, off_t off,
1577 int count, int *eof, void *data);
1578 int lprocfs_dt_rd_kbytesavail(char *page, char **start, off_t off,
1579 int count, int *eof, void *data);
1580 int lprocfs_dt_rd_filestotal(char *page, char **start, off_t off,
1581 int count, int *eof, void *data);
1582 int lprocfs_dt_rd_filesfree(char *page, char **start, off_t off,
1583 int count, int *eof, void *data);
/*
 * seq_file "show" callbacks taking (struct seq_file *m, void *v), one per
 * value: blksize, kbytestotal, kbytesfree, kbytesavail, filestotal and
 * filesfree. Defined elsewhere.
 */
1585 int lprocfs_dt_blksize_seq_show(struct seq_file *m, void *v);
1586 int lprocfs_dt_kbytestotal_seq_show(struct seq_file *m, void *v);
1587 int lprocfs_dt_kbytesfree_seq_show(struct seq_file *m, void *v);
1588 int lprocfs_dt_kbytesavail_seq_show(struct seq_file *m, void *v);
1589 int lprocfs_dt_filestotal_seq_show(struct seq_file *m, void *v);
1590 int lprocfs_dt_filesfree_seq_show(struct seq_file *m, void *v);
1591 # endif /* LPROCFS */
1593 #endif /* __LUSTRE_DT_OBJECT_H */