4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License version 2 for more details. A copy is
14 * included in the COPYING file that accompanied this code.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 * Copyright 2009 Sun Microsystems, Inc. All rights reserved
24 * Use is subject to license terms.
26 * Copyright (c) 2012, 2013, Intel Corporation.
29 * This file is part of Lustre, http://www.lustre.org/
30 * Lustre is a trademark of Sun Microsystems, Inc.
32 * lustre/lod/lod_internal.h
34 * Author: Alex Zhuravlev <alexey.zhuravlev@intel.com>
35 * Author: Mikhail Pershin <mike.pershin@intel.com>
38 #ifndef _LOD_INTERNAL_H
39 #define _LOD_INTERNAL_H
41 #include <libcfs/libcfs.h>
43 #include <dt_object.h>
/*
 * Stripe-usage selectors: 0 for an assigned stripe, 1 for the default stripe.
 * NOTE(review): no user of these constants is visible in this header --
 * confirm how callers interpret them.
 */
45 #define LOV_USES_ASSIGNED_STRIPE 0
46 #define LOV_USES_DEFAULT_STRIPE 1
/*
 * Round-robin allocation state (lqr_* fields).
 * NOTE(review): the struct header and closing brace are missing from this
 * view; presumably these are the members of struct lod_qos_rr, which other
 * declarations in this header embed -- confirm.
 */
49 __u32 lqr_start_idx; /* start index of new inode */
50 __u32 lqr_offset_idx; /* aliasing for start_idx */
51 int lqr_start_count; /* reseed counter */
52 struct ost_pool lqr_pool; /* round-robin optimized list */
53 unsigned long lqr_dirty:1; /* recalc round-robin list */
/*
 * Per-pool descriptor fields: name, member targets, reference count,
 * round-robin state, hash/list linkage, proc entry and owning obd device.
 * NOTE(review): the struct header and closing brace are missing from this
 * view; presumably these are the members of struct pool_desc -- confirm.
 */
57 char pool_name[LOV_MAXPOOLNAME + 1];
58 struct ost_pool pool_obds; /* pool members */
59 atomic_t pool_refcount;
60 struct lod_qos_rr pool_rr;
61 cfs_hlist_node_t pool_hash; /* access by poolname */
62 struct list_head pool_list;
63 struct proc_dir_entry *pool_proc_entry;
64 struct obd_device *pool_lobd; /* owner */
/*
 * Shorthand accessors for the ost_pool embedded in a pool descriptor:
 * each expands to the matching op_* member of (p)->pool_obds.
 */
67 #define pool_tgt_size(p) ((p)->pool_obds.op_size)
68 #define pool_tgt_count(p) ((p)->pool_obds.op_count)
69 #define pool_tgt_array(p) ((p)->pool_obds.op_array)
70 #define pool_tgt_rw_sem(p) ((p)->pool_obds.op_rw_sem)
/*
 * Device-wide QoS state (lq_* fields): OSS list and its semaphore, active
 * OSS count, tunables, round-robin data and three one-bit status flags.
 * NOTE(review): the struct header and closing brace are missing from this
 * view; presumably these are the members of struct lod_qos -- confirm.
 */
73 struct list_head lq_oss_list;
74 struct rw_semaphore lq_rw_sem;
75 __u32 lq_active_oss_count;
76 unsigned int lq_prio_free; /* priority for free space */
77 unsigned int lq_threshold_rr;/* priority for rr */
78 struct lod_qos_rr lq_rr; /* round robin qos data */
79 bool lq_dirty:1, /* recalc qos data */
80 lq_same_space:1,/* the ost's all have approx.
81 the same space avail */
82 lq_reset:1; /* zero current penalties */
/*
 * Per-OSS QoS bookkeeping (lqo_* fields).
 * NOTE(review): the struct header and closing brace are missing from this
 * view (presumably struct lod_qos_oss), and the comment opened on
 * lqo_penalty_per_obj has lost its closing line, so it currently runs on
 * into the following declaration -- restore from the upstream file.
 */
86 struct obd_uuid lqo_uuid; /* ptlrpc's c_remote_uuid */
87 struct list_head lqo_oss_list; /* link to lov_qos */
88 __u64 lqo_bavail; /* total bytes avail on OSS */
89 __u64 lqo_penalty; /* current penalty */
90 __u64 lqo_penalty_per_obj; /* penalty decrease
92 time_t lqo_used; /* last used time, seconds */
93 __u32 lqo_ost_count; /* number of osts on this oss */
/*
 * Per-target QoS bookkeeping (ltq_* fields), including a pointer to the
 * OSS-level record the target belongs to.
 * NOTE(review): the struct header and closing brace are missing from this
 * view (presumably struct ltd_qos), and the comment opened on
 * ltq_penalty_per_obj has lost its closing line, so it currently runs on
 * into the following declarations -- restore from the upstream file.
 */
97 struct lod_qos_oss *ltq_oss; /* oss info */
98 __u64 ltq_penalty; /* current penalty */
99 __u64 ltq_penalty_per_obj; /* penalty decrease
101 __u64 ltq_weight; /* net weighting */
102 time_t ltq_used; /* last used time, seconds */
103 bool ltq_usable:1; /* usable for striping */
/*
 * Descriptor of a single target: its dt_device, export, UUID, per-target
 * QoS data, cached statfs and three one-bit state flags.
 * NOTE(review): some members and the closing brace are missing from this
 * view.
 */
106 struct lod_tgt_desc {
107 struct dt_device *ltd_tgt;
108 struct list_head ltd_kill;
109 struct obd_export *ltd_exp;
110 struct obd_uuid ltd_uuid;
113 struct ltd_qos ltd_qos; /* qos info per target */
114 struct obd_statfs ltd_statfs;
115 unsigned long ltd_active:1,/* is this target up for requests */
116 ltd_activate:1,/* should target be activated */
117 ltd_reap:1; /* should this target be deleted */
/*
 * Dimensions of the two-level target pointer table: TGT_PTRS first-level
 * slots, each referring to a block of TGT_PTRS_PER_BLOCK target pointers.
 */
120 #define TGT_PTRS 256 /* number of pointers at 1st level */
121 #define TGT_PTRS_PER_BLOCK 256 /* number of pointers at 2nd level */
/*
 * One second-level block of the target table: TGT_PTRS_PER_BLOCK pointers
 * to target descriptors.
 * NOTE(review): the closing brace is missing from this view.
 */
123 struct lod_tgt_desc_idx {
124 struct lod_tgt_desc *ldi_tgt[TGT_PTRS_PER_BLOCK];
/*
 * Two-level lookup of target slot \a index in table \a ltd:
 * index / TGT_PTRS_PER_BLOCK selects the block in ltd_tgt_idx[], and
 * index % TGT_PTRS_PER_BLOCK selects the pointer within that block.
 * The block pointer is dereferenced unconditionally, and \a index is
 * evaluated twice.
 */
127 #define LTD_TGT(ltd, index) \
128 ((ltd)->ltd_tgt_idx[(index) / \
129 TGT_PTRS_PER_BLOCK]->ldi_tgt[(index) % TGT_PTRS_PER_BLOCK])
/*
 * Look up the target slot for \a index in the OST table (lod_ost_descs) of
 * device \a lod, by delegating to LTD_TGT().
 * \a lod is parenthesized so that expression arguments (e.g. "devs + 1")
 * are fully evaluated before the "->" member access is applied.
 */
#define OST_TGT(lod, index) LTD_TGT(&(lod)->lod_ost_descs, index)
/*
 * Table of targets: the two-level pointer index, an availability bitmap,
 * and the mutex and rw-semaphore that guard updates to it.
 * NOTE(review): several member declarations (the ones the "Size of",
 * "number of registered", "scheduled to be deleted" and "Table refcount"
 * comments describe) and the closing brace are missing from this view.
 */
132 struct lod_tgt_descs {
133 /* list of known TGTs */
134 struct lod_tgt_desc_idx *ltd_tgt_idx[TGT_PTRS];
135 /* Size of the lod_tgts array, guaranteed to be a power of 2 */
137 /* number of registered TGTs */
139 /* bitmap of TGTs available */
140 cfs_bitmap_t *ltd_tgt_bitmap;
141 /* TGTs scheduled to be deleted */
143 /* Table refcount used for delayed deletion */
145 /* mutex to serialize concurrent updates to the tgt table */
146 struct mutex ltd_mutex;
147 /* read/write semaphore used for array relocation */
148 struct rw_semaphore ltd_rw_sem;
/*
 * LOD device state: the embedded dt_device, the child device and its
 * export, proc/stats handles, the lov descriptor and its lock, the OST and
 * MDT target tables, QoS data and pool bookkeeping.
 * NOTE(review): the struct header (presumably struct lod_device), some
 * members (the bit-field list after lod_recovery_completed is cut off) and
 * the closing brace are missing from this view.
 */
152 struct dt_device lod_dt_dev;
153 struct obd_export *lod_child_exp;
154 struct dt_device *lod_child;
155 cfs_proc_dir_entry_t *lod_proc_entry;
156 struct lprocfs_stats *lod_stats;
157 spinlock_t lod_connects_lock;
159 unsigned int lod_recovery_completed:1,
162 /* lov settings descriptor storing static information */
163 struct lov_desc lod_desc;
165 /* use to protect ld_active_tgt_count and all ltd_active */
166 spinlock_t lod_desc_lock;
168 /* Description of OST */
169 struct lod_tgt_descs lod_ost_descs;
170 /* Description of MDT */
171 struct lod_tgt_descs lod_mdt_descs;
173 /* maximum EA size the underlying OSD may have */
174 unsigned int lod_osd_max_easize;
176 /*FIXME: When QOS and pool are implemented for MDT, probably these
177 * structures should be moved to lod_tgt_descs as well.
179 /* QoS info per LOD */
180 struct lod_qos lod_qos; /* qos info per lod */
183 struct ost_pool lod_pool_info; /* all OSTs in a packed array */
185 cfs_hash_t *lod_pools_hash_body; /* used for key access */
186 cfs_list_t lod_pool_list; /* used for sequential access */
187 cfs_proc_dir_entry_t *lod_pool_proc_entry;
189 enum lustre_sec_part lod_sp_me;
191 cfs_proc_dir_entry_t *lod_symlink;
/*
 * Name aliases: the lod_ost* names map onto members of the OST target
 * table (lod_ost_descs), while ltd_ost and lod_ost_desc alias the generic
 * target names.
 * NOTE(review): ltd_tgts, ltd_tgtnr and ltd_tgts_size are not among the
 * struct lod_tgt_descs members visible in this view -- confirm they exist.
 */
194 #define lod_osts lod_ost_descs.ltd_tgts
195 #define lod_ost_bitmap lod_ost_descs.ltd_tgt_bitmap
196 #define lod_ostnr lod_ost_descs.ltd_tgtnr
197 #define lod_osts_size lod_ost_descs.ltd_tgts_size
198 #define ltd_ost ltd_tgt
199 #define lod_ost_desc lod_tgt_desc
202 * XXX: shrink this structure, currently it's 72bytes on 32bit arch,
203 * so, slab will be allocating 128bytes
/*
 * LOD object state: the embedded dt_object, the striping description
 * (layout generation, stripe size, released stripe count, stripe object
 * array) and the cached default striping for directories.
 * NOTE(review): the struct header (presumably struct lod_object), some
 * members and the closing brace are missing from this view.
 */
206 struct dt_object ldo_obj;
208 /* if object is striped, then the next fields describe stripes */
210 __u16 ldo_layout_gen;
211 __u32 ldo_stripe_size;
213 __u16 ldo_released_stripenr;
215 struct dt_object **ldo_stripe;
216 /* to know how much memory to free, ldo_stripenr can be less */
217 /* default striping for directory represented by this object
218 * is cached in stripenr/stripe_size */
219 unsigned int ldo_stripes_allocated:16,
220 ldo_striping_cached:1,
221 ldo_def_striping_set:1;
222 __u32 ldo_def_stripe_size;
223 __u16 ldo_def_stripenr;
224 __u16 ldo_def_stripe_offset;
/*
 * Iterator wrapper fields: the lower-layer object and its iterator.
 * NOTE(review): the struct header and closing brace are missing from this
 * view; presumably these are the members of struct lod_it -- confirm.
 */
230 struct dt_object *lit_obj; /* object from the layer below */
231 struct dt_it *lit_it; /* iterator from the layer below */
/*
 * Per-thread scratch data: LOV EA buffer size, a generic buffer, and
 * reusable ost_id, fid, statfs, attribute and iterator objects.
 * NOTE(review): the buffer member described by the "per-thread buffer for
 * LOV EA" comment and the closing brace are missing from this view.
 */
234 struct lod_thread_info {
235 /* per-thread buffer for LOV EA */
237 int lti_ea_store_size;
238 struct lu_buf lti_buf;
239 struct ost_id lti_ostid;
240 struct lu_fid lti_fid;
241 struct obd_statfs lti_osfs;
242 struct lu_attr lti_attr;
243 struct lod_it lti_it;
/*
 * lod_lu_ops identifies LOD devices; lu_device_is_lod() compares a
 * device's ld_ops pointer against it.
 * NOTE(review): ergo() is defined elsewhere; if it is logical implication,
 * a NULL \a d or a NULL d->ld_ops makes this return true -- confirm.
 * The function braces are missing from this view.
 */
246 extern const struct lu_device_operations lod_lu_ops;
248 static inline int lu_device_is_lod(struct lu_device *d)
250 return ergo(d != NULL && d->ld_ops != NULL, d->ld_ops == &lod_lu_ops);
/*
 * Convert an lu_device pointer to the lod_device that embeds it at
 * lod_dt_dev.dd_lu_dev, after asserting lu_device_is_lod(d).
 * NOTE(review): container_of0() is defined elsewhere; its handling of NULL
 * is not visible here. The function braces are missing from this view.
 */
253 static inline struct lod_device* lu2lod_dev(struct lu_device *d)
255 LASSERT(lu_device_is_lod(d));
256 return container_of0(d, struct lod_device, lod_dt_dev.dd_lu_dev);
/*
 * Return the address of the lu_device embedded in \a d
 * (lod_dt_dev.dd_lu_dev). \a d is not checked for NULL.
 * The function braces are missing from this view.
 */
259 static inline struct lu_device *lod2lu_dev(struct lod_device *d)
261 return &d->lod_dt_dev.dd_lu_dev;
/*
 * Return the obd_device recorded in the embedded lu_device's ld_obd
 * member. \a d is dereferenced without a NULL check.
 * The function braces are missing from this view.
 */
264 static inline struct obd_device *lod2obd(struct lod_device *d)
266 return d->lod_dt_dev.dd_lu_dev.ld_obd;
/*
 * Convert a dt_device pointer to the lod_device that embeds it as
 * lod_dt_dev, after asserting that its lu_device passes
 * lu_device_is_lod(). The assertion takes &d->dd_lu_dev, so \a d is
 * expected to be non-NULL.
 * The function braces are missing from this view.
 */
269 static inline struct lod_device *dt2lod_dev(struct dt_device *d)
271 LASSERT(lu_device_is_lod(&d->dd_lu_dev));
272 return container_of0(d, struct lod_device, lod_dt_dev);
/*
 * Convert an lu_object pointer to the lod_object that embeds it at
 * ldo_obj.do_lu. The device check is asserted only when \a o is non-NULL.
 * NOTE(review): whether a NULL \a o maps to a NULL result depends on
 * container_of0(), which is defined elsewhere -- confirm.
 * The function braces are missing from this view.
 */
275 static inline struct lod_object *lu2lod_obj(struct lu_object *o)
277 LASSERT(ergo(o != NULL, lu_device_is_lod(o->lo_dev)));
278 return container_of0(o, struct lod_object, ldo_obj.do_lu);
/*
 * Return the address of the lu_object embedded in \a obj
 * (ldo_obj.do_lu). \a obj is not checked for NULL.
 * The function braces are missing from this view.
 */
281 static inline struct lu_object *lod2lu_obj(struct lod_object *obj)
283 return &obj->ldo_obj.do_lu;
/*
 * Const-input variant of lu2lod_obj(): convert an lu_object pointer to the
 * enclosing lod_object. Unlike lu2lod_obj(), the assertion dereferences
 * o->lo_dev unconditionally, so \a o must be non-NULL.
 * The function braces are missing from this view.
 */
286 static inline struct lod_object *lod_obj(const struct lu_object *o)
288 LASSERT(lu_device_is_lod(o->lo_dev));
289 return container_of0(o, struct lod_object, ldo_obj.do_lu);
/*
 * Convert a dt_object pointer to its enclosing lod_object by passing the
 * embedded do_lu member to lod_obj().
 * The function braces are missing from this view.
 */
292 static inline struct lod_object *lod_dt_obj(const struct dt_object *d)
294 return lod_obj(&d->do_lu);
/*
 * Return the dt_object that embeds (as do_lu) the lu_object returned by
 * lu_object_next() for \a o's lu_object.
 * NOTE(review): presumably this is the object of the layer below LOD;
 * lu_object_next() is defined elsewhere -- confirm.
 * The function braces are missing from this view.
 */
297 static inline struct dt_object* lod_object_child(struct lod_object *o)
299 return container_of0(lu_object_next(lod2lu_obj(o)),
300 struct dt_object, do_lu);
/*
 * Same as lod_object_child() but starting from a dt_object: return the
 * dt_object that embeds the lu_object returned by lu_object_next() for
 * \a o's do_lu member.
 * The function braces are missing from this view.
 */
303 static inline struct dt_object *dt_object_child(struct dt_object *o)
305 return container_of0(lu_object_next(&(o)->do_lu),
306 struct dt_object, do_lu);
/*
 * lod_thread_key is the context key under which the per-thread
 * lod_thread_info is stored; lod_env_info() fetches that value from the
 * environment's le_ctx via lu_context_key_get().
 * NOTE(review): the rest of the function body (after the lookup) and the
 * braces are missing from this view.
 */
309 extern struct lu_context_key lod_thread_key;
311 static inline struct lod_thread_info *lod_env_info(const struct lu_env *env)
313 struct lod_thread_info *info;
314 info = lu_context_key_get(&env->le_ctx, &lod_thread_key);
/*
 * Loop header: run the statement that follows once per bit reported by
 * cfs_foreach_bit() on the device's OST bitmap, with \a index as the loop
 * variable, but only when lod_osts_size is greater than zero.
 * NOTE(review): this expands to an unbraced "if", so an "else" written
 * after a use of the macro may bind to an "if" inside the expansion.
 */
319 #define lod_foreach_ost(__dev, index) \
320 if ((__dev)->lod_osts_size > 0) \
321 cfs_foreach_bit((__dev)->lod_ost_bitmap, (index))
/*
 * Declaration only; the definition is not in this header.
 * NOTE(review): presumably resolves \a fid to a target index stored
 * through \a tgt and returns 0 or a negative errno -- confirm against the
 * definition.
 */
324 int lod_fld_lookup(const struct lu_env *env, struct lod_device *lod,
325 const struct lu_fid *fid, mdsno_t *tgt, int flags);
/*
 * Declarations for target-table management (getref/putref, add/del/fini),
 * striping load/parse/verify/store helpers and lov descriptor fix-ups.
 * The definitions are not in this header.
 * NOTE(review): the final parameter lines of lod_del_device() and
 * lod_store_def_striping() are missing from this view.
 */
327 void lod_getref(struct lod_tgt_descs *ltd);
328 void lod_putref(struct lod_device *lod, struct lod_tgt_descs *ltd);
329 int lod_add_device(const struct lu_env *env, struct lod_device *lod,
330 char *osp, unsigned index, unsigned gen, int mdt_index,
331 char *type, int active);
332 int lod_del_device(const struct lu_env *env, struct lod_device *lod,
333 struct lod_tgt_descs *ltd, char *osp, unsigned idx,
335 int lod_fini_tgt(struct lod_device *lod, struct lod_tgt_descs *ltd);
336 int lod_load_striping(const struct lu_env *env, struct lod_object *mo);
337 int lod_get_lov_ea(const struct lu_env *env, struct lod_object *mo);
338 void lod_fix_desc(struct lov_desc *desc);
339 void lod_fix_desc_qos_maxage(__u32 *val);
340 void lod_fix_desc_pattern(__u32 *val);
341 void lod_fix_desc_stripe_count(__u32 *val);
342 void lod_fix_desc_stripe_size(__u64 *val);
343 int lod_pools_init(struct lod_device *m, struct lustre_cfg *cfg);
344 int lod_pools_fini(struct lod_device *m);
345 int lod_parse_striping(const struct lu_env *env, struct lod_object *mo,
346 const struct lu_buf *buf);
347 int lod_initialize_objects(const struct lu_env *env, struct lod_object *mo,
348 struct lov_ost_data_v1 *objs);
349 int lod_store_def_striping(const struct lu_env *env, struct dt_object *dt,
351 int lod_verify_striping(struct lod_device *d, const struct lu_buf *buf, int specific);
352 int lod_generate_and_set_lovea(const struct lu_env *env,
353 struct lod_object *mo, struct thandle *th);
/*
 * Declarations for OST pool handling: operations on a struct ost_pool
 * (init/add/remove/extend/free), operations on named pools
 * (new/del/add/remove/find/putref/index check) and the hash operations
 * table for pools. The definitions are not in this header.
 */
356 int lod_ost_pool_add(struct ost_pool *op, __u32 idx, unsigned int min_count);
357 int lod_ost_pool_remove(struct ost_pool *op, __u32 idx);
358 int lod_ost_pool_extend(struct ost_pool *op, unsigned int min_count);
359 struct pool_desc *lod_find_pool(struct lod_device *lod, char *poolname);
360 void lod_pool_putref(struct pool_desc *pool);
361 int lod_ost_pool_free(struct ost_pool *op);
362 int lod_pool_del(struct obd_device *obd, char *poolname);
363 int lod_ost_pool_init(struct ost_pool *op, unsigned int count);
364 extern cfs_hash_ops_t pool_hash_operations;
365 int lod_check_index_in_pool(__u32 idx, struct pool_desc *pool);
366 int lod_pool_new(struct obd_device *obd, char *poolname);
367 int lod_pool_add(struct obd_device *obd, char *poolname, char *ostname);
368 int lod_pool_remove(struct obd_device *obd, char *poolname, char *ostname);
/*
 * Declarations for QoS-related entry points; the definitions are not in
 * this header.
 * NOTE(review): the final parameter line of lod_qos_prep_create() is
 * missing from this view. qos_add_tgt()/qos_del_tgt() omit parameter names.
 */
371 int lod_qos_prep_create(const struct lu_env *env, struct lod_object *lo,
372 struct lu_attr *attr, const struct lu_buf *buf,
374 int qos_add_tgt(struct lod_device*, struct lod_tgt_desc *);
375 int qos_del_tgt(struct lod_device *, struct lod_tgt_desc *);
/*
 * Declarations for procfs setup and teardown of a LOD device; the
 * definitions are not in this header.
 */
378 void lprocfs_lod_init_vars(struct lprocfs_static_vars *lvars);
379 int lod_procfs_init(struct lod_device *lod);
380 void lod_procfs_fini(struct lod_device *lod);
/*
 * Declarations for object-level striping operations (set pool, declare and
 * create striping, free cached striping); the definitions are not in this
 * header.
 * NOTE(review): the final parameter line of lod_striping_create() is
 * missing from this view.
 */
383 int lod_object_set_pool(struct lod_object *o, char *pool);
384 int lod_declare_striped_object(const struct lu_env *env, struct dt_object *dt,
385 struct lu_attr *attr,
386 const struct lu_buf *lovea, struct thandle *th);
387 int lod_striping_create(const struct lu_env *env, struct dt_object *dt,
388 struct lu_attr *attr, struct dt_object_format *dof,
390 void lod_object_free_striping(const struct lu_env *env, struct lod_object *lo);