1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
4 * Copyright (C) 2002, 2003 Cluster File Systems, Inc.
6 * This file is part of the Lustre file system, http://www.lustre.org
7 * Lustre is a trademark of Cluster File Systems, Inc.
9 * You may have signed or agreed to another license before downloading
10 * this software. If so, you are bound by the terms and conditions
11 * of that agreement, and the following does not apply to you. See the
12 * LICENSE file included with this distribution for more information.
14 * If you did not agree to a different license, then this copy of Lustre
15 * is open source software; you can redistribute it and/or modify it
16 * under the terms of version 2 of the GNU General Public License as
17 * published by the Free Software Foundation.
19 * In either case, Lustre is distributed in the hope that it will be
20 * useful, but WITHOUT ANY WARRANTY; without even the implied warranty
21 * of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
22 * license text for more details.
26 # define EXPORT_SYMTAB
28 #define DEBUG_SUBSYSTEM S_LOV
31 #include <libcfs/libcfs.h>
33 #include <liblustre.h>
36 #include <obd_class.h>
38 #include <lustre/lustre_idl.h>
40 #include "lov_internal.h"
/* Initialize a request set: zero the completion counter, set up the empty
 * request list and start the reference count at 1. */
42 static void lov_init_set(struct lov_request_set *set)
45 set->set_completes = 0;
48 CFS_INIT_LIST_HEAD(&set->set_list);
49 atomic_set(&set->set_refcount, 1);
/* Release everything owned by a request set: each queued request (with its
 * obdo, stripe-md buffer and statfs buffer), the brw page array, the lock
 * handle reference and finally the set structure itself. */
52 static void lov_finish_set(struct lov_request_set *set)
54 struct list_head *pos, *n;
/* the _safe iterator is needed because entries are unlinked and freed
 * while the list is being walked */
58 list_for_each_safe(pos, n, &set->set_list) {
59 struct lov_request *req = list_entry(pos, struct lov_request,
61 list_del_init(&req->rq_link);
64 obdo_free(req->rq_oi.oi_oa);
/* rq_buflen records the size the md buffer was allocated with */
66 OBD_FREE(req->rq_oi.oi_md, req->rq_buflen);
67 if (req->rq_oi.oi_osfs)
68 OBD_FREE(req->rq_oi.oi_osfs,
69 sizeof(*req->rq_oi.oi_osfs));
70 OBD_FREE(req, sizeof(*req));
/* the page array holds set_oabufs entries */
74 int len = set->set_oabufs * sizeof(*set->set_pga);
75 OBD_FREE(set->set_pga, len);
78 lov_llh_put(set->set_lockh);
80 OBD_FREE(set, sizeof(*set));
/* Record the outcome rc of request req in its set.
 * NOTE(review): presumably marks req complete and bumps the set counters
 * (set_completes / set_success) - confirm against the function body. */
84 void lov_update_set(struct lov_request_set *set,
85 struct lov_request *req, int rc)
/* Common per-request completion handler: records rc through
 * lov_update_set() and then special-cases a failure whose target OST is
 * unconfigured or inactive.
 * NOTE(review): the value returned in each case should be confirmed against
 * the full body. */
95 int lov_update_common_set(struct lov_request_set *set,
96 struct lov_request *req, int rc)
98 struct lov_obd *lov = &set->set_exp->exp_obd->u.lov;
101 lov_update_set(set, req, rc);
103 /* grace error on inactive ost */
104 if (rc && !(lov->lov_tgts[req->rq_idx] &&
105 lov->lov_tgts[req->rq_idx]->ltd_active))
108 /* FIXME in raid1 regime, should return 0 */
/* Queue req at the tail of the request list of set. */
112 void lov_set_add_req(struct lov_request *req, struct lov_request_set *set)
114 list_add_tail(&req->rq_link, &set->set_list);
/* Process the result rc of one per-stripe enqueue request.
 *
 * - ELDLM_OK: the stripe lvb is refreshed from the sub-request copy and the
 *   known minimum size (kms) is compared against the granted extent, all
 *   under the stripe lock; the lock is then allowed to be matched.
 * - ELDLM_LOCK_ABORTED with LDLM_FL_HAS_INTENT (logged as "glimpsed"): the
 *   stripe lock handle is cleared and only the lvb is refreshed.
 * - anything else: the handle is cleared and an error is logged when the
 *   target OST is configured and active.
 *
 * The result is finally recorded in the set with lov_update_set(). */
118 int lov_update_enqueue_set(struct lov_request *req, __u32 mode, int rc)
120 struct lov_request_set *set = req->rq_rqset;
121 struct lustre_handle *lov_lockhp;
122 struct lov_oinfo *loi;
125 LASSERT(set != NULL);
126 LASSERT(set->set_oi != NULL);
/* per-stripe lock handle and per-stripe object info of the parent md */
128 lov_lockhp = set->set_lockh->llh_handles + req->rq_stripe;
129 loi = &set->set_oi->oi_md->lsm_oinfo[req->rq_stripe];
131 /* XXX LOV STACKING: OSC gets a copy, created in lov_prep_enqueue_set
132 * and that copy can be arbitrarily out of date.
134 * The LOV API is due for a serious rewriting anyways, and this
135 * can be addressed then. */
137 if (rc == ELDLM_OK) {
138 struct ldlm_lock *lock = ldlm_handle2lock(lov_lockhp);
141 LASSERT(lock != NULL);
142 lov_stripe_lock(set->set_oi->oi_md);
/* the sub-request md carries a single lov_oinfo holding the fresh lvb */
143 loi->loi_lvb = req->rq_oi.oi_md->lsm_oinfo->loi_lvb;
144 tmp = loi->loi_lvb.lvb_size;
145 /* Extend KMS up to the end of this lock and no further
146 * A lock on [x,y] means a KMS of up to y + 1 bytes! */
147 if (tmp > lock->l_policy_data.l_extent.end)
148 tmp = lock->l_policy_data.l_extent.end + 1;
/* kms never shrinks here: only a candidate >= the current kms is taken */
149 if (tmp >= loi->loi_kms) {
150 LDLM_DEBUG(lock, "lock acquired, setting rss="LPU64
151 ", kms="LPU64, loi->loi_lvb.lvb_size, tmp);
153 loi->loi_kms_valid = 1;
155 LDLM_DEBUG(lock, "lock acquired, setting rss="
156 LPU64"; leaving kms="LPU64", end="LPU64,
157 loi->loi_lvb.lvb_size, loi->loi_kms,
158 lock->l_policy_data.l_extent.end);
160 lov_stripe_unlock(set->set_oi->oi_md);
161 ldlm_lock_allow_match(lock);
163 } else if ((rc == ELDLM_LOCK_ABORTED) &&
164 (set->set_ei->ei_flags & LDLM_FL_HAS_INTENT)) {
/* no lock was granted for this stripe: forget the handle */
165 memset(lov_lockhp, 0, sizeof(*lov_lockhp));
166 lov_stripe_lock(set->set_oi->oi_md);
167 loi->loi_lvb = req->rq_oi.oi_md->lsm_oinfo->loi_lvb;
168 lov_stripe_unlock(set->set_oi->oi_md);
169 CDEBUG(D_INODE, "glimpsed, setting rss="LPU64"; leaving"
170 " kms="LPU64"\n", loi->loi_lvb.lvb_size, loi->loi_kms);
173 struct obd_export *exp = set->set_exp;
174 struct lov_obd *lov = &exp->exp_obd->u.lov;
176 memset(lov_lockhp, 0, sizeof(*lov_lockhp));
/* only complain when the target is configured and active */
177 if (lov->lov_tgts[req->rq_idx] &&
178 lov->lov_tgts[req->rq_idx]->ltd_active) {
179 CERROR("error: enqueue objid "LPX64" subobj "
180 LPX64" on OST idx %d: rc = %d\n",
181 set->set_oi->oi_md->lsm_object_id,
182 loi->loi_id, loi->loi_ost_idx, rc);
187 lov_update_set(set, req, rc);
191 /* The callback for osc_enqueue that updates lov info for every OSC request. */
/* oinfo is embedded in a lov_request as rq_oi; recover the request with
 * container_of() and forward to lov_update_enqueue_set() using the lock
 * mode stored in the enqueue info of the owning set. */
192 static int cb_update_enqueue(struct obd_info *oinfo, int rc)
194 struct obd_enqueue_info *einfo;
195 struct lov_request *lovreq;
197 lovreq = container_of(oinfo, struct lov_request, rq_oi);
198 einfo = lovreq->rq_rqset->set_ei;
199 return lov_update_enqueue_set(lovreq, einfo->ei_mode, rc);
/* Post-processing shared by enqueue and match sets. When every completed
 * request succeeded nothing has to be undone. Otherwise the sub-locks that
 * were obtained (completed, rc == 0, handle in use) are cancelled on their
 * target with obd_cancel() and a reference on the lock handle set is put. */
202 static int enqueue_done(struct lov_request_set *set, __u32 mode)
204 struct lov_request *req;
205 struct lov_obd *lov = &set->set_exp->exp_obd->u.lov;
209 /* enqueue/match success, just return */
210 if (set->set_completes && set->set_completes == set->set_success)
213 /* cancel enqueued/matched locks */
214 list_for_each_entry(req, &set->set_list, rq_link) {
215 struct lustre_handle *lov_lockhp;
/* requests that never completed or that failed hold no lock */
217 if (!req->rq_complete || req->rq_rc)
220 lov_lockhp = set->set_lockh->llh_handles + req->rq_stripe;
222 if (!lustre_handle_is_used(lov_lockhp))
225 rc = obd_cancel(lov->lov_tgts[req->rq_idx]->ltd_exp,
226 req->rq_oi.oi_md, mode, lov_lockhp);
/* a cancel failure is only reported for a configured, active target */
227 if (rc && lov->lov_tgts[req->rq_idx] &&
228 lov->lov_tgts[req->rq_idx]->ltd_active)
229 CERROR("cancelling obdjid "LPX64" on OST "
230 "idx %d error: rc = %d\n",
231 req->rq_oi.oi_md->lsm_object_id,
235 lov_llh_put(set->set_lockh);
/* Finish an enqueue request set.
 * When the enqueue info carries no request set (ei_rqset is NULL)
 * enqueue_done() is run here; otherwise only the lock handle reference is
 * put, if a handle set exists. One reference on the set is then dropped.
 * Returns rc when it is non-zero, else the enqueue_done() result. */
239 int lov_fini_enqueue_set(struct lov_request_set *set, __u32 mode, int rc)
246 LASSERT(set->set_exp);
247 /* Do enqueue_done only for sync requests and if any request
249 if (!set->set_ei->ei_rqset) {
251 set->set_completes = 0;
252 ret = enqueue_done(set, mode);
253 } else if (set->set_lockh)
254 lov_llh_put(set->set_lockh);
256 if (atomic_dec_and_test(&set->set_refcount))
259 RETURN(rc ? rc : ret);
/* Build the request set for a striped lock enqueue.
 * A lock handle set is created for the object and its cookie is published
 * through oinfo->oi_lockh. Each stripe is checked against the requested
 * extent and against the state of its target before a lov_request with a
 * private single-stripe md copy is allocated and queued.
 * Error codes visible here: -ENOMEM on allocation failure and -EIO; on
 * failure the partially built set goes through lov_fini_enqueue_set(). */
262 int lov_prep_enqueue_set(struct obd_export *exp, struct obd_info *oinfo,
263 struct obd_enqueue_info *einfo,
264 struct lov_request_set **reqset)
266 struct lov_obd *lov = &exp->exp_obd->u.lov;
267 struct lov_request_set *set;
269 struct lov_oinfo *loi;
272 OBD_ALLOC(set, sizeof(*set));
280 set->set_lockh = lov_llh_new(oinfo->oi_md);
281 if (set->set_lockh == NULL)
282 GOTO(out_set, rc = -ENOMEM);
/* the caller sees one handle; it maps to the per-stripe handle array */
283 oinfo->oi_lockh->cookie = set->set_lockh->llh_handle.h_cookie;
285 loi = oinfo->oi_md->lsm_oinfo;
286 for (i = 0; i < oinfo->oi_md->lsm_stripe_count; i++, loi++) {
287 struct lov_request *req;
290 if (!lov_stripe_intersects(oinfo->oi_md, i,
291 oinfo->oi_policy.l_extent.start,
292 oinfo->oi_policy.l_extent.end,
296 if (!lov->lov_tgts[loi->loi_ost_idx] ||
297 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
298 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
302 OBD_ALLOC(req, sizeof(*req));
304 GOTO(out_set, rc = -ENOMEM);
/* room for the md header plus exactly one lov_oinfo */
306 req->rq_buflen = sizeof(*req->rq_oi.oi_md) +
307 sizeof(struct lov_oinfo);
308 OBD_ALLOC(req->rq_oi.oi_md, req->rq_buflen);
309 if (req->rq_oi.oi_md == NULL) {
310 OBD_FREE(req, sizeof(*req));
311 GOTO(out_set, rc = -ENOMEM);
315 /* Set lov request specific parameters. */
316 req->rq_oi.oi_lockh = set->set_lockh->llh_handles + i;
317 req->rq_oi.oi_cb_up = cb_update_enqueue;
319 LASSERT(req->rq_oi.oi_lockh);
321 req->rq_oi.oi_policy.l_extent.gid =
322 oinfo->oi_policy.l_extent.gid;
323 req->rq_oi.oi_policy.l_extent.start = start;
324 req->rq_oi.oi_policy.l_extent.end = end;
326 req->rq_idx = loi->loi_ost_idx;
329 /* XXX LOV STACKING: submd should be from the subobj */
330 req->rq_oi.oi_md->lsm_object_id = loi->loi_id;
331 req->rq_oi.oi_md->lsm_object_gr = oinfo->oi_md->lsm_object_gr;
332 req->rq_oi.oi_md->lsm_stripe_count = 0;
333 req->rq_oi.oi_md->lsm_oinfo->loi_kms_valid =
335 req->rq_oi.oi_md->lsm_oinfo->loi_kms = loi->loi_kms;
336 req->rq_oi.oi_md->lsm_oinfo->loi_lvb = loi->loi_lvb;
338 lov_set_add_req(req, set);
341 GOTO(out_set, rc = -EIO);
345 lov_fini_enqueue_set(set, einfo->ei_mode, rc);
/* Record the result of a per-stripe lock match in the set through
 * lov_update_set().
 * NOTE(review): how the recorded value ret is derived from the raw match
 * result should be confirmed against the full body. */
349 int lov_update_match_set(struct lov_request_set *set, struct lov_request *req,
359 lov_update_set(set, req, ret);
/* Finish a match request set: run enqueue_done(), put the lock handle
 * reference when every request succeeded and the caller only tested for a
 * lock (LDLM_FL_TEST_LOCK), then drop one reference on the set. */
363 int lov_fini_match_set(struct lov_request_set *set, __u32 mode, int flags)
370 LASSERT(set->set_exp);
371 rc = enqueue_done(set, mode);
372 if ((set->set_count == set->set_success) &&
373 (flags & LDLM_FL_TEST_LOCK))
374 lov_llh_put(set->set_lockh);
376 if (atomic_dec_and_test(&set->set_refcount))
/* Build the request set for a striped lock match.
 * A new lock handle set is created for lsm and its cookie is stored in the
 * caller handle lockh. Stripes are checked against the policy extent, and
 * an unconfigured or inactive target aborts the whole set with -EIO. Each
 * request gets a private md copy carrying only object id and group. */
382 int lov_prep_match_set(struct obd_export *exp, struct obd_info *oinfo,
383 struct lov_stripe_md *lsm, ldlm_policy_data_t *policy,
384 __u32 mode, struct lustre_handle *lockh,
385 struct lov_request_set **reqset)
387 struct lov_obd *lov = &exp->exp_obd->u.lov;
388 struct lov_request_set *set;
390 struct lov_oinfo *loi;
393 OBD_ALLOC(set, sizeof(*set));
400 set->set_oi->oi_md = lsm;
401 set->set_lockh = lov_llh_new(lsm);
402 if (set->set_lockh == NULL)
403 GOTO(out_set, rc = -ENOMEM);
404 lockh->cookie = set->set_lockh->llh_handle.h_cookie;
406 for (i = 0,loi = lsm->lsm_oinfo; i < lsm->lsm_stripe_count; i++, loi++){
407 struct lov_request *req;
410 if (!lov_stripe_intersects(lsm, i, policy->l_extent.start,
411 policy->l_extent.end, &start, &end))
414 /* FIXME raid1 should grace this error */
415 if (!lov->lov_tgts[loi->loi_ost_idx] ||
416 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
417 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
418 GOTO(out_set, rc = -EIO);
421 OBD_ALLOC(req, sizeof(*req));
423 GOTO(out_set, rc = -ENOMEM);
/* md header only: no per-stripe lov_oinfo is allocated for a match */
425 req->rq_buflen = sizeof(*req->rq_oi.oi_md);
426 OBD_ALLOC(req->rq_oi.oi_md, req->rq_buflen);
427 if (req->rq_oi.oi_md == NULL) {
428 OBD_FREE(req, sizeof(*req));
429 GOTO(out_set, rc = -ENOMEM);
/* start and end were filled in by lov_stripe_intersects() above */
432 req->rq_oi.oi_policy.l_extent.start = start;
433 req->rq_oi.oi_policy.l_extent.end = end;
434 req->rq_oi.oi_policy.l_extent.gid = policy->l_extent.gid;
436 req->rq_idx = loi->loi_ost_idx;
439 /* XXX LOV STACKING: submd should be from the subobj */
440 req->rq_oi.oi_md->lsm_object_id = loi->loi_id;
441 req->rq_oi.oi_md->lsm_object_gr = lsm->lsm_object_gr;
442 req->rq_oi.oi_md->lsm_stripe_count = 0;
444 lov_set_add_req(req, set);
447 GOTO(out_set, rc = -EIO);
451 lov_fini_match_set(set, mode, 0);
/* Finish a cancel request set: put the lock handle reference and drop one
 * reference on the set. */
455 int lov_fini_cancel_set(struct lov_request_set *set)
463 LASSERT(set->set_exp);
465 lov_llh_put(set->set_lockh);
467 if (atomic_dec_and_test(&set->set_refcount))
/* Build the request set for cancelling a striped lock.
 * The lock handle set is looked up from lockh (-EINVAL when the handle is
 * not valid). The per-stripe handle is checked for every stripe, and a
 * request with a private md copy is allocated and queued for the stripe.
 * Other error codes visible here: -ENOMEM and -EIO. */
473 int lov_prep_cancel_set(struct obd_export *exp, struct obd_info *oinfo,
474 struct lov_stripe_md *lsm, __u32 mode,
475 struct lustre_handle *lockh,
476 struct lov_request_set **reqset)
478 struct lov_request_set *set;
480 struct lov_oinfo *loi;
483 OBD_ALLOC(set, sizeof(*set));
490 set->set_oi->oi_md = lsm;
/* unlike enqueue and match, an existing handle set is looked up here */
491 set->set_lockh = lov_handle2llh(lockh);
492 if (set->set_lockh == NULL) {
493 CERROR("LOV: invalid lov lock handle %p\n", lockh);
494 GOTO(out_set, rc = -EINVAL);
496 lockh->cookie = set->set_lockh->llh_handle.h_cookie;
498 for (i = 0,loi = lsm->lsm_oinfo; i < lsm->lsm_stripe_count; i++, loi++){
499 struct lov_request *req;
500 struct lustre_handle *lov_lockhp;
502 lov_lockhp = set->set_lockh->llh_handles + i;
503 if (!lustre_handle_is_used(lov_lockhp)) {
504 CDEBUG(D_HA, "lov idx %d subobj "LPX64" no lock?\n",
505 loi->loi_ost_idx, loi->loi_id);
509 OBD_ALLOC(req, sizeof(*req));
511 GOTO(out_set, rc = -ENOMEM);
513 req->rq_buflen = sizeof(*req->rq_oi.oi_md);
514 OBD_ALLOC(req->rq_oi.oi_md, req->rq_buflen);
515 if (req->rq_oi.oi_md == NULL) {
516 OBD_FREE(req, sizeof(*req));
517 GOTO(out_set, rc = -ENOMEM);
520 req->rq_idx = loi->loi_ost_idx;
523 /* XXX LOV STACKING: submd should be from the subobj */
524 req->rq_oi.oi_md->lsm_object_id = loi->loi_id;
525 req->rq_oi.oi_md->lsm_object_gr = lsm->lsm_object_gr;
526 req->rq_oi.oi_md->lsm_stripe_count = 0;
528 lov_set_add_req(req, set);
531 GOTO(out_set, rc = -EIO);
535 lov_fini_cancel_set(set);
/* Complete a striped object create.
 * 1. If not every request succeeded, requests are re-driven through
 *    qos_remedy_create() and their results recorded again.
 * 2. The attributes of the successful sub-objects are merged into a
 *    temporary obdo, which is copied back over src_oa with the original
 *    id and group; the stripe md is handed back through lsmp.
 * 3. The code from the obd_destroy() loop onwards undoes the create: the
 *    sub-objects that were created are destroyed and the md is freed.
 * 4. Log cookie state in oti and the OBD_MD_FLCOOKIE flag of src_oa are
 *    brought in line with whether any cookie was sent. */
539 static int create_done(struct obd_export *exp, struct lov_request_set *set,
540 struct lov_stripe_md **lsmp)
542 struct lov_obd *lov = &exp->exp_obd->u.lov;
543 struct obd_trans_info *oti = set->set_oti;
544 struct obdo *src_oa = set->set_oi->oi_oa;
545 struct lov_request *req;
546 struct obdo *ret_oa = NULL;
547 int attrset = 0, rc = 0;
550 LASSERT(set->set_completes);
552 /* try alloc objects on other osts if osc_create fails for
553 * exceptions: RPC failure, ENOSPC, etc */
554 if (set->set_count != set->set_success) {
555 list_for_each_entry (req, &set->set_list, rq_link) {
/* take the request back out of the completed count before retrying */
559 set->set_completes--;
560 req->rq_complete = 0;
562 rc = qos_remedy_create(set, req);
563 lov_update_create_set(set, req, rc);
570 /* no successful creates */
571 if (set->set_success == 0)
574 /* If there was an explicit stripe set, fail. Otherwise, we
575 * got some objects and that's not bad. */
576 if (set->set_count != set->set_success) {
579 set->set_count = set->set_success;
583 ret_oa = obdo_alloc();
585 GOTO(cleanup, rc = -ENOMEM);
587 list_for_each_entry(req, &set->set_list, rq_link) {
588 if (!req->rq_complete || req->rq_rc)
590 lov_merge_attrs(ret_oa, req->rq_oi.oi_oa,
591 req->rq_oi.oi_oa->o_valid, set->set_oi->oi_md,
592 req->rq_stripe, &attrset);
/* the merged size is expected to match the size the caller asked for */
594 if (src_oa->o_valid & OBD_MD_FLSIZE &&
595 ret_oa->o_size != src_oa->o_size) {
596 CERROR("original size "LPU64" isn't new object size "LPU64"\n",
597 src_oa->o_size, ret_oa->o_size);
/* keep the identity of the caller obdo, take everything else merged */
600 ret_oa->o_id = src_oa->o_id;
601 ret_oa->o_gr = src_oa->o_gr;
602 ret_oa->o_valid |= OBD_MD_FLID | OBD_MD_FLGROUP;
603 memcpy(src_oa, ret_oa, sizeof(*src_oa));
606 *lsmp = set->set_oi->oi_md;
610 list_for_each_entry(req, &set->set_list, rq_link) {
611 struct obd_export *sub_exp;
614 if (!req->rq_complete || req->rq_rc)
617 sub_exp = lov->lov_tgts[req->rq_idx]->ltd_exp;
618 err = obd_destroy(sub_exp, req->rq_oi.oi_oa, NULL, oti, NULL);
620 CERROR("Failed to uncreate objid "LPX64" subobj "
621 LPX64" on OST idx %d: rc = %d\n",
622 src_oa->o_id, req->rq_oi.oi_oa->o_id,
626 obd_free_memmd(exp, &set->set_oi->oi_md);
628 if (oti && set->set_cookies) {
/* restore the cookie pointer saved in the set */
629 oti->oti_logcookies = set->set_cookies;
630 if (!set->set_cookie_sent) {
631 oti_free_cookies(oti);
632 src_oa->o_valid &= ~OBD_MD_FLCOOKIE;
634 src_oa->o_valid |= OBD_MD_FLCOOKIE;
/* Finish a create request set: when at least one request completed the
 * result is produced by create_done(); one reference on the set is then
 * dropped. */
640 int lov_fini_create_set(struct lov_request_set *set,struct lov_stripe_md **lsmp)
647 LASSERT(set->set_exp);
648 if (set->set_completes)
649 rc = create_done(set->set_exp, set, lsmp);
651 if (atomic_dec_and_test(&set->set_refcount))
/* Record the result rc of one sub-object create.
 * The request is assigned the stripe slot whose index equals the number of
 * successes so far. Failures on a configured, active target are logged.
 * After lov_update_set() the created object id is stored in oti_objid and
 * in the stripe slot, and log cookie bookkeeping is advanced. */
657 int lov_update_create_set(struct lov_request_set *set,
658 struct lov_request *req, int rc)
660 struct obd_trans_info *oti = set->set_oti;
661 struct lov_stripe_md *lsm = set->set_oi->oi_md;
662 struct lov_oinfo *loi;
663 struct lov_obd *lov = &set->set_exp->exp_obd->u.lov;
/* stripe slots are filled in order of successful creation */
666 req->rq_stripe = set->set_success;
667 loi = &lsm->lsm_oinfo[req->rq_stripe];
669 if (rc && lov->lov_tgts[req->rq_idx] &&
670 lov->lov_tgts[req->rq_idx]->ltd_active) {
671 CERROR("error creating fid "LPX64" sub-object"
672 " on OST idx %d/%d: rc = %d\n",
673 set->set_oi->oi_oa->o_id, req->rq_idx,
674 lsm->lsm_stripe_count, rc);
676 CERROR("obd_create returned invalid err %d\n", rc);
680 lov_update_set(set, req, rc);
/* oti_objid is indexed by OST index, not by stripe number */
684 if (oti && oti->oti_objid)
685 oti->oti_objid[req->rq_idx] = req->rq_oi.oi_oa->o_id;
687 loi->loi_id = req->rq_oi.oi_oa->o_id;
688 loi->loi_gr = req->rq_oi.oi_oa->o_gr;
689 loi->loi_ost_idx = req->rq_idx;
690 CDEBUG(D_INODE, "objid "LPX64" has subobj "LPX64"/"LPU64" at idx %d\n",
691 lsm->lsm_object_id, loi->loi_id, loi->loi_id, req->rq_idx);
/* move on to the next log cookie slot */
694 if (oti && set->set_cookies)
695 ++oti->oti_logcookies;
696 if (req->rq_oi.oi_oa->o_valid & OBD_MD_FLCOOKIE)
697 set->set_cookie_sent++;
/* Build the request set for a striped object create: the set takes the
 * stripe md from *lsmp and the obdo from src_oa, and the per-OST requests
 * are prepared by qos_prep_create(). lov_fini_create_set() is the visible
 * teardown call. */
702 int lov_prep_create_set(struct obd_export *exp, struct obd_info *oinfo,
703 struct lov_stripe_md **lsmp, struct obdo *src_oa,
704 struct obd_trans_info *oti,
705 struct lov_request_set **reqset)
707 struct lov_request_set *set;
711 OBD_ALLOC(set, sizeof(*set));
718 set->set_oi->oi_md = *lsmp;
719 set->set_oi->oi_oa = src_oa;
722 rc = qos_prep_create(exp, set);
724 lov_fini_create_set(set, lsmp);
/* Merge the attributes returned by the successful requests of a set into
 * the obdo of the set (set_oi->oi_oa). Merging happens in a temporary obdo
 * which then replaces the set obdo, keeping the original object id.
 * Nothing is merged when the set has no obdo or no request succeeded;
 * -ENOMEM is returned when the temporary obdo cannot be allocated. */
730 static int common_attr_done(struct lov_request_set *set)
732 struct list_head *pos;
733 struct lov_request *req;
735 int rc = 0, attrset = 0;
738 LASSERT(set->set_oi != NULL);
740 if (set->set_oi->oi_oa == NULL)
743 if (!set->set_success)
746 tmp_oa = obdo_alloc();
748 GOTO(out, rc = -ENOMEM);
750 list_for_each (pos, &set->set_list) {
751 req = list_entry(pos, struct lov_request, rq_link);
753 if (!req->rq_complete || req->rq_rc)
755 if (req->rq_oi.oi_oa->o_valid == 0) /* inactive stripe */
757 lov_merge_attrs(tmp_oa, req->rq_oi.oi_oa,
758 req->rq_oi.oi_oa->o_valid,
759 set->set_oi->oi_md, req->rq_stripe, &attrset);
762 CERROR("No stripes had valid attrs\n");
765 tmp_oa->o_id = set->set_oi->oi_oa->o_id;
766 memcpy(set->set_oi->oi_oa, tmp_oa, sizeof(*set->set_oi->oi_oa));
/* After a bulk read/write: for every request that completed without error
 * and returned a block count (OBD_MD_FLBLOCKS), store that count in the
 * lvb of the corresponding stripe. */
774 static int brw_done(struct lov_request_set *set)
776 struct lov_stripe_md *lsm = set->set_oi->oi_md;
777 struct lov_oinfo *loi = NULL;
778 struct list_head *pos;
779 struct lov_request *req;
782 list_for_each (pos, &set->set_list) {
783 req = list_entry(pos, struct lov_request, rq_link);
785 if (!req->rq_complete || req->rq_rc)
788 loi = &lsm->lsm_oinfo[req->rq_stripe];
790 if (req->rq_oi.oi_oa->o_valid & OBD_MD_FLBLOCKS)
791 loi->loi_lvb.lvb_blocks = req->rq_oi.oi_oa->o_blocks;
/* Finish a brw request set: post-process when any request completed, then
 * drop one reference on the set.
 * NOTE(review): the completion step is presumably brw_done() - confirm. */
797 int lov_fini_brw_set(struct lov_request_set *set)
804 LASSERT(set->set_exp);
805 if (set->set_completes) {
807 /* FIXME update qos data here */
809 if (atomic_dec_and_test(&set->set_refcount))
/* Build the request set for a striped bulk read/write of oa_bufs pages.
 * Pass 1 counts the pages that fall on each stripe. Pass 2 creates one
 * request per stripe with pages (an unconfigured or inactive target fails
 * the whole operation with -EIO), giving it a private obdo and md copy
 * and a contiguous window [rq_pgaidx, rq_pgaidx + rq_oabufs) in set_pga.
 * Pass 3 copies the caller pages into set_pga grouped by stripe and
 * rewrites each offset through lov_stripe_offset().
 * The temporary per-stripe info array is freed before returning. */
815 int lov_prep_brw_set(struct obd_export *exp, struct obd_info *oinfo,
816 obd_count oa_bufs, struct brw_page *pga,
817 struct obd_trans_info *oti,
818 struct lov_request_set **reqset)
825 struct lov_request_set *set;
826 struct lov_oinfo *loi = NULL;
827 struct lov_obd *lov = &exp->exp_obd->u.lov;
828 int rc = 0, i, shift;
831 OBD_ALLOC(set, sizeof(*set));
839 set->set_oabufs = oa_bufs;
840 OBD_ALLOC(set->set_pga, oa_bufs * sizeof(*set->set_pga));
842 GOTO(out, rc = -ENOMEM);
/* one bookkeeping slot per stripe */
844 OBD_ALLOC(info, sizeof(*info) * oinfo->oi_md->lsm_stripe_count);
846 GOTO(out, rc = -ENOMEM);
848 /* calculate the page count for each stripe */
849 for (i = 0; i < oa_bufs; i++) {
850 int stripe = lov_stripe_number(oinfo->oi_md, pga[i].off);
851 info[stripe].count++;
854 /* alloc and initialize lov request */
856 for (i = 0, loi = oinfo->oi_md->lsm_oinfo;
857 i < oinfo->oi_md->lsm_stripe_count; i++, loi++){
858 struct lov_request *req;
860 if (info[i].count == 0)
863 if (!lov->lov_tgts[loi->loi_ost_idx] ||
864 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
865 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
866 GOTO(out, rc = -EIO);
869 OBD_ALLOC(req, sizeof(*req));
871 GOTO(out, rc = -ENOMEM);
873 req->rq_oi.oi_oa = obdo_alloc();
874 if (req->rq_oi.oi_oa == NULL) {
875 OBD_FREE(req, sizeof(*req));
876 GOTO(out, rc = -ENOMEM);
/* start from the caller obdo, then retarget it at the sub-object */
880 memcpy(req->rq_oi.oi_oa, oinfo->oi_oa,
881 sizeof(*req->rq_oi.oi_oa));
883 req->rq_oi.oi_oa->o_id = loi->loi_id;
884 req->rq_oi.oi_oa->o_stripe_idx = i;
886 req->rq_buflen = sizeof(*req->rq_oi.oi_md);
887 OBD_ALLOC(req->rq_oi.oi_md, req->rq_buflen);
888 if (req->rq_oi.oi_md == NULL) {
889 obdo_free(req->rq_oi.oi_oa);
890 OBD_FREE(req, sizeof(*req));
891 GOTO(out, rc = -ENOMEM);
894 req->rq_idx = loi->loi_ost_idx;
897 /* XXX LOV STACKING */
898 req->rq_oi.oi_md->lsm_object_id = loi->loi_id;
899 req->rq_oi.oi_md->lsm_object_gr = oinfo->oi_md->lsm_object_gr;
/* shift is the running start index of this request inside set_pga */
900 req->rq_oabufs = info[i].count;
901 req->rq_pgaidx = shift;
902 shift += req->rq_oabufs;
904 /* remember the index for sort brw_page array */
905 info[i].index = req->rq_pgaidx;
907 req->rq_oi.oi_capa = oinfo->oi_capa;
909 lov_set_add_req(req, set);
912 GOTO(out, rc = -EIO);
914 /* rotate & sort the brw_page array */
915 for (i = 0; i < oa_bufs; i++) {
916 int stripe = lov_stripe_number(oinfo->oi_md, pga[i].off);
/* destination = start of the stripe window + pages already placed there */
918 shift = info[stripe].index + info[stripe].off;
919 LASSERT(shift < oa_bufs);
920 set->set_pga[shift] = pga[i];
921 lov_stripe_offset(oinfo->oi_md, pga[i].off, stripe,
922 &set->set_pga[shift].off);
927 OBD_FREE(info, sizeof(*info) * oinfo->oi_md->lsm_stripe_count);
932 lov_fini_brw_set(set);
/* Finish a getattr request set: when any request completed the per-stripe
 * attributes are merged by common_attr_done(); one reference on the set is
 * then dropped. */
937 int lov_fini_getattr_set(struct lov_request_set *set)
944 LASSERT(set->set_exp);
945 if (set->set_completes)
946 rc = common_attr_done(set);
948 if (atomic_dec_and_test(&set->set_refcount))
954 /* The callback for osc_getattr_async that finalizes a request info when a
955 * response is received. */
/* oinfo is embedded in a lov_request as rq_oi; recover the request with
 * container_of() and hand the result to lov_update_common_set(). */
956 static int cb_getattr_update(struct obd_info *oinfo, int rc)
958 struct lov_request *lovreq;
959 lovreq = container_of(oinfo, struct lov_request, rq_oi);
960 return lov_update_common_set(lovreq->rq_rqset, lovreq, rc);
/* Build the request set for a striped getattr. Every stripe has its target
 * state checked; the request built for a stripe carries a copy of the
 * caller obdo retargeted at the sub-object id, the getattr completion
 * callback and the caller capability.
 * Fails with -ENOMEM on allocation failure and with -EIO when no request
 * could be queued at all. */
963 int lov_prep_getattr_set(struct obd_export *exp, struct obd_info *oinfo,
964 struct lov_request_set **reqset)
966 struct lov_request_set *set;
967 struct lov_oinfo *loi = NULL;
968 struct lov_obd *lov = &exp->exp_obd->u.lov;
972 OBD_ALLOC(set, sizeof(*set));
980 loi = oinfo->oi_md->lsm_oinfo;
981 for (i = 0; i < oinfo->oi_md->lsm_stripe_count; i++, loi++) {
982 struct lov_request *req;
984 if (!lov->lov_tgts[loi->loi_ost_idx] ||
985 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
986 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
990 OBD_ALLOC(req, sizeof(*req));
992 GOTO(out_set, rc = -ENOMEM);
995 req->rq_idx = loi->loi_ost_idx;
997 req->rq_oi.oi_oa = obdo_alloc();
998 if (req->rq_oi.oi_oa == NULL) {
999 OBD_FREE(req, sizeof(*req));
1000 GOTO(out_set, rc = -ENOMEM);
1002 memcpy(req->rq_oi.oi_oa, oinfo->oi_oa,
1003 sizeof(*req->rq_oi.oi_oa));
1004 req->rq_oi.oi_oa->o_id = loi->loi_id;
1005 req->rq_oi.oi_cb_up = cb_getattr_update;
1006 req->rq_oi.oi_capa = oinfo->oi_capa;
/* back pointer used by the callback to find the owning set */
1007 req->rq_rqset = set;
1009 lov_set_add_req(req, set);
1011 if (!set->set_count)
1012 GOTO(out_set, rc = -EIO);
1016 lov_fini_getattr_set(set);
/* Finish a destroy request set: drop one reference and free the set with
 * lov_finish_set() when that was the last one. */
1020 int lov_fini_destroy_set(struct lov_request_set *set)
1026 LASSERT(set->set_exp);
1027 if (set->set_completes) {
1028 /* FIXME update qos data here */
1031 if (atomic_dec_and_test(&set->set_refcount))
1032 lov_finish_set(set);
/* Build the request set for destroying a striped object. The set borrows
 * oinfo, pointing it at lsm and src_oa, and remembers the log cookies of
 * oti when src_oa carries OBD_MD_FLCOOKIE. Every stripe has its target
 * state checked; the request built for a stripe holds a copy of src_oa
 * retargeted at the sub-object id.
 * Fails with -ENOMEM on allocation failure and with -EIO when no request
 * could be queued. */
1037 int lov_prep_destroy_set(struct obd_export *exp, struct obd_info *oinfo,
1038 struct obdo *src_oa, struct lov_stripe_md *lsm,
1039 struct obd_trans_info *oti,
1040 struct lov_request_set **reqset)
1042 struct lov_request_set *set;
1043 struct lov_oinfo *loi = NULL;
1044 struct lov_obd *lov = &exp->exp_obd->u.lov;
1048 OBD_ALLOC(set, sizeof(*set));
1054 set->set_oi = oinfo;
1055 set->set_oi->oi_md = lsm;
1056 set->set_oi->oi_oa = src_oa;
1058 if (oti != NULL && src_oa->o_valid & OBD_MD_FLCOOKIE)
1059 set->set_cookies = oti->oti_logcookies;
1061 loi = lsm->lsm_oinfo;
1062 for (i = 0; i < lsm->lsm_stripe_count; i++, loi++) {
1063 struct lov_request *req;
1065 if (!lov->lov_tgts[loi->loi_ost_idx] ||
1066 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
1067 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
1071 OBD_ALLOC(req, sizeof(*req));
1073 GOTO(out_set, rc = -ENOMEM);
1076 req->rq_idx = loi->loi_ost_idx;
1078 req->rq_oi.oi_oa = obdo_alloc();
1079 if (req->rq_oi.oi_oa == NULL) {
1080 OBD_FREE(req, sizeof(*req));
1081 GOTO(out_set, rc = -ENOMEM);
1083 memcpy(req->rq_oi.oi_oa, src_oa, sizeof(*req->rq_oi.oi_oa));
1084 req->rq_oi.oi_oa->o_id = loi->loi_id;
1085 lov_set_add_req(req, set);
1087 if (!set->set_count)
1088 GOTO(out_set, rc = -EIO);
1092 lov_fini_destroy_set(set);
/* Finish a setattr request set: when any request completed the returned
 * attributes are merged by common_attr_done(); then one reference is
 * dropped and the set is freed on the last put. */
1096 int lov_fini_setattr_set(struct lov_request_set *set)
1103 LASSERT(set->set_exp);
1104 if (set->set_completes) {
1105 rc = common_attr_done(set);
1106 /* FIXME update qos data here */
1109 if (atomic_dec_and_test(&set->set_refcount))
1110 lov_finish_set(set);
/* Record the result rc of one per-stripe setattr. After lov_update_set() a
 * failure on an unconfigured or inactive target is special-cased, and the
 * ctime, mtime and atime flagged valid in the reply obdo are copied into
 * the lvb of the stripe. */
1114 int lov_update_setattr_set(struct lov_request_set *set,
1115 struct lov_request *req, int rc)
1117 struct lov_obd *lov = &req->rq_rqset->set_exp->exp_obd->u.lov;
1118 struct lov_stripe_md *lsm = req->rq_rqset->set_oi->oi_md;
1121 lov_update_set(set, req, rc);
1123 /* grace error on inactive ost */
1124 if (rc && !(lov->lov_tgts[req->rq_idx] &&
1125 lov->lov_tgts[req->rq_idx]->ltd_active))
/* each timestamp is copied only if its OBD_MD_FL*TIME bit is set */
1129 if (req->rq_oi.oi_oa->o_valid & OBD_MD_FLCTIME)
1130 lsm->lsm_oinfo[req->rq_stripe].loi_lvb.lvb_ctime =
1131 req->rq_oi.oi_oa->o_ctime;
1132 if (req->rq_oi.oi_oa->o_valid & OBD_MD_FLMTIME)
1133 lsm->lsm_oinfo[req->rq_stripe].loi_lvb.lvb_mtime =
1134 req->rq_oi.oi_oa->o_mtime;
1135 if (req->rq_oi.oi_oa->o_valid & OBD_MD_FLATIME)
1136 lsm->lsm_oinfo[req->rq_stripe].loi_lvb.lvb_atime =
1137 req->rq_oi.oi_oa->o_atime;
1143 /* The callback for osc_setattr_async that finalizes a request info when a
1144 * response is received. */
/* oinfo is embedded in a lov_request as rq_oi; recover the request with
 * container_of() and hand the result to lov_update_setattr_set(). */
1145 static int cb_setattr_update(struct obd_info *oinfo, int rc)
1147 struct lov_request *lovreq;
1148 lovreq = container_of(oinfo, struct lov_request, rq_oi);
1149 return lov_update_setattr_set(lovreq->rq_rqset, lovreq, rc);
/* Build the request set for a striped setattr. The set borrows oinfo and
 * remembers the log cookies of oti when the obdo carries OBD_MD_FLCOOKIE.
 * Every stripe has its target state checked; the request built for a
 * stripe holds a copy of the caller obdo retargeted at the sub-object, the
 * setattr callback and the caller capability. When a size is being set it
 * is translated per stripe with lov_stripe_offset().
 * Fails with -ENOMEM on allocation failure and with -EIO when no request
 * could be queued. */
1152 int lov_prep_setattr_set(struct obd_export *exp, struct obd_info *oinfo,
1153 struct obd_trans_info *oti,
1154 struct lov_request_set **reqset)
1156 struct lov_request_set *set;
1157 struct lov_oinfo *loi = NULL;
1158 struct lov_obd *lov = &exp->exp_obd->u.lov;
1162 OBD_ALLOC(set, sizeof(*set));
1169 set->set_oi = oinfo;
1170 if (oti != NULL && oinfo->oi_oa->o_valid & OBD_MD_FLCOOKIE)
1171 set->set_cookies = oti->oti_logcookies;
1173 loi = oinfo->oi_md->lsm_oinfo;
1174 for (i = 0; i < oinfo->oi_md->lsm_stripe_count; i++, loi++) {
1175 struct lov_request *req;
1177 if (!lov->lov_tgts[loi->loi_ost_idx] ||
1178 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
1179 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
1183 OBD_ALLOC(req, sizeof(*req));
1185 GOTO(out_set, rc = -ENOMEM);
1187 req->rq_idx = loi->loi_ost_idx;
1189 req->rq_oi.oi_oa = obdo_alloc();
1190 if (req->rq_oi.oi_oa == NULL) {
1191 OBD_FREE(req, sizeof(*req));
1192 GOTO(out_set, rc = -ENOMEM);
1194 memcpy(req->rq_oi.oi_oa, oinfo->oi_oa,
1195 sizeof(*req->rq_oi.oi_oa));
1196 req->rq_oi.oi_oa->o_id = loi->loi_id;
/* if a group is flagged valid it must be a positive group number */
1197 LASSERT(!(req->rq_oi.oi_oa->o_valid & OBD_MD_FLGROUP)
1198 || req->rq_oi.oi_oa->o_gr>0);
1199 req->rq_oi.oi_oa->o_stripe_idx = i;
1200 req->rq_oi.oi_cb_up = cb_setattr_update;
1201 req->rq_oi.oi_capa = oinfo->oi_capa;
1202 req->rq_rqset = set;
1204 if (oinfo->oi_oa->o_valid & OBD_MD_FLSIZE) {
/* the per-stripe size is written straight into the request obdo */
1205 int off = lov_stripe_offset(oinfo->oi_md,
1206 oinfo->oi_oa->o_size, i,
1207 &req->rq_oi.oi_oa->o_size);
/* NOTE(review): a negative return presumably means the file size lies
 * before this stripe chunk, hence the decrement - confirm against
 * lov_stripe_offset() */
1209 if (off < 0 && req->rq_oi.oi_oa->o_size)
1210 req->rq_oi.oi_oa->o_size--;
1212 CDEBUG(D_INODE, "stripe %d has size "LPU64"/"LPU64"\n",
1213 i, req->rq_oi.oi_oa->o_size,
1214 oinfo->oi_oa->o_size);
1216 lov_set_add_req(req, set);
1218 if (!set->set_count)
1219 GOTO(out_set, rc = -EIO);
1223 lov_fini_setattr_set(set);
/* Finish a punch (truncate) request set: a set in which requests completed
 * but none succeeded is treated specially, then one reference is dropped
 * and the set is freed on the last put.
 * NOTE(review): the error code used for the no-success case should be
 * confirmed against the full body. */
1227 int lov_fini_punch_set(struct lov_request_set *set)
1234 LASSERT(set->set_exp);
1235 if (set->set_completes) {
1236 if (!set->set_success)
1238 /* FIXME update qos data here */
1241 if (atomic_dec_and_test(&set->set_refcount))
1242 lov_finish_set(set);
1247 /* The callback for osc_punch that finalizes a request info when a response is received. */
/* oinfo is embedded in a lov_request as rq_oi; recover the request with
 * container_of() and hand the result to lov_update_common_set(). */
1249 static int cb_update_punch(struct obd_info *oinfo, int rc)
1251 struct lov_request *lovreq;
1252 lovreq = container_of(oinfo, struct lov_request, rq_oi);
1253 return lov_update_common_set(lovreq->rq_rqset, lovreq, rc);
/* Build the request set for a striped punch (truncate) over the extent in
 * oinfo->oi_policy. Each stripe is checked against the state of its target
 * and against that extent. A request holds a copy of the caller obdo
 * retargeted at the sub-object id and group, the punch callback, the
 * per-stripe extent (rs, re) and the caller capability.
 * Fails with -ENOMEM on allocation failure and with -EIO when no request
 * could be queued. */
1256 int lov_prep_punch_set(struct obd_export *exp, struct obd_info *oinfo,
1257 struct obd_trans_info *oti,
1258 struct lov_request_set **reqset)
1260 struct lov_request_set *set;
1261 struct lov_oinfo *loi = NULL;
1262 struct lov_obd *lov = &exp->exp_obd->u.lov;
1266 OBD_ALLOC(set, sizeof(*set));
1271 set->set_oi = oinfo;
1274 loi = oinfo->oi_md->lsm_oinfo;
1275 for (i = 0; i < oinfo->oi_md->lsm_stripe_count; i++, loi++) {
1276 struct lov_request *req;
1279 if (!lov->lov_tgts[loi->loi_ost_idx] ||
1280 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
1281 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
1285 if (!lov_stripe_intersects(oinfo->oi_md, i,
1286 oinfo->oi_policy.l_extent.start,
1287 oinfo->oi_policy.l_extent.end,
1291 OBD_ALLOC(req, sizeof(*req));
1293 GOTO(out_set, rc = -ENOMEM);
1295 req->rq_idx = loi->loi_ost_idx;
1297 req->rq_oi.oi_oa = obdo_alloc();
1298 if (req->rq_oi.oi_oa == NULL) {
1299 OBD_FREE(req, sizeof(*req));
1300 GOTO(out_set, rc = -ENOMEM);
1302 memcpy(req->rq_oi.oi_oa, oinfo->oi_oa,
1303 sizeof(*req->rq_oi.oi_oa));
1304 req->rq_oi.oi_oa->o_id = loi->loi_id;
1305 req->rq_oi.oi_oa->o_gr = loi->loi_gr;
1306 req->rq_oi.oi_oa->o_valid |= OBD_MD_FLGROUP;
1308 req->rq_oi.oi_oa->o_stripe_idx = i;
1309 req->rq_oi.oi_cb_up = cb_update_punch;
1310 req->rq_rqset = set;
/* rs and re hold the part of the extent that falls on this stripe */
1312 req->rq_oi.oi_policy.l_extent.start = rs;
1313 req->rq_oi.oi_policy.l_extent.end = re;
1314 req->rq_oi.oi_policy.l_extent.gid = -1;
1316 req->rq_oi.oi_capa = oinfo->oi_capa;
1318 lov_set_add_req(req, set);
1320 if (!set->set_count)
1321 GOTO(out_set, rc = -EIO);
1325 lov_fini_punch_set(set);
/* Finish a sync request set: a set in which requests completed but none
 * succeeded is treated specially, then one reference is dropped and the
 * set is freed on the last put.
 * NOTE(review): the error code used for the no-success case should be
 * confirmed against the full body. */
1329 int lov_fini_sync_set(struct lov_request_set *set)
1336 LASSERT(set->set_exp);
1337 if (set->set_completes) {
1338 if (!set->set_success)
1340 /* FIXME update qos data here */
1343 if (atomic_dec_and_test(&set->set_refcount))
1344 lov_finish_set(set);
/* Build the request set for syncing the byte range [start, end] of a
 * striped object. The set borrows oinfo, pointing it at lsm and src_oa.
 * Each stripe is checked against the state of its target and against the
 * range. A request holds a copy of src_oa retargeted at the sub-object
 * and the per-stripe extent (rs, re).
 * Fails with -ENOMEM on allocation failure and with -EIO when no request
 * could be queued. */
1349 int lov_prep_sync_set(struct obd_export *exp, struct obd_info *oinfo,
1350 struct obdo *src_oa, struct lov_stripe_md *lsm,
1351 obd_off start, obd_off end,
1352 struct lov_request_set **reqset)
1354 struct lov_request_set *set;
1355 struct lov_oinfo *loi = NULL;
1356 struct lov_obd *lov = &exp->exp_obd->u.lov;
1360 OBD_ALLOC(set, sizeof(*set));
1366 set->set_oi = oinfo;
1367 set->set_oi->oi_md = lsm;
1368 set->set_oi->oi_oa = src_oa;
1370 loi = lsm->lsm_oinfo;
1371 for (i = 0; i < lsm->lsm_stripe_count; i++, loi++) {
1372 struct lov_request *req;
1375 if (!lov->lov_tgts[loi->loi_ost_idx] ||
1376 !lov->lov_tgts[loi->loi_ost_idx]->ltd_active) {
1377 CDEBUG(D_HA, "lov idx %d inactive\n", loi->loi_ost_idx);
1381 if (!lov_stripe_intersects(lsm, i, start, end, &rs, &re))
1384 OBD_ALLOC(req, sizeof(*req));
1386 GOTO(out_set, rc = -ENOMEM);
1388 req->rq_idx = loi->loi_ost_idx;
1390 req->rq_oi.oi_oa = obdo_alloc();
1391 if (req->rq_oi.oi_oa == NULL) {
1392 OBD_FREE(req, sizeof(*req));
1393 GOTO(out_set, rc = -ENOMEM);
1395 memcpy(req->rq_oi.oi_oa, src_oa, sizeof(*req->rq_oi.oi_oa));
1396 req->rq_oi.oi_oa->o_id = loi->loi_id;
1397 req->rq_oi.oi_oa->o_stripe_idx = i;
/* rs and re were filled in by lov_stripe_intersects() above */
1399 req->rq_oi.oi_policy.l_extent.start = rs;
1400 req->rq_oi.oi_policy.l_extent.end = re;
1401 req->rq_oi.oi_policy.l_extent.gid = -1;
1403 lov_set_add_req(req, set);
1405 if (!set->set_count)
1406 GOTO(out_set, rc = -EIO);
1410 lov_fini_sync_set(set);
/* Helpers for summing 64-bit statfs counters without wrap-around:
 * LOV_U64_MAX is the all-ones __u64 value, and LOV_SUM_MAX sets tot to it
 * when adding add to tot would overflow. Both arguments are evaluated more
 * than once, so they must be free of side effects. */
1414 #define LOV_U64_MAX ((__u64)~0ULL)
1415 #define LOV_SUM_MAX(tot, add) \
1417 if ((tot) + (add) < (tot)) \
1418 (tot) = LOV_U64_MAX; \
/* Finalize an aggregated statfs result. The summed file counters os_files
 * and os_ffree are divided by the stripe count from lov_get_stripecnt(),
 * unless they saturated at LOV_U64_MAX. The result is then cached in
 * obd->obd_osfs, stamped with the current jiffies, under obd_osfs_lock. */
1423 int lov_fini_statfs(struct obd_device *obd, struct obd_statfs *osfs,int success)
1428 __u32 expected_stripes = lov_get_stripecnt(&obd->u.lov, 0);
/* a saturated counter is left at its maximum instead of being scaled */
1430 if (osfs->os_files != LOV_U64_MAX)
1431 do_div(osfs->os_files, expected_stripes);
1432 if (osfs->os_ffree != LOV_U64_MAX)
1433 do_div(osfs->os_ffree, expected_stripes);
1435 spin_lock(&obd->obd_osfs_lock);
1436 memcpy(&obd->obd_osfs, osfs, sizeof(*osfs));
1437 obd->obd_osfs_age = get_jiffies_64();
1438 spin_unlock(&obd->obd_osfs_lock);
/* Finish a statfs request set: when any request completed the aggregate is
 * finalized by lov_fini_statfs(); then one reference is dropped and the
 * set is freed on the last put. */
1445 int lov_fini_statfs_set(struct lov_request_set *set)
1453 if (set->set_completes) {
1454 rc = lov_fini_statfs(set->set_obd, set->set_oi->oi_osfs,
1458 if (atomic_dec_and_test(&set->set_refcount))
1459 lov_finish_set(set);
/* Fold the statfs reply lov_sfs of one target into the aggregate osfs.
 * The reply is first cached in obd->obd_osfs (with a fresh timestamp)
 * under obd_osfs_lock. The aggregate is either seeded with a plain copy of
 * the reply or updated field by field: block counters are summed (with an
 * alternative minimum-available policy, see the Sandia note) and the file
 * counters are summed with saturation.
 * NOTE(review): which branch runs presumably depends on success being
 * zero for the first reply - confirm against the full body. */
1464 void lov_update_statfs(struct obd_device *obd, struct obd_statfs *osfs,
1465 struct obd_statfs *lov_sfs, int success)
1467 spin_lock(&obd->obd_osfs_lock);
1468 memcpy(&obd->obd_osfs, lov_sfs, sizeof(*lov_sfs));
1469 obd->obd_osfs_age = get_jiffies_64();
1470 spin_unlock(&obd->obd_osfs_lock);
1473 memcpy(osfs, lov_sfs, sizeof(*lov_sfs));
1476 /* Sandia requested that df (and so, statfs) only
1477 returned minimal available space on
1478 a single OST, so people would be able to
1479 write this much data guaranteed. */
1480 if (osfs->os_bavail > lov_sfs->os_bavail) {
1481 /* Presumably if new bavail is smaller,
1482 new bfree is bigger as well */
1483 osfs->os_bfree = lov_sfs->os_bfree;
1484 osfs->os_bavail = lov_sfs->os_bavail;
1487 osfs->os_bfree += lov_sfs->os_bfree;
1488 osfs->os_bavail += lov_sfs->os_bavail;
1490 osfs->os_blocks += lov_sfs->os_blocks;
1491 /* XXX not sure about this one - depends on policy.
1492 * - could be minimum if we always stripe on all OBDs
1493 * (but that would be wrong for any other policy,
1494 * if one of the OBDs has no more objects left)
1495 * - could be sum if we stripe whole objects
1496 * - could be average, just to give a nice number
1498 * To give a "reasonable" (if not wholly accurate)
1499 * number, we divide the total number of free objects
1500 * by expected stripe count (watch out for overflow).
1502 LOV_SUM_MAX(osfs->os_files, lov_sfs->os_files);
1503 LOV_SUM_MAX(osfs->os_ffree, lov_sfs->os_ffree);
1507 /* The callback for osc_statfs_async that finalizes a request info when a
1508 * response is received. */
/* Per-target statfs completion. The owning lov_request is recovered from
 * oinfo with container_of(); obd is the device behind the export of the
 * target that answered. The success count is sampled before this result
 * is recorded, so it reflects the replies folded in earlier. A failure on
 * an unconfigured or inactive target is special-cased, and the reply is
 * merged into the aggregate by lov_update_statfs(). */
1509 static int cb_statfs_update(struct obd_info *oinfo, int rc)
1511 struct lov_request *lovreq;
1512 struct obd_statfs *osfs, *lov_sfs;
1513 struct obd_device *obd;
1514 struct lov_obd *lov;
1518 lovreq = container_of(oinfo, struct lov_request, rq_oi);
1519 lov = &lovreq->rq_rqset->set_obd->u.lov;
1520 obd = class_exp2obd(lov->lov_tgts[lovreq->rq_idx]->ltd_exp);
/* osfs is the shared aggregate, lov_sfs the reply of this one target */
1522 osfs = lovreq->rq_rqset->set_oi->oi_osfs;
1523 lov_sfs = oinfo->oi_osfs;
1525 success = lovreq->rq_rqset->set_success;
1527 /* XXX: the same is done in lov_update_common_set, however
1528 lovset->set_exp is not initialized. */
1529 lov_update_set(lovreq->rq_rqset, lovreq, rc);
1531 if (rc && !(lov->lov_tgts[lovreq->rq_idx] &&
1532 lov->lov_tgts[lovreq->rq_idx]->ltd_active))
1537 lov_update_statfs(obd, osfs, lov_sfs, success);
/* Build the request set for a statfs over the configured targets (up to
 * desc.ld_tgt_count), checking the state of each one. A request owns a
 * private obd_statfs buffer for the reply and uses cb_statfs_update as its
 * completion callback.
 * Fails with -ENOMEM on allocation failure and with -EIO when no request
 * could be queued. */
1541 int lov_prep_statfs_set(struct obd_device *obd, struct obd_info *oinfo,
1542 struct lov_request_set **reqset)
1544 struct lov_request_set *set;
1545 struct lov_obd *lov = &obd->u.lov;
1549 OBD_ALLOC(set, sizeof(*set));
1555 set->set_oi = oinfo;
1557 /* We only get block data from the OBD */
1558 for (i = 0; i < lov->desc.ld_tgt_count; i++) {
1559 struct lov_request *req;
1561 if (!lov->lov_tgts[i] || !lov->lov_tgts[i]->ltd_active) {
1562 CDEBUG(D_HA, "lov idx %d inactive\n", i);
1566 OBD_ALLOC(req, sizeof(*req));
1568 GOTO(out_set, rc = -ENOMEM);
/* per-request reply buffer, released again in lov_finish_set() */
1570 OBD_ALLOC(req->rq_oi.oi_osfs, sizeof(*req->rq_oi.oi_osfs));
1571 if (req->rq_oi.oi_osfs == NULL) {
1572 OBD_FREE(req, sizeof(*req));
1573 GOTO(out_set, rc = -ENOMEM);
1577 req->rq_oi.oi_cb_up = cb_statfs_update;
1578 req->rq_rqset = set;
1580 lov_set_add_req(req, set);
1582 if (!set->set_count)
1583 GOTO(out_set, rc = -EIO);
1587 lov_fini_statfs_set(set);