4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; if not, write to the
18 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
19 * Boston, MA 021110-1307, USA
24 * Copyright (c) 2012, Intel Corporation.
25 * Use is subject to license terms.
27 * Author: Johann Lombardi <johann.lombardi@intel.com>
28 * Author: Niu Yawei <yawei.niu@intel.com>
31 #define DEBUG_SUBSYSTEM S_LQUOTA
33 #include <obd_class.h>
34 #include "qmt_internal.h"
37 * Retrieve quota settings for a given identifier.
39 * \param env - is the environment passed by the caller
40 * \param qmt - is the quota master target
41 * \param pool_id - is the 16-bit pool identifier
42 * \param restype - is the pool type, either block (i.e. LQUOTA_RES_DT) or inode
43 * (i.e. LQUOTA_RES_MD)
44 * \param qtype - is the quota type
45 * \param id - is the quota indentifier for which we want to acces quota
47 * \param hard - is the output variable where to copy the hard limit
48 * \param soft - is the output variable where to copy the soft limit
49 * \param time - is the output variable where to copy the grace time
51 static int qmt_get(const struct lu_env *env, struct qmt_device *qmt,
52 __u16 pool_id, __u8 restype, __u8 qtype, union lquota_id *id,
53 __u64 *hard, __u64 *soft, __u64 *time)
55 struct lquota_entry *lqe;
58 /* look-up lqe structure containing quota settings */
59 lqe = qmt_pool_lqe_lookup(env, qmt, pool_id, restype, qtype, id);
63 /* copy quota settings */
65 LQUOTA_DEBUG(lqe, "fetch settings");
67 *hard = lqe->lqe_hardlimit;
69 *soft = lqe->lqe_softlimit;
71 *time = lqe->lqe_gracetime;
79 * Update quota settings for a given identifier.
81 * \param env - is the environment passed by the caller
82 * \param qmt - is the quota master target
83 * \param pool_id - is the 16-bit pool identifier
84 * \param restype - is the pool type, either block (i.e. LQUOTA_RES_DT) or inode
85 * (i.e. LQUOTA_RES_MD)
86 * \param qtype - is the quota type
87 * \param id - is the quota indentifier for which we want to modify quota
89 * \param hard - is the new hard limit
90 * \param soft - is the new soft limit
91 * \param time - is the new grace time
92 * \param valid - is the list of settings to change
94 static int qmt_set(const struct lu_env *env, struct qmt_device *qmt,
95 __u16 pool_id, __u8 restype, __u8 qtype,
96 union lquota_id *id, __u64 hard, __u64 soft, __u64 time,
99 struct qmt_thread_info *qti = qmt_info(env);
100 struct lquota_entry *lqe;
101 struct thandle *th = NULL;
103 bool dirtied = false;
107 /* look-up quota entry associated with this ID */
108 lqe = qmt_pool_lqe_lookup(env, qmt, pool_id, restype, qtype, id);
110 RETURN(PTR_ERR(lqe));
112 /* allocate & start transaction with enough credits to update quota
113 * settings in the global index file */
114 th = qmt_trans_start(env, lqe, &qti->qti_restore);
116 GOTO(out_nolock, rc = PTR_ERR(th));
118 now = cfs_time_current_sec();
121 LQUOTA_DEBUG(lqe, "changing quota settings valid:%x hard:"LPU64" soft:"
122 LPU64" time:"LPU64, valid, hard, soft, time);
124 if ((valid & QIF_TIMES) != 0 && lqe->lqe_gracetime != time) {
125 /* change time settings */
126 lqe->lqe_gracetime = time;
130 if ((valid & QIF_LIMITS) != 0 &&
131 (lqe->lqe_hardlimit != hard || lqe->lqe_softlimit != soft)) {
132 rc = qmt_validate_limits(lqe, hard, soft);
136 /* recompute qunit in case it was never initialized */
137 qmt_revalidate(env, lqe);
139 /* change quota limits */
140 lqe->lqe_hardlimit = hard;
141 lqe->lqe_softlimit = soft;
143 /* clear grace time */
144 if (lqe->lqe_softlimit == 0 ||
145 lqe->lqe_granted <= lqe->lqe_softlimit)
146 /* no soft limit or below soft limit, let's clear grace
148 lqe->lqe_gracetime = 0;
149 else if ((valid & QIF_TIMES) == 0)
150 /* set grace only if user hasn't provided his own */
151 lqe->lqe_gracetime = now + qmt_lqe_grace(lqe);
153 /* change enforced status based on new parameters */
154 if (lqe->lqe_hardlimit == 0 && lqe->lqe_softlimit == 0)
155 lqe->lqe_enforced = false;
157 lqe->lqe_enforced = true;
163 /* write new quota settings to disk */
164 rc = qmt_glb_write(env, th, lqe, LQUOTA_BUMP_VER, &ver);
166 /* restore initial quota settings */
167 qmt_restore(lqe, &qti->qti_restore);
171 /* compute new qunit value now that we have modified the quota
173 qmt_adjust_qunit(env, lqe);
175 /* clear/set edquot flag as needed */
176 qmt_adjust_edquot(lqe, now);
180 lqe_write_unlock(lqe);
184 if (th != NULL && !IS_ERR(th))
185 dt_trans_stop(env, qmt->qmt_child, th);
187 if (rc == 0 && dirtied)
188 qmt_glb_lock_notify(env, lqe, ver);
194 * Handle quotactl request.
196 * \param env - is the environment passed by the caller
197 * \param ld - is the lu device associated with the qmt
198 * \param oqctl - is the quotactl request
200 static int qmt_quotactl(const struct lu_env *env, struct lu_device *ld,
201 struct obd_quotactl *oqctl)
203 struct qmt_thread_info *qti = qmt_info(env);
204 union lquota_id *id = &qti->qti_id;
205 struct qmt_device *qmt = lu2qmt_dev(ld);
206 struct obd_dqblk *dqb = &oqctl->qc_dqblk;
210 LASSERT(qmt != NULL);
212 if (oqctl->qc_type >= LL_MAXQUOTAS)
213 /* invalid quota type */
216 switch (oqctl->qc_cmd) {
218 case Q_GETINFO: /* read grace times */
219 /* Global grace time is stored in quota settings of ID 0. */
222 /* read inode grace time */
223 rc = qmt_get(env, qmt, 0, LQUOTA_RES_MD, oqctl->qc_type, id,
224 NULL, NULL, &oqctl->qc_dqinfo.dqi_igrace);
228 /* read block grace time */
229 rc = qmt_get(env, qmt, 0, LQUOTA_RES_DT, oqctl->qc_type, id,
230 NULL, NULL, &oqctl->qc_dqinfo.dqi_bgrace);
233 case Q_SETINFO: /* modify grace times */
234 /* setinfo should be using dqi->dqi_valid, but lfs incorrectly
235 * sets the valid flags in dqb->dqb_valid instead, try to live
238 /* Global grace time is stored in quota settings of ID 0. */
241 if ((dqb->dqb_valid & QIF_ITIME) != 0) {
242 /* set inode grace time */
243 rc = qmt_set(env, qmt, 0, LQUOTA_RES_MD, oqctl->qc_type,
244 id, 0, 0, oqctl->qc_dqinfo.dqi_igrace,
250 if ((dqb->dqb_valid & QIF_BTIME) != 0)
251 /* set block grace time */
252 rc = qmt_set(env, qmt, 0, LQUOTA_RES_DT, oqctl->qc_type,
253 id, 0, 0, oqctl->qc_dqinfo.dqi_bgrace,
257 case Q_GETQUOTA: /* consult quota limit */
258 /* There is no quota limit for root user & group */
259 if (oqctl->qc_id == 0) {
260 memset(dqb, 0, sizeof(*dqb));
261 dqb->dqb_valid = QIF_LIMITS | QIF_TIMES;
264 /* extract quota ID from quotactl request */
265 id->qid_uid = oqctl->qc_id;
267 /* look-up inode quota settings */
268 rc = qmt_get(env, qmt, 0, LQUOTA_RES_MD, oqctl->qc_type, id,
269 &dqb->dqb_ihardlimit, &dqb->dqb_isoftlimit,
274 dqb->dqb_valid |= QIF_ILIMITS | QIF_ITIME;
275 /* master isn't aware of actual inode usage */
276 dqb->dqb_curinodes = 0;
278 /* look-up block quota settings */
279 rc = qmt_get(env, qmt, 0, LQUOTA_RES_DT, oqctl->qc_type, id,
280 &dqb->dqb_bhardlimit, &dqb->dqb_bsoftlimit,
285 dqb->dqb_valid |= QIF_BLIMITS | QIF_BTIME;
286 /* master doesn't know the actual block usage */
287 dqb->dqb_curspace = 0;
290 case Q_SETQUOTA: /* change quota limits */
291 if (oqctl->qc_id == 0)
292 /* can't enforce a quota limit for root user & group */
294 /* extract quota ID from quotactl request */
295 id->qid_uid = oqctl->qc_id;
297 if ((dqb->dqb_valid & QIF_IFLAGS) != 0) {
298 /* update inode quota settings */
299 rc = qmt_set(env, qmt, 0, LQUOTA_RES_MD, oqctl->qc_type,
300 id, dqb->dqb_ihardlimit,
301 dqb->dqb_isoftlimit, dqb->dqb_itime,
302 dqb->dqb_valid & QIF_IFLAGS);
307 if ((dqb->dqb_valid & QIF_BFLAGS) != 0)
308 /* update block quota settings */
309 rc = qmt_set(env, qmt, 0, LQUOTA_RES_DT, oqctl->qc_type,
310 id, dqb->dqb_bhardlimit,
311 dqb->dqb_bsoftlimit, dqb->dqb_btime,
312 dqb->dqb_valid & QIF_BFLAGS);
316 CERROR("%s: unsupported quotactl command: %d\n",
317 qmt->qmt_svname, oqctl->qc_cmd);
325 * Helper function to handle quota request from slave.
327 * \param env - is the environment passed by the caller
328 * \param lqe - is the lquota_entry subject to the quota request
329 * \param qmt - is the master device
330 * \param uuid - is the uuid associated with the slave
331 * \param qb_flags - are the quota request flags as packed in the quota_body
332 * \param qb_count - is the amount of quota space the slave wants to
334 * \param qb_usage - is the current space usage on the slave
335 * \param repbody - is the quota_body of reply
337 * \retval 0 : success
338 * \retval -EDQUOT : out of quota
339 * -EINPROGRESS : inform client to retry write/create
340 * -ve : other appropriate errors
342 int qmt_dqacq0(const struct lu_env *env, struct lquota_entry *lqe,
343 struct qmt_device *qmt, struct obd_uuid *uuid, __u32 qb_flags,
344 __u64 qb_count, __u64 qb_usage, struct quota_body *repbody)
346 struct qmt_thread_info *qti = qmt_info(env);
348 struct dt_object *slv_obj = NULL;
349 __u64 slv_granted, slv_granted_bck;
350 struct thandle *th = NULL;
354 LASSERT(uuid != NULL);
356 /* initialize reply */
357 memset(repbody, 0, sizeof(*repbody));
358 memcpy(&repbody->qb_id, &lqe->lqe_id, sizeof(repbody->qb_id));
360 if (OBD_FAIL_CHECK(OBD_FAIL_QUOTA_RECOVERABLE_ERR))
361 RETURN(-cfs_fail_val);
363 /* look-up index file associated with acquiring slave */
364 slv_obj = lquota_disk_slv_find(env, qmt->qmt_child, LQE_ROOT(lqe),
365 lu_object_fid(&LQE_GLB_OBJ(lqe)->do_lu),
368 GOTO(out, rc = PTR_ERR(slv_obj));
370 /* pack slave fid in reply just for sanity check */
371 memcpy(&repbody->qb_slv_fid, lu_object_fid(&slv_obj->do_lu),
372 sizeof(struct lu_fid));
374 /* allocate & start transaction with enough credits to update
375 * global & slave indexes */
376 th = qmt_trans_start_with_slv(env, lqe, slv_obj, &qti->qti_restore);
378 GOTO(out, rc = PTR_ERR(th));
381 LQUOTA_DEBUG(lqe, "dqacq starts uuid:%s flags:0x%x wanted:"LPU64
382 " usage:"LPU64, obd_uuid2str(uuid), qb_flags, qb_count,
385 /* Legal race, limits have been removed on master, but slave didn't
386 * receive the change yet. Just return EINPROGRESS until the slave gets
388 if (!lqe->lqe_enforced && !req_is_rel(qb_flags))
389 GOTO(out_locked, rc = -ESRCH);
391 /* recompute qunit in case it was never initialized */
392 qmt_revalidate(env, lqe);
394 /* slave just wants to acquire per-ID lock */
395 if (req_is_acq(qb_flags) && qb_count == 0)
396 GOTO(out_locked, rc = 0);
398 /* fetch how much quota space is already granted to this slave */
399 rc = qmt_slv_read(env, lqe, slv_obj, &slv_granted);
401 LQUOTA_ERROR(lqe, "Failed to get granted for slave %s, rc=%d",
402 obd_uuid2str(uuid), rc);
403 GOTO(out_locked, rc);
405 /* recall how much space this slave currently owns in order to restore
406 * it in case of failure */
407 slv_granted_bck = slv_granted;
409 /* record current time for soft limit & grace time management */
410 now = (__u64)cfs_time_current_sec();
412 if (req_is_rel(qb_flags)) {
413 /* Slave would like to release quota space */
414 if (slv_granted < qb_count ||
415 lqe->lqe_granted < qb_count) {
416 /* can't release more than granted */
417 LQUOTA_ERROR(lqe, "Release too much! uuid:%s release:"
418 LPU64" granted:"LPU64", total:"LPU64,
419 obd_uuid2str(uuid), qb_count,
420 slv_granted, lqe->lqe_granted);
421 GOTO(out_locked, rc = -EINVAL);
424 repbody->qb_count = qb_count;
425 /* put released space back to global pool */
426 QMT_REL(lqe, slv_granted, qb_count);
427 GOTO(out_write, rc = 0);
430 if (req_has_rep(qb_flags) && slv_granted < qb_usage) {
431 /* Slave is reporting space usage in quota request and it turns
432 * out to be using more quota space than owned, so we adjust
433 * granted space regardless of the current state of affairs */
434 repbody->qb_count = qb_usage - slv_granted;
435 QMT_GRANT(lqe, slv_granted, repbody->qb_count);
438 if (!req_is_acq(qb_flags) && !req_is_preacq(qb_flags))
439 GOTO(out_write, rc = 0);
441 qmt_adjust_edquot(lqe, now);
443 /* no hope to claim further space back */
444 GOTO(out_write, rc = -EDQUOT);
446 if (qmt_space_exhausted(lqe, now)) {
447 /* might have some free space once rebalancing is completed */
448 rc = req_is_acq(qb_flags) ? -EINPROGRESS : -EDQUOT;
452 if (req_is_preacq(qb_flags)) {
453 /* slave would like to pre-acquire quota space. To do so, it
454 * reports in qb_count how much spare quota space it owns and we
455 * can grant back quota space which is consistent with qunit
458 if (qb_count >= lqe->lqe_qunit)
459 /* slave already own the maximum it should */
460 GOTO(out_write, rc = 0);
462 count = qmt_alloc_expand(lqe, slv_granted, qb_count);
464 GOTO(out_write, rc = -EDQUOT);
466 repbody->qb_count += count;
467 QMT_GRANT(lqe, slv_granted, count);
468 GOTO(out_write, rc = 0);
471 /* processing acquire request with clients waiting */
472 if (lqe->lqe_hardlimit != 0 &&
473 lqe->lqe_granted + qb_count > lqe->lqe_hardlimit) {
474 /* cannot grant as much as asked, but can still afford to grant
475 * some quota space back */
476 count = lqe->lqe_hardlimit - lqe->lqe_granted;
477 repbody->qb_count += count;
478 QMT_GRANT(lqe, slv_granted, count);
479 GOTO(out_write, rc = 0);
482 /* Whouhou! we can satisfy the slave request! */
483 repbody->qb_count += qb_count;
484 QMT_GRANT(lqe, slv_granted, qb_count);
486 /* Try to expand the acquired count for DQACQ */
487 count = qmt_alloc_expand(lqe, slv_granted, 0);
489 /* can even grant more than asked, it is like xmas ... */
490 repbody->qb_count += count;
491 QMT_GRANT(lqe, slv_granted, count);
492 GOTO(out_write, rc = 0);
495 GOTO(out_write, rc = 0);
497 if (repbody->qb_count == 0)
498 GOTO(out_locked, rc);
500 /* start/stop grace timer if required */
501 if (lqe->lqe_softlimit != 0) {
502 if (lqe->lqe_granted > lqe->lqe_softlimit &&
503 lqe->lqe_gracetime == 0)
504 /* first time over soft limit, let's start grace
506 lqe->lqe_gracetime = now + qmt_lqe_grace(lqe);
507 else if (lqe->lqe_granted <= lqe->lqe_softlimit &&
508 lqe->lqe_gracetime != 0)
509 /* Clear grace timer */
510 lqe->lqe_gracetime = 0;
513 /* Update slave index first since it is easier to roll back */
514 ret = qmt_slv_write(env, th, lqe, slv_obj, LQUOTA_BUMP_VER,
515 &repbody->qb_slv_ver, slv_granted);
517 /* restore initial quota settings */
518 qmt_restore(lqe, &qti->qti_restore);
520 repbody->qb_count = 0;
521 GOTO(out_locked, rc = ret);
524 /* Update global index, no version bump needed */
525 ret = qmt_glb_write(env, th, lqe, 0, NULL);
528 /* restore initial quota settings */
529 qmt_restore(lqe, &qti->qti_restore);
531 repbody->qb_count = 0;
533 /* restore previous granted value */
534 ret = qmt_slv_write(env, th, lqe, slv_obj, 0, NULL,
537 LQUOTA_ERROR(lqe, "failed to restore initial slave "
538 "value rc:%d ret%d", rc, ret);
541 qmt_adjust_edquot(lqe, now);
542 GOTO(out_locked, rc);
545 /* Total granted has been changed, let's try to adjust the qunit
546 * size according to the total granted & limits. */
547 qmt_adjust_qunit(env, lqe);
549 /* clear/set edquot flag and notify slaves via glimpse if needed */
550 qmt_adjust_edquot(lqe, now);
552 LQUOTA_DEBUG(lqe, "dqacq ends count:"LPU64" ver:"LPU64" rc:%d",
553 repbody->qb_count, repbody->qb_slv_ver, rc);
554 lqe_write_unlock(lqe);
556 if (th != NULL && !IS_ERR(th))
557 dt_trans_stop(env, qmt->qmt_child, th);
559 if (slv_obj != NULL && !IS_ERR(slv_obj))
560 lu_object_put(env, &slv_obj->do_lu);
562 if ((req_is_acq(qb_flags) || req_is_preacq(qb_flags)) &&
563 OBD_FAIL_CHECK(OBD_FAIL_QUOTA_EDQUOT)) {
564 /* introduce inconsistency between granted value in slave index
565 * and slave index copy of slave */
566 repbody->qb_count = 0;
574 * Handle quota request from slave.
576 * \param env - is the environment passed by the caller
577 * \param ld - is the lu device associated with the qmt
578 * \param req - is the quota acquire request
580 static int qmt_dqacq(const struct lu_env *env, struct lu_device *ld,
581 struct ptlrpc_request *req)
583 struct qmt_device *qmt = lu2qmt_dev(ld);
584 struct quota_body *qbody, *repbody;
585 struct obd_uuid *uuid;
586 struct ldlm_lock *lock;
587 struct lquota_entry *lqe;
588 int pool_id, pool_type, qtype;
592 qbody = req_capsule_client_get(&req->rq_pill, &RMF_QUOTA_BODY);
594 RETURN(err_serious(-EPROTO));
596 repbody = req_capsule_server_get(&req->rq_pill, &RMF_QUOTA_BODY);
598 RETURN(err_serious(-EFAULT));
600 /* verify if global lock is stale */
601 if (!lustre_handle_is_used(&qbody->qb_glb_lockh))
604 lock = ldlm_handle2lock(&qbody->qb_glb_lockh);
609 uuid = &req->rq_export->exp_client_uuid;
611 if (req_is_rel(qbody->qb_flags) + req_is_acq(qbody->qb_flags) +
612 req_is_preacq(qbody->qb_flags) > 1) {
613 CERROR("%s: malformed quota request with conflicting flags set "
614 "(%x) from slave %s\n", qmt->qmt_svname,
615 qbody->qb_flags, obd_uuid2str(uuid));
619 if (req_is_acq(qbody->qb_flags) || req_is_preacq(qbody->qb_flags)) {
620 /* acquire and pre-acquire should use a valid ID lock */
622 if (!lustre_handle_is_used(&qbody->qb_lockh))
625 lock = ldlm_handle2lock(&qbody->qb_lockh);
627 /* no lock associated with this handle */
630 LDLM_DEBUG(lock, "%sacquire request",
631 req_is_preacq(qbody->qb_flags) ? "pre" : "");
633 if (!obd_uuid_equals(&lock->l_export->exp_client_uuid, uuid)) {
634 /* sorry, no way to cheat ... */
639 if (ldlm_is_ast_sent(lock)) {
640 struct ptlrpc_service_part *svc;
641 unsigned int timeout;
643 svc = req->rq_rqbd->rqbd_svcpt;
644 timeout = at_est2timeout(at_get(&svc->scp_at_estimate));
645 timeout += (ldlm_bl_timeout(lock) >> 1);
647 /* lock is being cancelled, prolong timeout */
648 ldlm_refresh_waiting_lock(lock, timeout);
653 /* extract pool & quota information from global index FID packed in the
655 rc = lquota_extract_fid(&qbody->qb_fid, &pool_id, &pool_type, &qtype);
659 /* Find the quota entry associated with the quota id */
660 lqe = qmt_pool_lqe_lookup(env, qmt, pool_id, pool_type, qtype,
663 RETURN(PTR_ERR(lqe));
665 /* process quota request */
666 rc = qmt_dqacq0(env, lqe, qmt, uuid, qbody->qb_flags, qbody->qb_count,
667 qbody->qb_usage, repbody);
669 if (lustre_handle_is_used(&qbody->qb_lockh))
670 /* return current qunit value only to slaves owning an per-ID
671 * quota lock. For enqueue, the qunit value will be returned in
673 repbody->qb_qunit = lqe->lqe_qunit;
678 /* Vector of quota request handlers. This vector is used by the MDT to forward
679 * requests to the quota master. */
680 struct qmt_handlers qmt_hdls = {
681 /* quota request handlers */
682 .qmth_quotactl = qmt_quotactl,
683 .qmth_dqacq = qmt_dqacq,
686 .qmth_intent_policy = qmt_intent_policy,
687 .qmth_lvbo_init = qmt_lvbo_init,
688 .qmth_lvbo_update = qmt_lvbo_update,
689 .qmth_lvbo_size = qmt_lvbo_size,
690 .qmth_lvbo_fill = qmt_lvbo_fill,
691 .qmth_lvbo_free = qmt_lvbo_free,
693 EXPORT_SYMBOL(qmt_hdls);