1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2 * vim:expandtab:shiftwidth=8:tabstop=8:
6 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
8 * This program is free software; you can redistribute it and/or modify
9 * it under the terms of the GNU General Public License version 2 only,
10 * as published by the Free Software Foundation.
12 * This program is distributed in the hope that it will be useful, but
13 * WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * General Public License version 2 for more details (a copy is included
16 * in the LICENSE file that accompanied this code).
18 * You should have received a copy of the GNU General Public License
19 * version 2 along with this program; If not, see
20 * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
22 * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
23 * CA 95054 USA or visit www.sun.com if you need additional information or
29 * Copyright 2008 Sun Microsystems, Inc. All rights reserved
30 * Use is subject to license terms.
33 * This file is part of Lustre, http://www.lustre.org/
34 * Lustre is a trademark of Sun Microsystems, Inc.
37 # define EXPORT_SYMTAB
39 #define DEBUG_SUBSYSTEM S_LQUOTA
42 # include <linux/version.h>
43 # include <linux/module.h>
44 # include <linux/init.h>
45 # include <linux/fs.h>
46 # include <linux/jbd.h>
47 # include <linux/quota.h>
48 # include <linux/smp_lock.h>
49 # include <linux/buffer_head.h>
50 # include <linux/workqueue.h>
51 # include <linux/mount.h>
52 #else /* __KERNEL__ */
53 # include <liblustre.h>
56 #include <obd_class.h>
57 #include <lustre_mds.h>
58 #include <lustre_dlm.h>
59 #include <lustre_cfg.h>
61 #include <lustre_fsfilt.h>
62 #include <linux/lustre_quota.h>
63 #include <class_hash.h>
64 #include "quota_internal.h"
66 #ifdef HAVE_QUOTA_SUPPORT
69 /* This function is in charge of recording lqs_ino_rec and
70 * lqs_blk_rec. It is called when a lquota slave checks a quota
71 * request (check_cur_qunit) and when it finishes a quota
72 * request (dqacq_completion).
73 * is_chk: whether it is checking quota; otherwise, it is finishing
74 * is_acq: whether it is acquiring; otherwise, it is releasing
/* Adjust the lqs_blk_rec / lqs_ino_rec counters of @lqs by qdata->qd_count.
 * @is_chk and @is_acq are caller-supplied flags. */
76 void quota_compute_lqs(struct qunit_data *qdata, struct lustre_qunit_size *lqs,
77 int is_chk, int is_acq)
/* Both pointers are required, and lqs->lqs_lock is asserted to be held
 * already, so the caller is responsible for taking it. */
81 LASSERT(qdata && lqs);
82 LASSERT_SPIN_LOCKED(&lqs->lqs_lock);
/* Block-vs-inode indicator derived from qdata. */
83 is_blk = QDATA_IS_BLK(qdata);
/* NOTE(review): the conditions guarding the four pairs of updates below are
 * not visible in this view; presumably they branch on is_chk, is_acq and
 * is_blk - confirm against the complete source.  What is visible: each pair
 * touches the block record first and the inode record second, and the sign
 * of the adjustment goes +, -, -, + across the four pairs. */
/* pair 1: qd_count is added */
88 lqs->lqs_blk_rec += qdata->qd_count;
90 lqs->lqs_ino_rec += qdata->qd_count;
/* pair 2: qd_count is subtracted */
93 lqs->lqs_blk_rec -= qdata->qd_count;
95 lqs->lqs_ino_rec -= qdata->qd_count;
/* pair 3: qd_count is subtracted */
100 lqs->lqs_blk_rec -= qdata->qd_count;
102 lqs->lqs_ino_rec -= qdata->qd_count;
/* pair 4: qd_count is added */
105 lqs->lqs_blk_rec += qdata->qd_count;
107 lqs->lqs_ino_rec += qdata->qd_count;
/* Fill @oqaq from @qdata.  The flags and the id are copied unconditionally;
 * qd_qunit is stored as the block unit size and/or the inode unit size,
 * depending on what QDATA_IS_ADJBLK / QDATA_IS_ADJINO report for @qdata. */
112 void qdata_to_oqaq(struct qunit_data *qdata, struct quota_adjust_qunit *oqaq)
117 oqaq->qaq_flags = qdata->qd_flags;
118 oqaq->qaq_id = qdata->qd_id;
/* The two tests are independent ifs, so either, both or neither unit size
 * may be written; a unit size whose test fails is left as the caller set it. */
119 if (QDATA_IS_ADJBLK(qdata))
120 oqaq->qaq_bunit_sz = qdata->qd_qunit;
121 if (QDATA_IS_ADJINO(qdata))
122 oqaq->qaq_iunit_sz = qdata->qd_qunit;
/* Look up an lqs in qctxt->lqc_lqs_hash and hand it back through
 * @lqs_return.  The hash key is a quota_adjust_qunit; at least one of @oqaq
 * and @qdata must be supplied.
 * NOTE(review): the return statement is not visible in this view, so the
 * meaning of the int result must be confirmed against the full source. */
125 int quota_search_lqs(struct qunit_data *qdata, struct quota_adjust_qunit *oqaq,
126 struct lustre_quota_ctxt *qctxt,
127 struct lustre_qunit_size **lqs_return)
/* Scratch key that qdata_to_oqaq() fills in from qdata below. */
129 struct quota_adjust_qunit *oqaq_tmp = NULL;
/* The caller must pass a cleared result pointer and at least one key source. */
132 LASSERT(*lqs_return == NULL);
133 LASSERT(oqaq || qdata);
/* NOTE(review): presumably the scratch key is only allocated and converted
 * when no oqaq was passed in - the guarding condition and the allocation
 * failure handling are not visible here. */
136 OBD_ALLOC_PTR(oqaq_tmp);
139 qdata_to_oqaq(qdata, oqaq_tmp);
/* Hash lookup using the key; the result is stored straight into the
 * caller's pointer and then traced. */
144 *lqs_return = lustre_hash_lookup(qctxt->lqc_lqs_hash, oqaq_tmp);
146 LQS_DEBUG((*lqs_return), "show lqs\n");
/* Release the scratch key once the lookup is done. */
149 OBD_FREE_PTR(oqaq_tmp);
/* Set up a new lustre_qunit_size for the id described by @qdata or @oqaq,
 * seed it with the unit/tune sizes held in @qctxt, and insert it into
 * qctxt->lqc_lqs_hash with lustre_hash_add_unique().
 * NOTE(review): the allocation of the lqs, the "out" label and the final
 * return are not visible in this view; -ENOMEM is the only error code that
 * can be seen here. */
153 int quota_create_lqs(struct qunit_data *qdata, struct quota_adjust_qunit *oqaq,
154 struct lustre_quota_ctxt *qctxt,
155 struct lustre_qunit_size **lqs_return)
157 struct lustre_qunit_size *lqs = NULL;
/* The caller must pass a cleared result pointer and at least one key source. */
161 LASSERT(*lqs_return == NULL);
162 LASSERT(oqaq || qdata);
/* Error exit with -ENOMEM; presumably taken when allocating the lqs fails
 * (the allocation and its check are not visible here). */
166 GOTO(out, rc = -ENOMEM);
/* The hash key is either converted from qdata or copied from *oqaq; the
 * condition choosing between the two is not visible here. */
169 qdata_to_oqaq(qdata, &lqs->lqs_key);
171 lqs->lqs_key = *oqaq;
/* A fresh lqs starts with an initialised lock and zeroed pending/record
 * counters. */
174 spin_lock_init(&lqs->lqs_lock);
175 lqs->lqs_bwrite_pending = 0;
176 lqs->lqs_iwrite_pending = 0;
177 lqs->lqs_ino_rec = 0;
178 lqs->lqs_blk_rec = 0;
/* The id and the group flag are taken from the key that was just set. */
179 lqs->lqs_id = lqs->lqs_key.qaq_id;
180 lqs->lqs_flags = QAQ_IS_GRP(&lqs->lqs_key);
/* Unit and tune sizes start at the context-wide values; lqs_ctxt keeps a
 * back-pointer to the owning context. */
181 lqs->lqs_bunit_sz = qctxt->lqc_bunit_sz;
182 lqs->lqs_iunit_sz = qctxt->lqc_iunit_sz;
183 lqs->lqs_btune_sz = qctxt->lqc_btune_sz;
184 lqs->lqs_itune_sz = qctxt->lqc_itune_sz;
185 lqs->lqs_ctxt = qctxt;
/* The shrink timestamps are only reset when the context has a handler. */
186 if (qctxt->lqc_handler) {
187 lqs->lqs_last_bshrink = 0;
188 lqs->lqs_last_ishrink = 0;
/* Insert into the hash under the key; rc receives the result of the unique
 * add.  How a failed add is handled is not visible here. */
191 rc = lustre_hash_add_unique(qctxt->lqc_lqs_hash,
192 &lqs->lqs_key, &lqs->lqs_hash);
193 LQS_DEBUG(lqs, "create lqs\n");
/* Apply the qunit sizes carried in @oqaq to the matching lqs of @qctxt.
 * The lqs is searched for with quota_search_lqs() and, on a path whose
 * condition is not visible here, created with quota_create_lqs().  The block
 * and inode unit sizes are then updated under lqs_lock, each tune size being
 * set to half of its unit size.  LQS_BLK_* / LQS_INO_* INCREASE / DECREASE
 * bits are OR-ed into rc.
 * NOTE(review): several branch heads, the error handling after the
 * search/create calls and the final return are missing from this view. */
204 int quota_adjust_slave_lqs(struct quota_adjust_qunit *oqaq,
205 struct lustre_quota_ctxt *qctxt)
207 struct lustre_qunit_size *lqs = NULL;
/* Shorthand pointers to the four size fields of the lqs (set further down). */
208 unsigned long *lbunit, *liunit, *lbtune, *litune;
/* Signed "current minus requested" differences: a positive value means the
 * requested unit size is smaller than the current one. */
209 signed long b_tmp = 0, i_tmp = 0;
210 cfs_time_t time_limit = 0;
/* Fault-injection check; the action taken when it fires is not visible here. */
214 if (OBD_FAIL_CHECK(OBD_FAIL_QUOTA_WITHOUT_CHANGE_QS))
219 rc = quota_search_lqs(NULL, oqaq, qctxt, &lqs);
221 /* deleting the lqs, because a user sets lfs quota 0 0 0 0 */
/* This branch requires both unit sizes to be zero AND both adjust flags set. */
222 if (!oqaq->qaq_bunit_sz && !oqaq->qaq_iunit_sz && QAQ_IS_ADJBLK(oqaq) &&
223 QAQ_IS_ADJINO(oqaq)) {
225 LQS_DEBUG(lqs, "release lqs\n");
226 /* this is for quota_search_lqs */
/* NOTE(review): presumably only reached when the search found nothing; the
 * guarding condition is not visible here. */
235 rc = quota_create_lqs(NULL, oqaq, qctxt, &lqs);
242 lbunit = &lqs->lqs_bunit_sz;
243 liunit = &lqs->lqs_iunit_sz;
244 lbtune = &lqs->lqs_btune_sz;
245 litune = &lqs->lqs_itune_sz;
/* All size updates below happen with lqs_lock held (released at line 297). */
247 spin_lock(&lqs->lqs_lock);
248 CDEBUG(D_QUOTA, "before: bunit: %lu, iunit: %lu.\n", *lbunit, *liunit);
249 /* adjust the slave's block qunit size */
250 if (QAQ_IS_ADJBLK(oqaq)) {
251 cfs_duration_t sec = cfs_time_seconds(qctxt->lqc_switch_seconds);
253 b_tmp = *lbunit - oqaq->qaq_bunit_sz;
/* With a handler present, a request for a smaller size records the current
 * time in lqs_last_bshrink. */
255 if (qctxt->lqc_handler && b_tmp > 0)
256 lqs->lqs_last_bshrink = cfs_time_current();
/* With a handler present, a request for a larger size is only applied when
 * no shrink has been recorded yet or more than lqc_switch_seconds have
 * passed since the last recorded shrink. */
258 if (qctxt->lqc_handler && b_tmp < 0) {
259 time_limit = cfs_time_add(lqs->lqs_last_bshrink, sec);
260 if (!lqs->lqs_last_bshrink ||
261 cfs_time_after(cfs_time_current(), time_limit)) {
262 *lbunit = oqaq->qaq_bunit_sz;
263 *lbtune = (*lbunit) / 2;
/* NOTE(review): presumably the else branch of the test at line 258 (no
 * handler, or not an enlargement), where the size is applied without the
 * time check - the branch head is not visible here. */
268 *lbunit = oqaq->qaq_bunit_sz;
269 *lbtune = (*lbunit) / 2;
273 /* adjust the slave's file qunit size */
/* Same scheme as for blocks, using the inode fields and lqs_last_ishrink. */
274 if (QAQ_IS_ADJINO(oqaq)) {
275 i_tmp = *liunit - oqaq->qaq_iunit_sz;
277 if (qctxt->lqc_handler && i_tmp > 0)
278 lqs->lqs_last_ishrink = cfs_time_current();
280 if (qctxt->lqc_handler && i_tmp < 0) {
281 time_limit = cfs_time_add(lqs->lqs_last_ishrink,
282 cfs_time_seconds(qctxt->
283 lqc_switch_seconds));
284 if (!lqs->lqs_last_ishrink ||
285 cfs_time_after(cfs_time_current(), time_limit)) {
286 *liunit = oqaq->qaq_iunit_sz;
287 *litune = (*liunit) / 2;
/* NOTE(review): presumably the else branch of the test at line 280 - the
 * branch head is not visible here. */
292 *liunit = oqaq->qaq_iunit_sz;
293 *litune = (*liunit) / 2;
296 CDEBUG(D_QUOTA, "after: bunit: %lu, iunit: %lu.\n", *lbunit, *liunit);
297 spin_unlock(&lqs->lqs_lock);
/* Direction bits are OR-ed into rc.  NOTE(review): the conditions choosing
 * each bit are not visible; presumably they test the signs of b_tmp and
 * i_tmp - confirm against the full source. */
302 rc |= LQS_BLK_DECREASE;
304 rc |= LQS_BLK_INCREASE;
307 rc |= LQS_INO_DECREASE;
309 rc |= LQS_INO_INCREASE;
/* Qunit adjustment for the obd behind @exp: first update the slave lqs with
 * quota_adjust_slave_lqs(), then call qctxt_adjust_qunit() for the affected
 * uid/gid.  Only block adjustments are accepted (asserted below).
 * NOTE(review): the uid/gid assignment, the error-branch heads and the
 * return are not visible in this view. */
314 int filter_quota_adjust_qunit(struct obd_export *exp,
315 struct quota_adjust_qunit *oqaq,
316 struct lustre_quota_ctxt *qctxt)
318 struct obd_device *obd = exp->exp_obd;
/* Both ids default to 0. */
319 unsigned int uid = 0, gid = 0;
/* A request without the block-adjust flag is treated as a programming error. */
324 LASSERT(QAQ_IS_ADJBLK(oqaq));
325 rc = quota_adjust_slave_lqs(oqaq, qctxt);
/* Logged on failure of the call above; the condition is not visible here. */
327 CERROR("adjust mds slave's qunit size failed!(rc:%d)\n", rc);
/* Group vs. non-group request; presumably selects whether gid or uid is set
 * from the request id - the assignments are not visible here. */
330 if (QAQ_IS_GRP(oqaq))
/* NOTE(review): the meaning of the literal arguments 1, 0 and NULL is
 * defined by qctxt_adjust_qunit(), which is not shown here. */
336 rc = qctxt_adjust_qunit(obd, qctxt, uid, gid, 1, 0, NULL);
/* -EDQUOT, -EBUSY and -EAGAIN are only reported at debug level. */
337 if (rc == -EDQUOT || rc == -EBUSY || rc == -EAGAIN) {
338 CDEBUG(D_QUOTA, "rc: %d.\n", rc);
/* Presumably reached for any other failure; the branch head is not visible. */
342 CERROR("slave adjust block quota failed!(rc:%d)\n", rc);
346 #endif /* __KERNEL__ */
/* Build an OST_QUOTA_ADJUST_QUNIT request for the import behind @exp, queue
 * it with ptlrpc_queue_wait() and release the request afterwards.
 * NOTE(review): the early returns, the copy of *oqaq into the request buffer
 * and the final return are not visible in this view; @qctxt is not used by
 * any line that is visible here. */
349 int client_quota_adjust_qunit(struct obd_export *exp,
350 struct quota_adjust_qunit *oqaq,
351 struct lustre_quota_ctxt *qctxt)
353 struct ptlrpc_request *req;
354 struct quota_adjust_qunit *oqa;
/* Two buffers: the ptlrpc body and a payload the size of *oqaq. */
355 __u32 size[2] = { sizeof(struct ptlrpc_body), sizeof(*oqaq) };
359 /* the client does not support this kind of operation, abort it */
/* Taken when the export was connected without OBD_CONNECT_CHANGE_QS, or when
 * the fault-injection check fires. */
360 if (!(exp->exp_connect_flags & OBD_CONNECT_CHANGE_QS)||
361 OBD_FAIL_CHECK(OBD_FAIL_QUOTA_WITHOUT_CHANGE_QS)) {
362 CDEBUG(D_QUOTA, "osc: %s don't support change qunit size\n",
363 exp->exp_obd->obd_name);
/* strcmp() is non-zero when the obd type name differs from LUSTRE_OSC_NAME;
 * the action taken in that case is not visible here. */
366 if (strcmp(exp->exp_obd->obd_type->typ_name, LUSTRE_OSC_NAME))
369 req = ptlrpc_prep_req(class_exp2cliimp(exp), LUSTRE_OST_VERSION,
370 OST_QUOTA_ADJUST_QUNIT, 2, size, NULL);
/* Error exit with -ENOMEM; presumably taken when req is NULL (the check is
 * not visible here). */
372 GOTO(out, rc = -ENOMEM);
/* Payload buffer inside the request message, sized as *oqaq. */
374 oqa = lustre_msg_buf(req->rq_reqmsg, REQ_REC_OFF, sizeof(*oqaq));
/* The reply size is set from the same size array as the request. */
377 ptlrpc_req_set_repsize(req, 2, size);
379 rc = ptlrpc_queue_wait(req);
/* Failure is logged with the obd name; the remaining arguments of this call
 * and its guarding condition are not visible here. */
381 CERROR("%s: %s failed: rc = %d\n", exp->exp_obd->obd_name,
385 ptlrpc_req_finished(req);
390 int lov_quota_adjust_qunit(struct obd_export *exp,
391 struct quota_adjust_qunit *oqaq,
392 struct lustre_quota_ctxt *qctxt)
394 struct obd_device *obd = class_exp2obd(exp);
395 struct lov_obd *lov = &obd->u.lov;
399 if (!QAQ_IS_ADJBLK(oqaq)) {
400 CERROR("bad qaq_flags %x for lov obd.\n", oqaq->qaq_flags);
404 for (i = 0; i < lov->desc.ld_tgt_count; i++) {
407 if (!lov->lov_tgts[i]->ltd_active) {
408 CDEBUG(D_HA, "ost %d is inactive\n", i);
412 err = obd_quota_adjust_qunit(lov->lov_tgts[i]->ltd_exp, oqaq,
415 if (lov->lov_tgts[i]->ltd_active && !rc)