4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * General Public License version 2 for more details (a copy is included
14 * in the LICENSE file that accompanied this code).
16 * You should have received a copy of the GNU General Public License
17 * version 2 along with this program; if not, write to the
18 * Free Software Foundation, Inc., 59 Temple Place - Suite 330,
19 * Boston, MA 021110-1307, USA
24 * Copyright (c) 2011, 2012, Intel, Inc.
25 * Use is subject to license terms.
27 * Author: Johann Lombardi <johann.lombardi@intel.com>
28 * Author: Niu Yawei <yawei.niu@intel.com>
32 # define EXPORT_SYMTAB
35 #define DEBUG_SUBSYSTEM S_LQUOTA
37 #include "qsd_internal.h"
40 * Completion function invoked when the global quota lock enqueue has completed
/*
 * Completion callback for the global quota lock enqueue; it is the function
 * handed to qsd_intent_lock() by qsd_reint_main().
 *
 * env       - execution environment (not used by the visible statements)
 * qqi       - per-quota-type information updated with the slave FID and the
 *             lock handle
 * req_qbody - quota body sent in the request; its qb_fid is only logged
 * rep_qbody - quota body from the reply; provides the slave FID and version
 * lockh     - handle of the lock, copied into qqi->qqi_lockh
 * lvb       - lock value block; lvb_glb_ver is only logged here
 *
 * NOTE(review): the body also uses arg and rc, whose declarations are on a
 * parameter line that is not visible in this extract. The condition guarding
 * the error message and the return after it are not visible either.
 */
42 static void qsd_reint_completion(const struct lu_env *env,
43 struct qsd_qtype_info *qqi,
44 struct quota_body *req_qbody,
45 struct quota_body *rep_qbody,
46 struct lustre_handle *lockh,
47 union ldlm_wire_lvb *lvb,
50 struct qsd_instance *qsd = qqi->qqi_qsd;
/* arg is interpreted as the location where the slave version is returned */
51 __u64 *slv_ver = (__u64 *)arg;
/* failure path: report the global index FID and the error code */
55 CERROR("%s: failed to enqueue global quota lock, glb "
56 "fid:"DFID", rc:%d\n", qsd->qsd_svname,
57 PFID(&req_qbody->qb_fid), rc);
61 CDEBUG(D_QUOTA, "%s: global quota lock successfully acquired, glb "
62 "fid:"DFID", glb ver:"LPU64", slv fid:"DFID", slv ver:"LPU64"\n",
63 qsd->qsd_svname, PFID(&req_qbody->qb_fid),
64 lvb->l_lquota.lvb_glb_ver, PFID(&rep_qbody->qb_slv_fid),
65 rep_qbody->qb_slv_ver);
/* hand the slave index version reported in the reply back to the caller */
67 *slv_ver = rep_qbody->qb_slv_ver;
/* remember the FID of the slave index reported in the reply */
68 memcpy(&qqi->qqi_slv_fid, &rep_qbody->qb_slv_fid,
69 sizeof(struct lu_fid));
/* keep the lock handle in the qqi */
70 lustre_handle_copy(&qqi->qqi_lockh, lockh);
/*
 * Apply one index record to the quota ID it belongs to.
 *
 * env    - execution environment
 * qqi    - per-quota-type information; qqi_site is used for the lookup
 * global - passed through to qsd_update_lqe() and qsd_update_index();
 *          qsd_reint_entries() compares it against the global/slave record
 *          sizes, so it selects which kind of record rec is
 * qid    - quota identifier the record applies to
 * rec    - the record itself, passed through untouched
 *
 * NOTE(review): the declaration of rc, the error checks between the calls and
 * the return statement are not visible in this extract.
 */
74 static int qsd_reint_qid(const struct lu_env *env, struct qsd_qtype_info *qqi,
75 bool global, union lquota_id *qid, void *rec)
77 struct lquota_entry *lqe;
/* look up the lquota entry for this ID in the site of the qqi */
81 lqe = lqe_locate(env, qqi->qqi_site, qid);
/* update the entry from the record */
85 rc = qsd_update_lqe(env, lqe, global, rec);
/*
 * update the index copy; the fifth argument is 0 here (presumably a version
 * number - TODO confirm against the prototype of qsd_update_index())
 */
89 rc = qsd_update_index(env, qqi, qid, global, 0, rec);
/*
 * Walk the pages filled by an index transfer and feed every (key, record)
 * pair found in them to qsd_reint_qid().
 *
 * env       - execution environment; also provides the per-thread
 *             lquota_id buffer (qti_id) the key is copied into
 * qqi       - per-quota-type information, passed to qsd_reint_qid()
 * ii        - index information describing the transfer (key/record size)
 * global    - true when the records are expected to be lquota_glb_rec,
 *             false for lquota_slv_rec (see the size check below)
 * npages    - number of entries of the pages array to process
 * need_swab - not referenced by the visible statements; the condition that
 *             guards the byte swapping is not visible (presumably this flag)
 *
 * Each page is mapped with cfs_kmap(), scanned as LU_PAGE_COUNT units holding
 * lip_nr entries each, and unmapped with cfs_kunmap().
 *
 * NOTE(review): the pages parameter, the local declarations, the advance to
 * the next unit inside a page and the error handling are on lines that are
 * not visible in this extract.
 */
95 static int qsd_reint_entries(const struct lu_env *env,
96 struct qsd_qtype_info *qqi,
97 struct idx_info *ii, bool global,
99 unsigned int npages, bool need_swab)
101 struct qsd_thread_info *qti = qsd_info(env);
102 union lquota_id *qid = &qti->qti_id;
107 /* sanity check on the record size */
108 if ((global && ii->ii_recsize != sizeof(struct lquota_glb_rec)) ||
109 (!global && ii->ii_recsize != sizeof(struct lquota_slv_rec))) {
110 CERROR("Invalid record size:%d, global:%s\n",
111 ii->ii_recsize, global ? "true" : "false");
/*
 * stride between two consecutive entries: record + key + one extra __u64
 * (presumably a per-entry hash slot - TODO confirm against the lu_idxpage
 * layout)
 */
115 size = ii->ii_recsize + ii->ii_keysize + sizeof(__u64);
117 for (i = 0; i < npages; i++) {
118 union lu_page *lip = cfs_kmap(pages[i]);
120 for (j = 0; j < LU_PAGE_COUNT; j++) {
121 for (k = 0; k < lip->lp_idx.lip_nr; k++) {
/* entry k starts k * size bytes into lip_entries; the key comes first */
124 entry = lip->lp_idx.lip_entries + k * size;
125 memcpy(qid, entry, ii->ii_keysize); /* key */
126 entry += ii->ii_keysize; /* value */
/* byte-swap the key, then the record below in 64-bit steps */
132 __swab64s(&qid->qid_uid);
133 /* quota records only include 64-bit
135 while (offset < ii->ii_recsize) {
138 offset += sizeof(__u64);
142 rc = qsd_reint_qid(env, qqi, global, qid,
150 cfs_kunmap(pages[i]);
/*
 * Fetch an index from the quota master with a bulk transfer and replay its
 * content locally.
 *
 * The index read is qqi->qqi_fid when global is true and qqi->qqi_slv_fid
 * otherwise. The visible steps are:
 *  - allocate the page array and the pages for a bulk of at most 1MB;
 *  - fill the idx_info request and call qsd_fetch_index();
 *  - sanity-check the returned idx_info (magic, flags, key size, version);
 *  - hand the returned pages to qsd_reint_entries();
 *  - free the pages and write the recorded version with qsd_write_version().
 *
 * NOTE(review): the global parameter, some local declarations, the braces,
 * the conditions guarding the error messages, the out label and the code
 * that repeats the transfer from start_hash are on lines that are not
 * visible in this extract; the comments describe only what is shown.
 */
157 static int qsd_reint_index(const struct lu_env *env, struct qsd_qtype_info *qqi,
160 struct qsd_thread_info *qti = qsd_info(env);
161 struct qsd_instance *qsd = qqi->qqi_qsd;
/* the idx_info request/reply lives in the per-thread info */
162 struct idx_info *ii = &qti->qti_ii;
164 cfs_page_t **pages = NULL;
165 unsigned int npages, pg_cnt;
166 __u64 start_hash = 0, ver = 0;
167 bool need_swab = false;
/* pick the FID of the index to read: global index or slave index */
171 fid = global ? &qqi->qqi_fid : &qqi->qqi_slv_fid;
173 /* let's do a 1MB bulk */
/* byte size first (capped by PTLRPC_MAX_BRW_SIZE), converted to pages next */
174 npages = min_t(unsigned int, PTLRPC_MAX_BRW_SIZE, 1 << 20);
175 npages /= CFS_PAGE_SIZE;
177 /* allocate pages for bulk index read */
178 OBD_ALLOC(pages, npages * sizeof(*pages));
180 GOTO(out, rc = -ENOMEM);
181 for (i = 0; i < npages; i++) {
182 pages[i] = cfs_alloc_page(CFS_ALLOC_STD);
183 if (pages[i] == NULL)
184 GOTO(out, rc = -ENOMEM);
188 /* initialize index_info request with FID of global index */
/* fid is the global or the slave index FID, depending on global (see above) */
189 memset(ii, 0, sizeof(*ii));
190 memcpy(&ii->ii_fid, fid, sizeof(*fid));
191 ii->ii_magic = IDX_INFO_MAGIC;
192 ii->ii_flags = II_FL_NOHASH;
/* the requested count is expressed in LU pages, not in system pages */
193 ii->ii_count = npages * LU_PAGE_COUNT;
194 ii->ii_hash_start = start_hash;
196 /* send bulk request to quota master to read global index */
197 rc = qsd_fetch_index(env, qsd->qsd_exp, ii, npages, pages, &need_swab);
199 CWARN("%s: failed to fetch index for "DFID". %d\n",
200 qsd->qsd_svname, PFID(fid), rc);
204 /* various sanity checks */
/* a bad magic or key size aborts with -EPROTO; the flag checks only warn */
205 if (ii->ii_magic != IDX_INFO_MAGIC) {
206 CERROR("%s: invalid magic in index transfer %x != %x\n",
207 qsd->qsd_svname, ii->ii_magic, IDX_INFO_MAGIC);
208 GOTO(out, rc = -EPROTO);
210 if ((ii->ii_flags & II_FL_VARKEY) != 0)
211 CWARN("%s: II_FL_VARKEY is set on index transfer for fid "DFID
212 ", it shouldn't be\n", qsd->qsd_svname, PFID(fid));
213 if ((ii->ii_flags & II_FL_NONUNQ) != 0)
214 CWARN("%s: II_FL_NONUNQ is set on index transfer for fid "DFID
215 ", it shouldn't be\n", qsd->qsd_svname, PFID(fid));
216 if (ii->ii_keysize != sizeof(__u64)) {
217 CERROR("%s: invalid key size reported on index transfer for "
218 "fid "DFID", %u != %u\n", qsd->qsd_svname, PFID(fid),
219 ii->ii_keysize, (int)sizeof(__u64));
220 GOTO(out, rc = -EPROTO);
222 if (ii->ii_version == 0 && ii->ii_count != 0)
223 CWARN("%s: index version for fid "DFID" is 0, but index isn't "
224 "empty (%d)\n", qsd->qsd_svname, PFID(fid), ii->ii_count);
226 CDEBUG(D_QUOTA, "%s: reintegration process for fid "DFID" successfully "
227 "fetched %s index, count = %d\n", qsd->qsd_svname,
228 PFID(fid), global ? "global" : "slave", ii->ii_count);
231 /* record version associated with the first bulk transfer */
232 ver = ii->ii_version;
/*
 * convert the number of LU pages returned into system pages, rounding up
 * (assumes LU_PAGE_COUNT == 1 << (CFS_PAGE_SHIFT - LU_PAGE_SHIFT) - TODO
 * confirm against the definition of LU_PAGE_COUNT)
 */
234 pg_cnt = (ii->ii_count + (LU_PAGE_COUNT) - 1);
235 pg_cnt >>= CFS_PAGE_SHIFT - LU_PAGE_SHIFT;
237 if (pg_cnt > npages) {
238 CERROR("%s: master returned more pages than expected, %u > %u"
239 "\n", qsd->qsd_svname, pg_cnt, npages);
243 rc = qsd_reint_entries(env, qqi, ii, global, pages, pg_cnt, need_swab);
/* not at the end of the index yet: remember where the transfer stopped */
247 if (ii->ii_hash_end != II_END_OFF) {
248 start_hash = ii->ii_hash_end;
/* release every page that was allocated, then the page array itself */
253 for (i = 0; i < npages; i++)
254 if (pages[i] != NULL)
255 cfs_free_page(pages[i]);
256 OBD_FREE(pages, npages * sizeof(*pages));
259 /* Update index version */
261 rc = qsd_write_version(env, qqi, ver, global);
263 CERROR("%s: write version "LPU64" to "DFID" failed. "
264 "%d\n", qsd->qsd_svname, ver, PFID(fid), rc);
/*
 * Iterate over the local global index object (qqi->qqi_glb_obj) and, for the
 * IDs found there, refresh the usage with qsd_refresh_usage() and issue a
 * QSD_REP request through qsd_dqacq().
 *
 * env - execution environment; also provides the per-thread lquota_id buffer
 * qqi - per-quota-type information; qqi_glb_obj must be set (asserted)
 *
 * NOTE(review): the loop construct, the declarations of it, key and rc, the
 * conditions guarding the warnings, what is done for ID 0 and for entries
 * that are not enforced, and the iterator cleanup are on lines that are not
 * visible in this extract.
 */
270 static int qsd_reconciliation(const struct lu_env *env,
271 struct qsd_qtype_info *qqi)
273 struct qsd_thread_info *qti = qsd_info(env);
274 struct qsd_instance *qsd = qqi->qqi_qsd;
275 const struct dt_it_ops *iops;
278 struct lquota_entry *lqe;
279 union lquota_id *qid = &qti->qti_id;
283 LASSERT(qqi->qqi_glb_obj != NULL);
/* iterator operations of the global index object */
284 iops = &qqi->qqi_glb_obj->do_index_ops->dio_it;
286 it = iops->init(env, qqi->qqi_glb_obj, 0, BYPASS_CAPA);
288 CWARN("%s: Initialize it for "DFID" failed. %ld\n",
289 qsd->qsd_svname, PFID(&qqi->qqi_fid), PTR_ERR(it));
/* position the iterator using key value 0 */
293 rc = iops->load(env, it, 0);
295 CWARN("%s: Load first entry for "DFID" failed. %d\n",
296 qsd->qsd_svname, PFID(&qqi->qqi_fid), rc);
/* load() returned 0: step to the next entry before starting */
298 } else if (rc == 0) {
299 rc = iops->next(env, it);
/* negative values are propagated as errors, anything else becomes 0 */
301 GOTO(out, rc = (rc < 0) ? rc : 0);
305 key = iops->key(env, it);
307 CWARN("%s: Error key for "DFID". %ld\n",
308 qsd->qsd_svname, PFID(&qqi->qqi_fid),
310 GOTO(out, rc = PTR_ERR(key));
313 /* skip the root user/group */
314 if (*((__u64 *)key) == 0)
/* the key is read as a 64-bit ID and used to look up the lquota entry */
317 qid->qid_uid = *((__u64 *)key);
319 lqe = lqe_locate(env, qqi->qqi_site, qid);
321 CWARN("%s: Fail to locate lqe. "DFID", %ld\n",
322 qsd->qsd_svname, PFID(&qqi->qqi_fid),
324 GOTO(out, rc = PTR_ERR(lqe));
327 if (!lqe->lqe_enforced) {
332 rc = qsd_refresh_usage(env, lqe);
334 CWARN("%s: Fail to get usage. "DFID", %d\n",
335 qsd->qsd_svname, PFID(&qqi->qqi_fid), rc);
/* QSD_REP request for this entry (a failure is logged as a report failure) */
340 rc = qsd_dqacq(env, lqe, QSD_REP);
344 CWARN("%s: Fail to report quota. "DFID", %d\n",
345 qsd->qsd_svname, PFID(&qqi->qqi_fid), rc);
349 rc = iops->next(env, it);
351 CWARN("%s: Error next "DFID". %d\n", qsd->qsd_svname,
352 PFID(&qqi->qqi_fid), rc);
/*
 * Sample qsd->qsd_exp_valid under the read side of qsd->qsd_lock and
 * normalize it to 1 or 0. It is used as a wait condition by qsd_reint_main().
 *
 * NOTE(review): the declaration of connected and the return statement are on
 * lines that are not visible in this extract.
 */
364 static int qsd_connected(struct qsd_instance *qsd)
368 cfs_read_lock(&qsd->qsd_lock);
369 connected = qsd->qsd_exp_valid ? 1 : 0;
370 cfs_read_unlock(&qsd->qsd_lock);
/*
 * Sample qsd->qsd_started under the read side of qsd->qsd_lock and normalize
 * it to 1 or 0. It is used as a wait condition by qsd_reint_main().
 *
 * NOTE(review): the declaration of started and the return statement are on
 * lines that are not visible in this extract.
 */
375 static int qsd_started(struct qsd_instance *qsd)
379 cfs_read_lock(&qsd->qsd_lock);
380 started = qsd->qsd_started ? 1 : 0;
381 cfs_read_unlock(&qsd->qsd_lock);
387 * Routine executed by the reintegration thread.
/*
 * Body of the reintegration thread.
 *
 * args is the qsd_qtype_info to reintegrate. After signalling SVC_RUNNING
 * and setting up a lu_env, the thread:
 *  - waits until qsd_connected() is true;
 *  - step 1: takes a reference on the global quota lock already recorded in
 *    qqi->qqi_lockh, or enqueues a new one through qsd_intent_lock();
 *  - step 2: calls qsd_reint_index(..., true) when the local global index
 *    version differs from the one in the lvb;
 *  - step 3: calls qsd_reint_index(..., false) when the local slave index
 *    version differs from qti->qti_slv_ver;
 *  - waits until qsd_started() is true;
 *  - step 4: runs qsd_reconciliation().
 * Each wait also ends, and each step is skipped, once the thread is no longer
 * flagged as running. On the way out the lock reference is dropped and
 * SVC_STOPPED is signalled on the control wait queue.
 *
 * NOTE(review): the declarations of env and rc, the allocation of env, the
 * assignment of qti, the else branches, the cleanup labels and the statement
 * executed under the write lock near the end are on lines that are not
 * visible in this extract.
 */
389 static int qsd_reint_main(void *args)
392 struct qsd_thread_info *qti;
393 struct qsd_qtype_info *qqi = (struct qsd_qtype_info *)args;
394 struct qsd_instance *qsd = qqi->qqi_qsd;
395 struct ptlrpc_thread *thread = &qqi->qqi_reint_thread;
396 struct l_wait_info lwi = { 0 };
400 cfs_daemonize("qsd_reint");
402 CDEBUG(D_QUOTA, "%s: Starting reintegration thread for "DFID"\n",
403 qsd->qsd_svname, PFID(&qqi->qqi_fid));
/* reference on the qqi taken here and released with lu_ref_del() on exit */
406 lu_ref_add(&qqi->qqi_reference, "reint_thread", thread);
/* wake up whoever waits on the control wait queue for the thread to run */
408 thread_set_flags(thread, SVC_RUNNING);
409 cfs_waitq_signal(&thread->t_ctl_waitq);
413 GOTO(out, rc = -ENOMEM);
415 /* initialize environment */
416 rc = lu_env_init(env, LCT_DT_THREAD);
421 /* wait for the connection to master established */
422 l_wait_event(thread->t_ctl_waitq,
423 qsd_connected(qsd) || !thread_is_running(thread), &lwi);
425 /* Step 1: enqueue global index lock */
426 if (!thread_is_running(thread))
427 GOTO(out_env_init, rc = 0);
429 LASSERT(qsd->qsd_exp != NULL);
/* there must be something left to reintegrate */
430 LASSERT(qqi->qqi_glb_uptodate == 0 || qqi->qqi_slv_uptodate == 0);
432 memset(&qti->qti_lvb, 0, sizeof(qti->qti_lvb));
434 cfs_read_lock(&qsd->qsd_lock);
435 /* check whether we already own a global quota lock for this type */
436 if (lustre_handle_is_used(&qqi->qqi_lockh) &&
437 ldlm_lock_addref_try(&qqi->qqi_lockh, qsd_glb_einfo.ei_mode) == 0) {
438 cfs_read_unlock(&qsd->qsd_lock);
439 /* force refresh of global & slave index copy */
440 qti->qti_lvb.l_lquota.lvb_glb_ver = ~0ULL;
441 qti->qti_slv_ver = ~0ULL;
443 /* no valid lock found, let's enqueue a new one */
444 cfs_read_unlock(&qsd->qsd_lock);
/* the request body only carries the FID of the global index */
446 memset(&qti->qti_body, 0, sizeof(qti->qti_body));
447 memcpy(&qti->qti_body.qb_fid, &qqi->qqi_fid,
448 sizeof(qqi->qqi_fid));
/* qsd_reint_completion() stores the slave version through the last argument */
450 rc = qsd_intent_lock(env, qsd->qsd_exp, &qti->qti_body, true,
451 IT_QUOTA_CONN, qsd_reint_completion, qqi,
452 &qti->qti_lvb, (void *)&qti->qti_slv_ver);
454 GOTO(out_env_init, rc);
456 CDEBUG(D_QUOTA, "%s: glb_ver:"LPU64"/"LPU64",slv_ver:"LPU64"/"
457 LPU64"\n", qsd->qsd_svname,
458 qti->qti_lvb.l_lquota.lvb_glb_ver, qqi->qqi_glb_ver,
459 qti->qti_slv_ver, qqi->qqi_slv_ver);
462 /* Step 2: reintegrate global index */
463 if (!thread_is_running(thread))
464 GOTO(out_lock, rc = 0);
/* fault-injection hook: delay of 10 when OBD_FAIL_QUOTA_DELAY_REINT is set */
466 OBD_FAIL_TIMEOUT(OBD_FAIL_QUOTA_DELAY_REINT, 10);
468 if (qqi->qqi_glb_ver != qti->qti_lvb.l_lquota.lvb_glb_ver) {
469 rc = qsd_reint_index(env, qqi, true);
471 CWARN("%s: reint global for "DFID" failed. %d\n",
472 qsd->qsd_svname, PFID(&qqi->qqi_fid), rc);
476 qsd_bump_version(qqi, qqi->qqi_glb_ver, true);
479 /* Step 3: reintegrate slave index */
480 if (!thread_is_running(thread))
481 GOTO(out_lock, rc = 0);
483 if (qqi->qqi_slv_ver != qti->qti_slv_ver) {
484 rc = qsd_reint_index(env, qqi, false);
486 CWARN("%s: Reint slave for "DFID" failed. %d\n",
487 qsd->qsd_svname, PFID(&qqi->qqi_slv_fid), rc);
491 qsd_bump_version(qqi, qqi->qqi_slv_ver, false);
494 /* wait for the qsd instance to be started (qsd_started()) or for the thread to be asked to stop */
495 l_wait_event(thread->t_ctl_waitq,
496 qsd_started(qsd) || !thread_is_running(thread), &lwi);
498 if (!thread_is_running(thread))
499 GOTO(out_lock, rc = 0);
501 /* Step 4: start reconciliation for each enforced ID */
502 rc = qsd_reconciliation(env, qqi);
/*
 * NOTE(review): this message prints qti->qti_fid, which is not assigned
 * anywhere in the visible code, while every other message in this function
 * prints qqi->qqi_fid or qqi->qqi_slv_fid - confirm this is intended.
 */
504 CWARN("%s: reconciliation failed. "DFID", %d\n",
505 qsd->qsd_svname, PFID(&qti->qti_fid), rc);
/* drop the lock reference held for the duration of the reintegration */
509 ldlm_lock_decref(&qqi->qqi_lockh, qsd_glb_einfo.ei_mode);
515 cfs_write_lock(&qsd->qsd_lock);
517 cfs_write_unlock(&qsd->qsd_lock);
520 lu_ref_del(&qqi->qqi_reference, "reint_thread", thread);
/* let qsd_stop_reint_thread() and qsd_start_reint_thread() see the exit */
522 thread_set_flags(thread, SVC_STOPPED);
523 cfs_waitq_signal(&thread->t_ctl_waitq);
/*
 * Ask the reintegration thread of qqi to stop and wait until it has done so.
 *
 * Nothing is done when the thread is already flagged as stopped. Otherwise
 * the thread is flagged SVC_STOPPING, its control wait queue is signalled so
 * that the waits in qsd_reint_main() re-evaluate their condition, and the
 * caller blocks until thread_is_stopped() becomes true.
 */
527 void qsd_stop_reint_thread(struct qsd_qtype_info *qqi)
529 struct ptlrpc_thread *thread = &qqi->qqi_reint_thread;
530 struct l_wait_info lwi = { 0 };
532 if (!thread_is_stopped(thread)) {
533 thread_set_flags(thread, SVC_STOPPING);
534 cfs_waitq_signal(&thread->t_ctl_waitq);
536 l_wait_event(thread->t_ctl_waitq,
537 thread_is_stopped(thread), &lwi);
541 int qsd_start_reint_thread(struct qsd_qtype_info *qqi)
543 struct ptlrpc_thread *thread = &qqi->qqi_reint_thread;
544 struct qsd_instance *qsd = qqi->qqi_qsd;
545 struct l_wait_info lwi = { 0 };
549 /* don't bother to do reintegration when quota isn't enabled */
550 if (!qsd_type_enabled(qqi->qqi_qsd, qqi->qqi_qtype))
553 /* check if the reintegration has already started or finished */
554 cfs_write_lock(&qsd->qsd_lock);
556 if ((qqi->qqi_glb_uptodate && qqi->qqi_slv_uptodate) ||
557 qqi->qqi_reint || qsd->qsd_stopping) {
558 cfs_write_unlock(&qsd->qsd_lock);
563 cfs_write_unlock(&qsd->qsd_lock);
565 rc = cfs_create_thread(qsd_reint_main, (void *)qqi, 0);
567 thread_set_flags(thread, SVC_STOPPED);
568 cfs_write_lock(&qsd->qsd_lock);
570 cfs_write_unlock(&qsd->qsd_lock);
574 l_wait_event(thread->t_ctl_waitq,
575 thread_is_running(thread) || thread_is_stopped(thread),