4 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 only,
8 * as published by the Free Software Foundation.
10 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 * GNU General Public License version 2 for more details. A copy is
14 * included in the COPYING file that accompanied this code.
16 * You should have received a copy of the GNU General Public License
17 * along with this program; if not, write to the Free Software
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
23 * Copyright (c) 2011, 2012 Commissariat a l'energie atomique et aux energies
25 * Use is subject to license terms.
27 * Copyright (c) 2012, 2015, Intel Corporation.
30 * lustre/mdt/mdt_hsm.c
32 * Lustre Metadata Target (mdt) request handler
34 * Author: Aurelien Degremont <aurelien.degremont@cea.fr>
35 * Author: JC Lafoucriere <jacques-charles.lafoucriere@cea.fr>
38 #define DEBUG_SUBSYSTEM S_MDS
40 #include "mdt_internal.h"
42 /* Max allocation to satisfy single HSM RPC. */
43 #define MDT_HSM_ALLOC_MAX (1 << 20)
/*
 * MDT_HSM_ALLOC(ptr, size): size-capped allocation helper for the HSM RPC
 * handlers in this file. OBD_ALLOC_LARGE() is invoked only when size does not
 * exceed MDT_HSM_ALLOC_MAX (1 << 20). The callers in this file
 * (mdt_hsm_action, mdt_hsm_request) follow the macro with a path that sets
 * rc = -ENOMEM.
 * NOTE(review): what ptr is set to when size exceeds the cap is not shown
 * here - confirm it is left NULL so the callers' failure path triggers.
 *
 * MDT_HSM_FREE(ptr, size): plain forwarding to OBD_FREE_LARGE() with the same
 * pointer and size that were given to MDT_HSM_ALLOC().
 */
45 #define MDT_HSM_ALLOC(ptr, size) \
47 if ((size) <= MDT_HSM_ALLOC_MAX) \
48 OBD_ALLOC_LARGE((ptr), (size)); \
53 #define MDT_HSM_FREE(ptr, size) OBD_FREE_LARGE((ptr), (size))
56 * Update on-disk HSM attributes.
/*
 * mdt_hsm_attr_set - pack the HSM state in mh and store it on obj as the
 * XATTR_NAME_HSM extended attribute.
 *
 * info: request thread context. Its mti_xattr_buf is used as scratch space
 *       for the packed attributes, mti_buf as the lu_buf descriptor handed to
 *       the lower layer, and mti_env as the environment for the xattr call.
 * obj:  MDT object to update; the xattr is set on mdt_object_child(obj).
 * mh:   in-memory HSM state to serialize (not modified here).
 *
 * rc receives the result of mo_xattr_set().
 */
58 int mdt_hsm_attr_set(struct mdt_thread_info *info, struct mdt_object *obj,
59 const struct md_hsm *mh)
/* Lower-layer md_object that receives the xattr. */
61 struct md_object *next = mdt_object_child(obj);
62 struct lu_buf *buf = &info->mti_buf;
63 struct hsm_attrs *attrs;
/*
 * The packed representation is built in the per-thread xattr scratch buffer;
 * the CLASSERT requires that buffer to be at least sizeof(struct hsm_attrs).
 */
67 attrs = (struct hsm_attrs *)info->mti_xattr_buf;
68 CLASSERT(sizeof(info->mti_xattr_buf) >= sizeof(*attrs));
70 /* pack HSM attributes */
71 lustre_hsm2buf(info->mti_xattr_buf, mh);
73 /* update HSM attributes */
/* Exactly sizeof(*attrs) bytes are described; the last argument (flags) is 0. */
75 buf->lb_len = sizeof(*attrs);
76 rc = mo_xattr_set(info->mti_env, next, buf, XATTR_NAME_HSM, 0);
/*
 * mdt_hsm_is_admin - test whether the credentials built from the request body
 * carry CFS_CAP_SYS_ADMIN.
 *
 * info: request thread context; info->mti_body supplies the identity.
 *
 * The body pointer is checked for NULL before any credential is built.
 * Credentials are then initialised with mdt_init_ucred() and tested with
 * md_capable(); the result of that test is kept in is_admin.
 */
81 static inline bool mdt_hsm_is_admin(struct mdt_thread_info *info)
/* Without a request body there is nothing to derive credentials from. */
86 if (info->mti_body == NULL)
89 rc = mdt_init_ucred(info, (struct mdt_body *)info->mti_body);
93 is_admin = md_capable(mdt_ucred(info), CFS_CAP_SYS_ADMIN);
101 * Extract information coming from a copytool and ask the coordinator to update
102 * a request status depending on the update content.
104 * Copytools could use this to report failure in their process.
106 * This is HSM_PROGRESS RPC handler.
/*
 * mdt_hsm_progress - HSM_PROGRESS RPC handler.
 *
 * tsi: target session info; supplies the request capsule (tsi_pill) and the
 *      MDT body (tsi_mdt_body).
 *
 * Reads the hsm_progress_kernel record sent by the client, converts its error
 * value with lustre_errno_ntoh(), logs it, and - only if the caller passes
 * mdt_hsm_is_admin() - forwards it to mdt_hsm_coordinator_update().
 * rc is -EPERM for non-admin callers, otherwise the coordinator's result.
 * A missing progress buffer is reported as err_serious(-EPROTO).
 */
108 int mdt_hsm_progress(struct tgt_session_info *tsi)
110 struct mdt_thread_info *info;
111 struct hsm_progress_kernel *hpk;
/* The request must carry an MDT body. */
115 if (tsi->tsi_mdt_body == NULL)
118 hpk = req_capsule_client_get(tsi->tsi_pill, &RMF_MDS_HSM_PROGRESS);
120 RETURN(err_serious(-EPROTO));
/*
 * The error value is rewritten in place, so every later use (logging and the
 * coordinator update) sees the converted value.
 */
122 hpk->hpk_errval = lustre_errno_ntoh(hpk->hpk_errval);
124 CDEBUG(D_HSM, "Progress on "DFID": len=%llu : rc = %d\n",
125 PFID(&hpk->hpk_fid), hpk->hpk_extent.length, hpk->hpk_errval);
/* Failure report: HP_FLAG_RETRY selects "will retry" versus "fatal". */
128 CDEBUG(D_HSM, "Copytool progress on "DFID" failed : rc = %d; %s.\n",
129 PFID(&hpk->hpk_fid), hpk->hpk_errval,
130 hpk->hpk_flags & HP_FLAG_RETRY ? "will retry" : "fatal");
132 if (hpk->hpk_flags & HP_FLAG_COMPLETED)
133 CDEBUG(D_HSM, "Finished "DFID" : rc = %d; cancel cookie=%#llx\n",
134 PFID(&hpk->hpk_fid), hpk->hpk_errval, hpk->hpk_cookie);
/* Thread info is only obtained once the request buffers have been checked. */
136 info = tsi2mdt_info(tsi);
137 if (!mdt_hsm_is_admin(info))
138 GOTO(out, rc = -EPERM);
140 rc = mdt_hsm_coordinator_update(info, hpk);
/* Reached on both the -EPERM and the normal path. */
142 mdt_thread_info_fini(info);
/*
 * mdt_hsm_ct_register - handler that registers the calling client export as
 * an HSM agent.
 *
 * tsi: target session info; supplies the request capsule and the export
 *      (tsi_exp) whose exp_client_uuid identifies the agent.
 *
 * The RMF_MDS_HSM_ARCHIVE buffer must be present, otherwise
 * err_serious(-EPROTO) is returned. Callers failing mdt_hsm_is_admin() get
 * rc = -EPERM; otherwise rc is the result of mdt_hsm_agent_register_mask().
 */
146 int mdt_hsm_ct_register(struct tgt_session_info *tsi)
148 struct mdt_thread_info *info;
153 archives = req_capsule_client_get(tsi->tsi_pill, &RMF_MDS_HSM_ARCHIVE);
154 if (archives == NULL)
155 RETURN(err_serious(-EPROTO));
/* Thread info is obtained only after the request buffer has been validated. */
157 info = tsi2mdt_info(tsi);
158 if (!mdt_hsm_is_admin(info))
159 GOTO(out, rc = -EPERM);
161 /* XXX: directly include this function here? */
162 rc = mdt_hsm_agent_register_mask(info, &tsi->tsi_exp->exp_client_uuid,
165 mdt_thread_info_fini(info);
/*
 * mdt_hsm_ct_unregister - handler that unregisters the calling client export
 * as an HSM agent.
 *
 * tsi: target session info; supplies the MDT body (checked for NULL) and the
 *      export whose exp_client_uuid identifies the agent.
 *
 * Callers failing mdt_hsm_is_admin() get rc = -EPERM; otherwise rc is the
 * result of mdt_hsm_agent_unregister().
 */
169 int mdt_hsm_ct_unregister(struct tgt_session_info *tsi)
171 struct mdt_thread_info *info;
/* The request must carry an MDT body. */
175 if (tsi->tsi_mdt_body == NULL)
178 info = tsi2mdt_info(tsi);
179 if (!mdt_hsm_is_admin(info))
180 GOTO(out, rc = -EPERM);
182 /* XXX: directly include this function here? */
183 rc = mdt_hsm_agent_unregister(info, &tsi->tsi_exp->exp_client_uuid);
/* Reached on both the -EPERM and the normal path. */
185 mdt_thread_info_fini(info);
190 * Retrieve the current HSM flags, archive id and undergoing HSM requests for
191 * the fid provided in RPC body.
193 * Current requests are read from coordinator states.
195 * This is MDS_HSM_STATE_GET RPC handler.
/*
 * mdt_hsm_state_get - MDS_HSM_STATE_GET RPC handler.
 *
 * tsi: target session info; the thread info derived from it supplies the
 *      request body, the target object and the attribute scratch area.
 *
 * Takes an LCK_PR lock on the object, reads its HSM attributes (MA_HSM only)
 * and copies the flags and archive id into the RMF_HSM_USER_STATE reply
 * buffer. rc is -EPROTO when the body, the object or the reply buffer is
 * missing; credential-initialisation errors are wrapped with err_serious().
 */
197 int mdt_hsm_state_get(struct tgt_session_info *tsi)
199 struct mdt_thread_info *info = tsi2mdt_info(tsi);
200 struct mdt_object *obj = info->mti_object;
201 struct md_attr *ma = &info->mti_attr;
202 struct hsm_user_state *hus;
203 struct mdt_lock_handle *lh;
/* Both the request body and the target object are required. */
207 if (info->mti_body == NULL || obj == NULL)
208 GOTO(out, rc = -EPROTO);
210 /* Only valid if client is remote */
211 rc = mdt_init_ucred(info, (struct mdt_body *)info->mti_body);
213 GOTO(out, rc = err_serious(rc));
/* Read-mode lock (LCK_PR) with the LOOKUP inode bit, held in the CHILD slot. */
215 lh = &info->mti_lh[MDT_LH_CHILD];
216 mdt_lock_reg_init(lh, LCK_PR);
217 rc = mdt_object_lock(info, obj, lh, MDS_INODELOCK_LOOKUP);
/* Only the HSM part of the attributes is requested. */
222 ma->ma_need = MA_HSM;
223 rc = mdt_attr_get_complex(info, obj, ma);
225 GOTO(out_unlock, rc);
227 hus = req_capsule_server_get(tsi->tsi_pill, &RMF_HSM_USER_STATE);
229 GOTO(out_unlock, rc = -EPROTO);
231 /* Current HSM flags */
232 hus->hus_states = ma->ma_hsm.mh_flags;
233 hus->hus_archive_id = ma->ma_hsm.mh_arch_id;
/* Teardown, in reverse order of setup: object lock, credentials, thread info. */
237 mdt_object_unlock(info, obj, lh, 1);
239 mdt_exit_ucred(info);
241 mdt_thread_info_fini(info);
246 * Change HSM state and archive number of a file.
248 * Archive number is changed if and only if the value is not 0.
249 * The new flagset that will be computed should result in a coherent state.
250 * This function checks that flags are compatible.
252 * This is MDS_HSM_STATE_SET RPC handler.
/*
 * mdt_hsm_state_set - MDS_HSM_STATE_SET RPC handler.
 *
 * tsi: target session info; the thread info derived from it supplies the
 *      request body, the target object, the capsule and the attribute area.
 *
 * Under an LCK_PW lock (LOOKUP | XATTR bits) the handler:
 *   1. rejects masks with bits outside HSM_FLAGS_MASK (-EINVAL);
 *   2. rejects masks with bits outside HSM_USER_MASK unless the caller has
 *      CFS_CAP_SYS_ADMIN (-EPERM);
 *   3. reads the current HSM attributes;
 *   4. applies the set mask, then the clear mask, as selected by hss_valid;
 *   5. optionally updates the archive id (requires HS_EXISTS and an id not
 *      above LL_HSM_MAX_ARCHIVE);
 *   6. rejects inconsistent flag combinations (-EINVAL);
 *   7. writes the result back with mdt_hsm_attr_set().
 * rc is -EPROTO when the body, the object or the hsm_state_set buffer is
 * missing.
 */
254 int mdt_hsm_state_set(struct tgt_session_info *tsi)
256 struct mdt_thread_info *info = tsi2mdt_info(tsi);
257 struct mdt_object *obj = info->mti_object;
258 struct md_attr *ma = &info->mti_attr;
259 struct hsm_state_set *hss;
260 struct mdt_lock_handle *lh;
/* hss is fetched first; its NULL check is folded into the test below. */
265 hss = req_capsule_client_get(info->mti_pill, &RMF_HSM_STATE_SET);
267 if (info->mti_body == NULL || obj == NULL || hss == NULL)
268 GOTO(out, rc = -EPROTO);
270 /* Only valid if client is remote */
271 rc = mdt_init_ucred(info, (struct mdt_body *)info->mti_body);
273 GOTO(out, rc = err_serious(rc));
/* Write-mode lock (LCK_PW) covering both the LOOKUP and XATTR inode bits. */
275 lh = &info->mti_lh[MDT_LH_CHILD];
276 mdt_lock_reg_init(lh, LCK_PW);
277 rc = mdt_object_lock(info, obj, lh, MDS_INODELOCK_LOOKUP |
278 MDS_INODELOCK_XATTR);
282 /* Detect out-of range masks */
283 if ((hss->hss_setmask | hss->hss_clearmask) & ~HSM_FLAGS_MASK) {
284 CDEBUG(D_HSM, "Incompatible masks provided (set %#llx"
285 ", clear %#llx) vs supported set (%#x).\n",
286 hss->hss_setmask, hss->hss_clearmask, HSM_FLAGS_MASK);
287 GOTO(out_unlock, rc = -EINVAL);
290 /* Non-root users are forbidden to set or clear flags which are
291 * NOT defined in HSM_USER_MASK. */
292 if (((hss->hss_setmask | hss->hss_clearmask) & ~HSM_USER_MASK) &&
293 !md_capable(mdt_ucred(info), CFS_CAP_SYS_ADMIN)) {
294 CDEBUG(D_HSM, "Incompatible masks provided (set %#llx"
295 ", clear %#llx) vs unprivileged set (%#x).\n",
296 hss->hss_setmask, hss->hss_clearmask, HSM_USER_MASK);
297 GOTO(out_unlock, rc = -EPERM);
300 /* Read current HSM info */
302 ma->ma_need = MA_HSM;
303 rc = mdt_attr_get_complex(info, obj, ma);
305 GOTO(out_unlock, rc);
307 /* Change HSM flags depending on provided masks */
/* Set is applied before clear, so a bit present in both masks ends cleared. */
308 if (hss->hss_valid & HSS_SETMASK)
309 ma->ma_hsm.mh_flags |= hss->hss_setmask;
310 if (hss->hss_valid & HSS_CLEARMASK)
311 ma->ma_hsm.mh_flags &= ~hss->hss_clearmask;
313 /* Change archive_id if provided. */
/* The HS_EXISTS test below is made on the flags after the masks were applied. */
314 if (hss->hss_valid & HSS_ARCHIVE_ID) {
315 if (!(ma->ma_hsm.mh_flags & HS_EXISTS)) {
/*
 * NOTE(review): the GOTO in this branch passes rc through unchanged, so it
 * carries whatever mdt_attr_get_complex() stored above, whereas the other
 * rejections in this function set -EINVAL or -EPERM explicitly. Confirm that
 * leaving via out_unlock without an explicit error code is intended here.
 * NOTE(review): the literal following DFID starts with "if" and has no
 * leading space, so the FID and the word run together in the log line.
 */
316 CDEBUG(D_HSM, "Could not set an archive number for "
317 DFID "if HSM EXISTS flag is not set.\n",
318 PFID(&info->mti_body->mbo_fid1));
319 GOTO(out_unlock, rc);
322 /* Detect out-of range archive id */
323 if (hss->hss_archive_id > LL_HSM_MAX_ARCHIVE) {
324 CDEBUG(D_HSM, "archive id %u exceeds maximum %zu.\n",
325 hss->hss_archive_id, LL_HSM_MAX_ARCHIVE);
326 GOTO(out_unlock, rc = -EINVAL);
329 ma->ma_hsm.mh_arch_id = hss->hss_archive_id;
332 /* Check for inconsistant HSM flagset.
333 * DIRTY without EXISTS: no dirty if no archive was created.
334 * DIRTY and RELEASED: a dirty file could not be released.
335 * RELEASED without ARCHIVED: do not release a non-archived file.
336 * LOST without ARCHIVED: cannot lost a non-archived file.
338 flags = ma->ma_hsm.mh_flags;
339 if ((flags & HS_DIRTY && !(flags & HS_EXISTS)) ||
340 (flags & HS_RELEASED && flags & HS_DIRTY) ||
341 (flags & HS_RELEASED && !(flags & HS_ARCHIVED)) ||
342 (flags & HS_LOST && !(flags & HS_ARCHIVED))) {
343 CDEBUG(D_HSM, "Incompatible flag change on "DFID
345 PFID(&info->mti_body->mbo_fid1), flags);
346 GOTO(out_unlock, rc = -EINVAL);
349 /* Save the modified flags */
/* ma->ma_hsm now holds the updated flags and, if requested, the archive id. */
350 rc = mdt_hsm_attr_set(info, obj, &ma->ma_hsm);
352 GOTO(out_unlock, rc);
/* Teardown, in reverse order of setup: object lock, credentials, thread info. */
357 mdt_object_unlock(info, obj, lh, 1);
359 mdt_exit_ucred(info);
361 mdt_thread_info_fini(info);
366 * Retrieve undergoing HSM requests for the fid provided in RPC body.
367 * Current requests are read from coordinator states.
369 * This is MDS_HSM_ACTION RPC handler.
/*
 * mdt_hsm_action - MDS_HSM_ACTION RPC handler.
 *
 * tsi: target session info; supplies the reply capsule and the MDT body.
 *
 * Builds a temporary one-item hsm_action_list for the FID in the request
 * body, lets mdt_hsm_get_actions() fill it in, and translates the item into
 * the hsm_current_action reply: state (from the cookie), action (HSMA_* item
 * value mapped to a HUA_* reply value) and location (the item's extent).
 * A missing reply buffer yields err_serious(-EPROTO); a failed allocation of
 * the temporary list yields rc = -ENOMEM.
 */
371 int mdt_hsm_action(struct tgt_session_info *tsi)
373 struct mdt_thread_info *info;
374 struct hsm_current_action *hca;
375 struct hsm_action_list *hal = NULL;
376 struct hsm_action_item *hai;
381 hca = req_capsule_server_get(tsi->tsi_pill,
382 &RMF_MDS_HSM_CURRENT_ACTION);
384 RETURN(err_serious(-EPROTO));
/* The request must carry an MDT body. */
386 if (tsi->tsi_mdt_body == NULL)
389 info = tsi2mdt_info(tsi);
390 /* Only valid if client is remote */
391 rc = mdt_init_ucred(info, (struct mdt_body *)info->mti_body);
393 GOTO(out, rc = err_serious(rc));
395 /* Coordinator information */
/* List header + rounded room for the fsname + exactly one rounded item. */
396 hal_size = sizeof(*hal) +
397 cfs_size_round(MTI_NAME_MAXLEN) /* fsname */ +
398 cfs_size_round(sizeof(*hai));
400 MDT_HSM_ALLOC(hal, hal_size);
402 GOTO(out_ucred, rc = -ENOMEM);
/* Archive id 0 is used for this query list. */
404 hal->hal_version = HAL_VERSION;
405 hal->hal_archive_id = 0;
407 obd_uuid2fsname(hal->hal_fsname, mdt_obd_name(info->mti_mdt),
410 hai = hai_first(hal);
411 hai->hai_action = HSMA_NONE;
/* The single item is keyed by the FID taken from the request body. */
414 hai->hai_fid = info->mti_body->mbo_fid1;
415 hai->hai_len = sizeof(*hai);
/* The item starts as HSMA_NONE; it is read back below after this call. */
417 rc = mdt_hsm_get_actions(info, hal);
421 /* cookie is used to give back request status */
422 if (hai->hai_cookie == 0)
423 hca->hca_state = HPS_WAITING;
425 hca->hca_state = HPS_RUNNING;
/*
 * Translate the item's action into the user-visible HUA_* value. The last
 * assignment of HUA_NONE is paired with a CERROR for an unrecognised action.
 */
427 switch (hai->hai_action) {
429 hca->hca_action = HUA_NONE;
432 hca->hca_action = HUA_ARCHIVE;
435 hca->hca_action = HUA_RESTORE;
438 hca->hca_action = HUA_REMOVE;
441 hca->hca_action = HUA_CANCEL;
444 hca->hca_action = HUA_NONE;
445 CERROR("%s: Unknown hsm action: %d on "DFID"\n",
446 mdt_obd_name(info->mti_mdt),
447 hai->hai_action, PFID(&hai->hai_fid));
451 hca->hca_location = hai->hai_extent;
/* Teardown: free the temporary list with the size it was allocated with. */
455 MDT_HSM_FREE(hal, hal_size);
457 mdt_exit_ucred(info);
459 mdt_thread_info_fini(info);
463 /* Return true if a FID is present in an action list. */
/*
 * is_fid_in_hal - look for fid among the items of an action list.
 *
 * hal: action list to scan; iteration starts at hai_first(hal).
 * fid: FID to look for (not modified).
 *
 * Each visited item's hai_fid is compared with fid using lu_fid_eq(); the
 * cursor advances with hai_next() while the counter i is incremented.
 */
464 static bool is_fid_in_hal(struct hsm_action_list *hal, const lustre_fid *fid)
466 struct hsm_action_item *hai;
469 for (hai = hai_first(hal), i = 0;
471 i++, hai = hai_next(hai)) {
472 if (lu_fid_eq(&hai->hai_fid, fid))
480 * Process the HSM actions described in a struct hsm_user_request.
482 * The action described in hur will be sent to the coordinator to be saved and
483 * processed later, or handled directly if hur.hur_action is HUA_RELEASE.
485 * This is MDS_HSM_REQUEST RPC handler.
/*
 * mdt_hsm_request - MDS_HSM_REQUEST RPC handler.
 *
 * tsi: target session info; supplies the request capsule and the MDT body.
 *
 * Reads three client buffers - the hsm_request header (hr), the array of
 * hsm_user_item (hui) and an opaque data blob (data) - validates their sizes
 * against the counts announced in hr, converts the requested user action
 * into an HSMA_* copytool action, builds an hsm_action_list with one item
 * per user item and passes it to mdt_hsm_add_actions().
 * Unknown actions, and the release action, end with rc = -EINVAL; a failed
 * list allocation ends with rc = -ENOMEM.
 */
487 int mdt_hsm_request(struct tgt_session_info *tsi)
489 struct mdt_thread_info *info;
490 struct req_capsule *pill = tsi->tsi_pill;
491 struct hsm_request *hr;
492 struct hsm_user_item *hui;
493 struct hsm_action_list *hal;
494 struct hsm_action_item *hai;
498 enum hsm_copytool_action action = HSMA_NONE;
/* All three client buffers are fetched first and checked together below. */
502 hr = req_capsule_client_get(pill, &RMF_MDS_HSM_REQUEST);
503 hui = req_capsule_client_get(pill, &RMF_MDS_HSM_USER_ITEM);
504 data = req_capsule_client_get(pill, &RMF_GENERIC_DATA);
506 if (tsi->tsi_mdt_body == NULL || hr == NULL || hui == NULL || data == NULL)
509 /* Sanity check. Nothing to do with an empty list */
510 if (hr->hr_itemcount == 0)
/*
 * Cross-check client-announced counts against the real buffer sizes: the
 * item buffer must hold at least hr_itemcount entries, and the data buffer
 * must be exactly hr_data_len bytes.
 */
513 hui_list_size = req_capsule_get_size(pill, &RMF_MDS_HSM_USER_ITEM,
515 if (hui_list_size < hr->hr_itemcount * sizeof(*hui))
518 data_size = req_capsule_get_size(pill, &RMF_GENERIC_DATA, RCL_CLIENT);
519 if (data_size != hr->hr_data_len)
522 info = tsi2mdt_info(tsi);
523 /* Only valid if client is remote */
524 rc = mdt_init_ucred(info, (struct mdt_body *)info->mti_body);
/*
 * Map the user-level action in hr_action onto the copytool action stored in
 * each item. The release branch and the unknown-action branch both log with
 * CERROR and leave with rc = -EINVAL.
 */
528 switch (hr->hr_action) {
529 /* code to be removed in hsm1_merge and final patch */
531 CERROR("Release action is not working in hsm1_coord\n");
532 GOTO(out_ucred, rc = -EINVAL);
534 /* end of code to be removed */
536 action = HSMA_ARCHIVE;
539 action = HSMA_RESTORE;
542 action = HSMA_REMOVE;
545 action = HSMA_CANCEL;
548 CERROR("Unknown hsm action: %d\n", hr->hr_action);
549 GOTO(out_ucred, rc = -EINVAL);
/*
 * List size: header + rounded fsname room + a per-item term made of the item
 * header plus the rounded data length.
 * NOTE(review): the per-item term rounds hr_data_len, while hai_len below is
 * stored as sizeof(*hai) + hr_data_len without rounding - confirm hai_next()
 * applies the same rounding when stepping between items.
 * NOTE(review): this arithmetic uses client-supplied hr_data_len; confirm the
 * result cannot overflow the type of hal_size before MDT_HSM_ALLOC caps it.
 */
552 hal_size = sizeof(*hal) + cfs_size_round(MTI_NAME_MAXLEN) /* fsname */ +
553 (sizeof(*hai) + cfs_size_round(hr->hr_data_len)) *
556 MDT_HSM_ALLOC(hal, hal_size);
558 GOTO(out_ucred, rc = -ENOMEM);
/* List-wide fields are copied straight from the request header. */
560 hal->hal_version = HAL_VERSION;
561 hal->hal_archive_id = hr->hr_archive_id;
562 hal->hal_flags = hr->hr_flags;
563 obd_uuid2fsname(hal->hal_fsname, mdt_obd_name(info->mti_mdt),
/*
 * One pass over the user items. For each one the FID is first looked up in
 * the list built so far (is_fid_in_hal); the item is then filled with the
 * action, FID, extent and a copy of the shared data blob.
 */
567 hai = hai_first(hal);
568 for (i = 0; i < hr->hr_itemcount; i++, hai = hai_next(hai)) {
569 /* Get rid of duplicate entries. Otherwise we get
570 * duplicated work in the llog. */
571 if (is_fid_in_hal(hal, &hui[i].hui_fid))
574 hai->hai_action = action;
577 hai->hai_fid = hui[i].hui_fid;
578 hai->hai_extent = hui[i].hui_extent;
/* Every item receives the same hr_data_len bytes of opaque data. */
579 memcpy(hai->hai_data, data, hr->hr_data_len);
580 hai->hai_len = sizeof(*hai) + hr->hr_data_len;
/* Hand the completed list over, then free it with its allocation size. */
585 rc = mdt_hsm_add_actions(info, hal);
587 MDT_HSM_FREE(hal, hal_size);
592 mdt_exit_ucred(info);
594 mdt_thread_info_fini(info);