Whamcloud - gitweb
LU-848 clio: page writeback support
[fs/lustre-release.git] / lustre / osc / osc_create.c
1 /* -*- mode: c; c-basic-offset: 8; indent-tabs-mode: nil; -*-
2  * vim:expandtab:shiftwidth=8:tabstop=8:
3  *
4  * GPL HEADER START
5  *
6  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
7  *
8  * This program is free software; you can redistribute it and/or modify
9  * it under the terms of the GNU General Public License version 2 only,
10  * as published by the Free Software Foundation.
11  *
12  * This program is distributed in the hope that it will be useful, but
13  * WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
15  * General Public License version 2 for more details (a copy is included
16  * in the LICENSE file that accompanied this code).
17  *
18  * You should have received a copy of the GNU General Public License
19  * version 2 along with this program; If not, see
20  * http://www.sun.com/software/products/lustre/docs/GPLv2.pdf
21  *
22  * Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
23  * CA 95054 USA or visit www.sun.com if you need additional information or
24  * have any questions.
25  *
26  * GPL HEADER END
27  */
28 /*
29  * Copyright (c) 2003, 2010, Oracle and/or its affiliates. All rights reserved.
30  * Use is subject to license terms.
31  *
32  * Copyright (c) 2011 Whamcloud, Inc.
33  *
34  */
35 /*
36  * This file is part of Lustre, http://www.lustre.org/
37  * Lustre is a trademark of Sun Microsystems, Inc.
38  *
39  * lustre/osc/osc_create.c
 * For testing and management it is treated as an obd_device,
 * although it does not export a full OBD method table (the
 * requests are coming in over the wire, so object target modules
 * do not have a full method table.)
44  *
45  * Author: Peter Braam <braam@clusterfs.com>
46  */
47
48 #ifndef EXPORT_SYMTAB
49 # define EXPORT_SYMTAB
50 #endif
51 #define DEBUG_SUBSYSTEM S_OSC
52
53 #ifdef __KERNEL__
54 # include <libcfs/libcfs.h>
55 #else /* __KERNEL__ */
56 # include <liblustre.h>
57 #endif
58
59 #ifdef  __CYGWIN__
60 # include <ctype.h>
61 #endif
62
63 #include <lustre_dlm.h>
64 #include <obd_class.h>
65 #include "osc_internal.h"
66
/*
 * Timeout used for object creation, defined as half of obd_timeout.
 * In this file it is passed to cfs_time_seconds() when waiting for
 * precreated objects and to ptlrpc_prep_fakereq() for delayed asynchronous
 * creates.
 */
/* XXX need AT adjust ? */
#define osc_create_timeout      (obd_timeout / 2)
69
/*
 * Per-request state kept in the request's async-args area (obtained with
 * ptlrpc_req_async_args()).  It is used both by the real precreate RPC
 * (rq_oscc, rq_grow_count) and by the fake requests queued by
 * osc_create_async() (rq_oscc, rq_lsm, rq_oinfo).
 */
struct osc_create_async_args {
        /* creator this request belongs to */
        struct osc_creator      *rq_oscc;
        /* stripe md whose lsm_object_id receives the allocated id */
        struct lov_stripe_md    *rq_lsm;
        /* caller's obd_info; oi_oa is filled in and oi_cb_up is called */
        struct obd_info         *rq_oinfo;
        /* value of oscc_grow_count when the precreate RPC was built */
        int                      rq_grow_count;
};
76
/* Defined further down; declared here because osc_interpret_create()
 * calls both of them before their definitions. */
static int oscc_internal_create(struct osc_creator *oscc);
static int handle_async_create(struct ptlrpc_request *req, int rc);
79
80 static int osc_interpret_create(const struct lu_env *env,
81                                 struct ptlrpc_request *req, void *data, int rc)
82 {
83         struct osc_create_async_args *args = ptlrpc_req_async_args(req);
84         struct osc_creator *oscc = args->rq_oscc;
85         struct ost_body *body = NULL;
86         struct ptlrpc_request *fake_req, *pos;
87         ENTRY;
88
89         if (req->rq_repmsg) {
90                 body = req_capsule_server_get(&req->rq_pill, &RMF_OST_BODY);
91                 if (body == NULL && rc == 0)
92                         rc = -EPROTO;
93         }
94
95         LASSERT(oscc && (oscc->oscc_obd != LP_POISON));
96
97         cfs_spin_lock(&oscc->oscc_lock);
98         oscc->oscc_flags &= ~OSCC_FLAG_CREATING;
99         switch (rc) {
100         case 0: {
101                 if (body) {
102                         int diff =ostid_id(&body->oa.o_oi)- oscc->oscc_last_id;
103
104                         /* oscc_internal_create() stores the original value of
105                          * grow_count in osc_create_async_args::rq_grow_count.
106                          * We can't compare against oscc_grow_count directly,
107                          * because it may have been increased while the RPC
108                          * is in flight, so we would always find ourselves
109                          * having created fewer objects and decreasing the
110                          * precreate request size.  b=18577 */
111                         if (diff < args->rq_grow_count) {
112                                 /* the OST has not managed to create all the
113                                  * objects we asked for */
114                                 oscc->oscc_grow_count = max(diff,
115                                                             OST_MIN_PRECREATE);
116                                 /* don't bump grow_count next time */
117                                 oscc->oscc_flags |= OSCC_FLAG_LOW;
118                         } else {
119                                 /* the OST is able to keep up with the work,
120                                  * we could consider increasing grow_count
121                                  * next time if needed */
122                                 oscc->oscc_flags &= ~OSCC_FLAG_LOW;
123                         }
124                         oscc->oscc_last_id = ostid_id(&body->oa.o_oi);
125                 }
126                 cfs_spin_unlock(&oscc->oscc_lock);
127                 break;
128         }
129         case -EROFS:
130                 oscc->oscc_flags |= OSCC_FLAG_RDONLY;
131         case -ENOSPC:
132         case -EFBIG: 
133                 if (rc != -EROFS) {
134                         oscc->oscc_flags |= OSCC_FLAG_NOSPC;
135                         if (body && rc == -ENOSPC) {
136                                 oscc->oscc_last_id = body->oa.o_id;
137                                 oscc->oscc_grow_count = OST_MIN_PRECREATE;
138
139                                 if ((body->oa.o_valid & OBD_MD_FLFLAGS) &&
140                                     (body->oa.o_flags & OBD_FL_NOSPC_BLK))
141                                         oscc->oscc_flags |= OSCC_FLAG_NOSPC_BLK;
142                                 else
143                                         rc = 0;
144                         }
145                 }
146                 cfs_spin_unlock(&oscc->oscc_lock);
147                 DEBUG_REQ(D_INODE, req, "OST out of space, flagging");
148                 break;
149         case -EIO: {
150                 /* filter always set body->oa.o_id as the last_id
151                  * of filter (see filter_handle_precreate for detail)*/
152                 if (body && body->oa.o_id > oscc->oscc_last_id)
153                         oscc->oscc_last_id = body->oa.o_id;
154                 cfs_spin_unlock(&oscc->oscc_lock);
155                 break;
156         }
157         case -EINTR:
158         case -EWOULDBLOCK: {
159                 /* aka EAGAIN we should not delay create if import failed -
160                  * this avoid client stick in create and avoid race with
161                  * delorphan */
162                 /* EINTR say - old create request is killed due mds<>ost
163                  * eviction - OSCC_FLAG_RECOVERING can already set due
164                  * IMP_DISCONN event */
165                 oscc->oscc_flags |= OSCC_FLAG_RECOVERING;
166                 /* oscc->oscc_grow_count = OST_MIN_PRECREATE; */
167                 cfs_spin_unlock(&oscc->oscc_lock);
168                 break;
169         }
170         default: {
171                 oscc->oscc_flags |= OSCC_FLAG_RECOVERING;
172                 oscc->oscc_grow_count = OST_MIN_PRECREATE;
173                 cfs_spin_unlock(&oscc->oscc_lock);
174                 DEBUG_REQ(D_ERROR, req,
175                           "Unknown rc %d from async create: failing oscc", rc);
176                 ptlrpc_fail_import(req->rq_import,
177                                    lustre_msg_get_conn_cnt(req->rq_reqmsg));
178         }
179         }
180
181         CDEBUG(D_HA, "preallocated through id "LPU64" (next to use "LPU64")\n",
182                oscc->oscc_last_id, oscc->oscc_next_id);
183
184         cfs_spin_lock(&oscc->oscc_lock);
185         cfs_list_for_each_entry_safe(fake_req, pos,
186                                      &oscc->oscc_wait_create_list, rq_list) {
187                 if (handle_async_create(fake_req, rc) == -EAGAIN) {
188                         oscc_internal_create(oscc);
189                         /* sending request should be never fail because
190                          * osc use preallocated requests pool */
191                         GOTO(exit_wakeup, rc);
192                 }
193         }
194         cfs_spin_unlock(&oscc->oscc_lock);
195
196 exit_wakeup:
197         cfs_waitq_signal(&oscc->oscc_waitq);
198         RETURN(rc);
199 }
200
201 static int oscc_internal_create(struct osc_creator *oscc)
202 {
203         struct osc_create_async_args *args;
204         struct ptlrpc_request *request;
205         struct ost_body *body;
206         ENTRY;
207
208         LASSERT_SPIN_LOCKED(&oscc->oscc_lock);
209
210         /* Do not check for a degraded OST here - bug21563/bug18539 */
211         if (oscc->oscc_flags & OSCC_FLAG_RECOVERING) {
212                 cfs_spin_unlock(&oscc->oscc_lock);
213                 RETURN(0);
214         }
215
216         /* we need check it before OSCC_FLAG_CREATING - because need
217          * see lower number of precreate objects */
218         if (oscc->oscc_grow_count < oscc->oscc_max_grow_count &&
219             ((oscc->oscc_flags & OSCC_FLAG_LOW) == 0) &&
220             (__s64)(oscc->oscc_last_id - oscc->oscc_next_id) <=
221                    (oscc->oscc_grow_count / 4 + 1)) {
222                 oscc->oscc_flags |= OSCC_FLAG_LOW;
223                 oscc->oscc_grow_count *= 2;
224         }
225
226         if (oscc->oscc_flags & OSCC_FLAG_CREATING) {
227                 cfs_spin_unlock(&oscc->oscc_lock);
228                 RETURN(0);
229         }
230
231         if (oscc->oscc_grow_count > oscc->oscc_max_grow_count / 2)
232                 oscc->oscc_grow_count = oscc->oscc_max_grow_count / 2;
233
234         oscc->oscc_flags |= OSCC_FLAG_CREATING;
235         cfs_spin_unlock(&oscc->oscc_lock);
236
237         request = ptlrpc_request_alloc_pack(oscc->oscc_obd->u.cli.cl_import,
238                                             &RQF_OST_CREATE,
239                                             LUSTRE_OST_VERSION, OST_CREATE);
240         if (request == NULL) {
241                 cfs_spin_lock(&oscc->oscc_lock);
242                 oscc->oscc_flags &= ~OSCC_FLAG_CREATING;
243                 cfs_spin_unlock(&oscc->oscc_lock);
244                 RETURN(-ENOMEM);
245         }
246
247         request->rq_request_portal = OST_CREATE_PORTAL;
248         ptlrpc_at_set_req_timeout(request);
249         body = req_capsule_client_get(&request->rq_pill, &RMF_OST_BODY);
250         args = ptlrpc_req_async_args(request);
251         args->rq_oscc = oscc;
252
253         cfs_spin_lock(&oscc->oscc_lock);
254         args->rq_grow_count = oscc->oscc_grow_count;
255
256         if (likely(fid_seq_is_mdt(oscc->oscc_oa.o_seq))) {
257                 body->oa.o_oi.oi_seq = oscc->oscc_oa.o_seq;
258                 body->oa.o_oi.oi_id  = oscc->oscc_last_id +
259                                        oscc->oscc_grow_count;
260         } else {
261                 /*Just warning here currently, since not sure how fid-on-ost
262                  *will be implemented here */
263                 CWARN("o_seq: "LPU64" is not indicate any MDTs.\n",
264                        oscc->oscc_oa.o_seq);
265         }
266         cfs_spin_unlock(&oscc->oscc_lock);
267
268         body->oa.o_valid |= OBD_MD_FLID | OBD_MD_FLGROUP;
269         CDEBUG(D_RPCTRACE, "prealloc through id "LPU64" (last seen "LPU64")\n",
270                body->oa.o_id, oscc->oscc_last_id);
271
272         /* we should not resend create request - anyway we will have delorphan
273          * and kill these objects */
274         request->rq_no_delay = request->rq_no_resend = 1;
275         ptlrpc_request_set_replen(request);
276
277         request->rq_interpret_reply = osc_interpret_create;
278         ptlrpcd_add_req(request, PDL_POLICY_ROUND, -1);
279
280         RETURN(0);
281 }
282
283 static int oscc_has_objects_nolock(struct osc_creator *oscc, int count)
284 {
285         return ((__s64)(oscc->oscc_last_id - oscc->oscc_next_id) >= count);
286 }
287
288 static int oscc_has_objects(struct osc_creator *oscc, int count)
289 {
290         int have_objs;
291
292         cfs_spin_lock(&oscc->oscc_lock);
293         have_objs = oscc_has_objects_nolock(oscc, count);
294         cfs_spin_unlock(&oscc->oscc_lock);
295
296         return have_objs;
297 }
298
299 static int oscc_wait_for_objects(struct osc_creator *oscc, int count)
300 {
301         int have_objs;
302         int ost_unusable;
303
304         ost_unusable = oscc->oscc_obd->u.cli.cl_import->imp_invalid;
305
306         cfs_spin_lock(&oscc->oscc_lock);
307         ost_unusable |= (OSCC_FLAG_NOSPC | OSCC_FLAG_RDONLY |
308                          OSCC_FLAG_EXITING) & oscc->oscc_flags;
309         have_objs = oscc_has_objects_nolock(oscc, count);
310
311         if (!ost_unusable && !have_objs)
312                 /* they release lock himself */
313                 have_objs = oscc_internal_create(oscc);
314         else
315                 cfs_spin_unlock(&oscc->oscc_lock);
316
317         return have_objs || ost_unusable;
318 }
319
320 static int oscc_precreate(struct osc_creator *oscc)
321 {
322         struct l_wait_info lwi;
323         int rc = 0;
324         ENTRY;
325
326         if (oscc_has_objects(oscc, oscc->oscc_grow_count / 2))
327                 RETURN(0);
328
329         /* we should be not block forever - because client's create rpc can
330          * stick in mds for long time and forbid client reconnect */
331         lwi = LWI_TIMEOUT(cfs_timeout_cap(cfs_time_seconds(osc_create_timeout)),
332                           NULL, NULL);
333
334         rc = l_wait_event(oscc->oscc_waitq, oscc_wait_for_objects(oscc, 1), &lwi);
335         RETURN(rc);
336 }
337
338 static int oscc_in_sync(struct osc_creator *oscc)
339 {
340         int sync;
341
342         cfs_spin_lock(&oscc->oscc_lock);
343         sync = oscc->oscc_flags & OSCC_FLAG_SYNC_IN_PROGRESS;
344         cfs_spin_unlock(&oscc->oscc_lock);
345
346         return sync;
347 }
348
349 /* decide if the OST has remaining object, return value :
350         0 : the OST has remaining objects, may or may not send precreation RPC.
351         1 : the OST has no remaining object, and the sent precreation RPC
352             has not been completed yet.
353         2 : the OST has no remaining object, and will not get any for
354             a potentially very long time
355      1000 : unusable
356  */
357 int osc_precreate(struct obd_export *exp)
358 {
359         struct osc_creator *oscc = &exp->exp_obd->u.cli.cl_oscc;
360         struct obd_import *imp = exp->exp_imp_reverse;
361         int rc;
362         ENTRY;
363
364         LASSERT(oscc != NULL);
365         if (imp != NULL && imp->imp_deactive)
366                 GOTO(out_nolock, rc = 1000);
367
368         /* Handle critical states first */
369         cfs_spin_lock(&oscc->oscc_lock);
370         if (oscc->oscc_flags & OSCC_FLAG_NOSPC_BLK ||
371             oscc->oscc_flags & OSCC_FLAG_RDONLY ||
372             oscc->oscc_flags & OSCC_FLAG_EXITING)
373                 GOTO(out, rc = 1000);
374
375         if ((oscc->oscc_flags & OSCC_FLAG_RECOVERING) ||
376             (oscc->oscc_flags & OSCC_FLAG_DEGRADED))
377                 GOTO(out, rc = 2);
378
379         if (oscc_has_objects_nolock(oscc, oscc->oscc_grow_count / 2))
380                 GOTO(out, rc = 0);
381
382         /* Return 0, if we have at least one object - bug 22884 */
383         rc = oscc_has_objects_nolock(oscc, 1) ? 0 : 1;
384
385         if (oscc->oscc_flags & OSCC_FLAG_NOSPC)
386                 GOTO(out, (rc == 0) ? 0 : 1000);
387
388         /* Do not check for OSCC_FLAG_CREATING flag here, let
389          * osc_precreate() call oscc_internal_create() and
390          * adjust oscc_grow_count bug21563 */
391         if (oscc->oscc_flags & OSCC_FLAG_SYNC_IN_PROGRESS)
392                 GOTO(out, rc);
393
394         if (oscc_internal_create(oscc))
395                 GOTO(out_nolock, rc = 1000);
396
397         RETURN(rc);
398 out:
399         cfs_spin_unlock(&oscc->oscc_lock);
400 out_nolock:
401         return rc;
402 }
403
404 static int handle_async_create(struct ptlrpc_request *req, int rc)
405 {
406         struct osc_create_async_args *args = ptlrpc_req_async_args(req);
407         struct osc_creator    *oscc = args->rq_oscc;
408         struct lov_stripe_md  *lsm  = args->rq_lsm;
409         struct obd_info       *oinfo = args->rq_oinfo;
410         struct obdo           *oa = oinfo->oi_oa;
411
412         LASSERT_SPIN_LOCKED(&oscc->oscc_lock);
413
414         if(rc)
415                 GOTO(out_wake, rc);
416
417         /* Handle the critical type errors first.
418          * Should we also test cl_import state as well ? */
419         if (oscc->oscc_flags & OSCC_FLAG_EXITING)
420                 GOTO(out_wake, rc = -EIO);
421
422         if (oscc->oscc_flags & OSCC_FLAG_NOSPC_BLK)
423                 GOTO(out_wake, rc = -ENOSPC);
424
425         if (oscc->oscc_flags & OSCC_FLAG_RDONLY)
426                 GOTO(out_wake, rc = -EROFS);
427
428         /* should be try wait until recovery finished */
429         if((oscc->oscc_flags & OSCC_FLAG_RECOVERING) ||
430            (oscc->oscc_flags & OSCC_FLAG_DEGRADED))
431                 RETURN(-EAGAIN);
432
433         if (oscc_has_objects_nolock(oscc, 1)) {
434                 memcpy(oa, &oscc->oscc_oa, sizeof(*oa));
435                 oa->o_id = oscc->oscc_next_id;
436                 lsm->lsm_object_id = oscc->oscc_next_id;
437                 oscc->oscc_next_id++;
438
439                 CDEBUG(D_RPCTRACE, " set oscc_next_id = "LPU64"\n",
440                        oscc->oscc_next_id);
441                 GOTO(out_wake, rc = 0);
442         }
443
444         /* we don't have objects now - continue wait */
445         RETURN(-EAGAIN);
446
447 out_wake:
448
449         rc = oinfo->oi_cb_up(oinfo, rc);
450         ptlrpc_fakereq_finished(req);
451
452         RETURN(rc);
453 }
454
455 static int async_create_interpret(const struct lu_env *env,
456                                   struct ptlrpc_request *req, void *data,
457                                   int rc)
458 {
459         struct osc_create_async_args *args = ptlrpc_req_async_args(req);
460         struct osc_creator    *oscc = args->rq_oscc;
461         int ret;
462
463         cfs_spin_lock(&oscc->oscc_lock);
464         ret = handle_async_create(req, rc);
465         cfs_spin_unlock(&oscc->oscc_lock);
466
467         return ret;
468 }
469
470 int osc_create_async(struct obd_export *exp, struct obd_info *oinfo,
471                      struct lov_stripe_md **ea, struct obd_trans_info *oti)
472 {
473         int rc;
474         struct ptlrpc_request *fake_req;
475         struct osc_create_async_args *args;
476         struct osc_creator *oscc = &exp->exp_obd->u.cli.cl_oscc;
477         struct obdo *oa = oinfo->oi_oa;
478         ENTRY;
479
480         if ((oa->o_valid & OBD_MD_FLGROUP) && !fid_seq_is_mdt(oa->o_seq)) {
481                 rc = osc_real_create(exp, oinfo->oi_oa, ea, oti);
482                 rc = oinfo->oi_cb_up(oinfo, rc);
483                 RETURN(rc);
484         }
485
486         if ((oa->o_valid & OBD_MD_FLFLAGS) &&
487             oa->o_flags == OBD_FL_RECREATE_OBJS) {
488                 rc = osc_real_create(exp, oinfo->oi_oa, ea, oti);
489                 rc = oinfo->oi_cb_up(oinfo, rc);
490                 RETURN(rc);
491         }
492
493         LASSERT((*ea) != NULL);
494
495         fake_req = ptlrpc_prep_fakereq(oscc->oscc_obd->u.cli.cl_import,
496                                        osc_create_timeout,
497                                        async_create_interpret);
498         if (fake_req == NULL) {
499                 rc = oinfo->oi_cb_up(oinfo, -ENOMEM);
500                 RETURN(-ENOMEM);
501         }
502
503         args = ptlrpc_req_async_args(fake_req);
504         CLASSERT(sizeof(*args) <= sizeof(fake_req->rq_async_args));
505
506         args->rq_oscc  = oscc;
507         args->rq_lsm   = *ea;
508         args->rq_oinfo = oinfo;
509
510         cfs_spin_lock(&oscc->oscc_lock);
511         /* try fast path */
512         rc = handle_async_create(fake_req, 0);
513         if (rc == -EAGAIN) {
514                 /* We don't have any objects, wait until we get a reply. */
515                 ptlrpcd_add_req(fake_req, PDL_POLICY_ROUND, -1);
516                 cfs_list_add(&fake_req->rq_list,
517                              &oscc->oscc_wait_create_list);
518                 cfs_spin_unlock(&oscc->oscc_lock);
519                 /* EAGAIN mean - request is delayed */
520                 rc = 0;
521         } else {
522                 cfs_spin_unlock(&oscc->oscc_lock);
523                 /* need free request if was error hit or
524                  * objects already allocated */
525                 ptlrpc_req_finished(fake_req);
526         }
527
528         RETURN(rc);
529 }
530
/*
 * Synchronous object creation.
 *
 * - OBD_FL_RECREATE_OBJS requests and requests for a non-MDT sequence are
 *   forwarded directly to osc_real_create().
 * - An OBD_FL_DELORPHAN request performs orphan cleanup while the creator is
 *   in recovery: -EBUSY if a sync is already in progress, 0 if the creator
 *   is not recovering, otherwise a synchronous osc_real_create() with
 *   o_id = oscc_next_id - 1 whose result resets the creator state.
 * - Any other request takes the next precreated object id, waiting through
 *   oscc_precreate() until one is available or the creator enters a state
 *   in which none will come.
 *
 * On success oa is overwritten from oscc_oa with o_id set to the allocated
 * id, and *ea points to the stripe md (allocated here when *ea was NULL).
 *
 * Returns 0 or a negative errno (-EIO, -ENOSPC, -EROFS, -EBUSY, or an error
 * from obd_alloc_memmd()/osc_real_create()).  For a DELORPHAN request any
 * error from the wait loop other than -EIO is turned into 0.
 */
int osc_create(struct obd_export *exp, struct obdo *oa,
               struct lov_stripe_md **ea, struct obd_trans_info *oti)
{
        struct osc_creator *oscc = &exp->exp_obd->u.cli.cl_oscc;
        struct obd_import  *imp  = exp->exp_obd->u.cli.cl_import;
        struct lov_stripe_md *lsm;
        int del_orphan = 0, rc = 0;
        ENTRY;

        LASSERT(oa);
        LASSERT(ea);
        LASSERT(oa->o_valid & OBD_MD_FLGROUP);

        /* explicit re-creation of objects bypasses the precreate pool */
        if ((oa->o_valid & OBD_MD_FLFLAGS) &&
            oa->o_flags == OBD_FL_RECREATE_OBJS) {
                RETURN(osc_real_create(exp, oa, ea, oti));
        }

        /* so do objects that do not belong to an MDT sequence */
        if (!fid_seq_is_mdt(oa->o_seq))
                RETURN(osc_real_create(exp, oa, ea, oti));

        /* this is the special case where create removes orphans */
        if (oa->o_valid & OBD_MD_FLFLAGS &&
            oa->o_flags == OBD_FL_DELORPHAN) {
                cfs_spin_lock(&oscc->oscc_lock);
                /* only one orphan cleanup at a time */
                if (oscc->oscc_flags & OSCC_FLAG_SYNC_IN_PROGRESS) {
                        cfs_spin_unlock(&oscc->oscc_lock);
                        RETURN(-EBUSY);
                }
                /* nothing to clean up unless the creator is recovering */
                if (!(oscc->oscc_flags & OSCC_FLAG_RECOVERING)) {
                        cfs_spin_unlock(&oscc->oscc_lock);
                        RETURN(0);
                }

                oscc->oscc_flags |= OSCC_FLAG_SYNC_IN_PROGRESS;
                /* seting flag LOW we prevent extra grow precreate size
                 * and enforce use last assigned size */
                oscc->oscc_flags |= OSCC_FLAG_LOW;
                cfs_spin_unlock(&oscc->oscc_lock);
                CDEBUG(D_HA, "%s: oscc recovery started - delete to "LPU64"\n",
                       oscc->oscc_obd->obd_name, oscc->oscc_next_id - 1);

                del_orphan = 1;

                /* delete from next_id on up */
                oa->o_valid |= OBD_MD_FLID;
                oa->o_id = oscc->oscc_next_id - 1;

                /* synchronous RPC, issued without oscc_lock held; oa is
                 * read again below, so its contents after the call are
                 * what drives the state update */
                rc = osc_real_create(exp, oa, ea, NULL);

                cfs_spin_lock(&oscc->oscc_lock);
                oscc->oscc_flags &= ~OSCC_FLAG_SYNC_IN_PROGRESS;
                if (rc == 0 || rc == -ENOSPC) {
                        struct obd_connect_data *ocd;

                        if (rc == -ENOSPC) {
                                oscc->oscc_flags |= OSCC_FLAG_NOSPC;
                                if ((oa->o_valid & OBD_MD_FLFLAGS) &&
                                    (oa->o_flags & OBD_FL_NOSPC_BLK))
                                        oscc->oscc_flags |= OSCC_FLAG_NOSPC_BLK;
                        }
                        /* recovery is over even when the OST is full */
                        oscc->oscc_flags &= ~OSCC_FLAG_RECOVERING;

                        oscc->oscc_last_id = oa->o_id;
                        ocd = &imp->imp_connect_data;
                        if (ocd->ocd_connect_flags & OBD_CONNECT_SKIP_ORPHAN) {
                                /*
                                 * The OST reports back in oa->o_id from where
                                 * we should restart in order to skip orphan
                                 * objects
                                 */
                                CDEBUG(D_HA, "%s: Skip orphan set, reset last "
                                       "objid\n", oscc->oscc_obd->obd_name);
                                oscc->oscc_next_id = oa->o_id + 1;
                        }

                        /* sanity check for next objid. see bug 17025 */
                        LASSERT(oscc->oscc_next_id == oa->o_id + 1);

                        CDEBUG(D_HA, "%s: oscc recovery finished, last_id: "
                               LPU64", rc: %d\n", oscc->oscc_obd->obd_name,
                               oscc->oscc_last_id, rc);
                } else {
                        CDEBUG(D_ERROR, "%s: oscc recovery failed: %d\n",
                               oscc->oscc_obd->obd_name, rc);
                }

                /* wake up anyone waiting on oscc_waitq */
                cfs_waitq_signal(&oscc->oscc_waitq);
                cfs_spin_unlock(&oscc->oscc_lock);

                if (rc < 0)
                        RETURN(rc);
        }

        /* use the caller's stripe md, or allocate one */
        lsm = *ea;
        if (lsm == NULL) {
                rc = obd_alloc_memmd(exp, &lsm);
                if (rc < 0)
                        RETURN(rc);
        }

        /* Every exit from this loop happens with oscc_lock released. */
        while (1) {
                if (oscc_in_sync(oscc))
                        CDEBUG(D_HA,"%s: oscc recovery in progress, waiting\n",
                               oscc->oscc_obd->obd_name);

                /* NOTE(review): a non-zero rc from oscc_precreate() is only
                 * logged and is not reset before the checks below, so the
                 * EXITING, DELORPHAN and "object available" exits can leave
                 * the loop with it - confirm this is intended. */
                rc = oscc_precreate(oscc);
                if (rc)
                        CDEBUG(D_HA,"%s: error create %d\n",
                               oscc->oscc_obd->obd_name, rc);

                cfs_spin_lock(&oscc->oscc_lock);

                /* wakeup but recovery did not finished */
                if ((oscc->oscc_obd->u.cli.cl_import->imp_invalid) ||
                    (oscc->oscc_flags & OSCC_FLAG_RECOVERING)) {
                        rc = -EIO;
                        cfs_spin_unlock(&oscc->oscc_lock);
                        break;
                }

                if (oscc->oscc_flags & OSCC_FLAG_NOSPC_BLK) {
                        rc = -ENOSPC;
                        cfs_spin_unlock(&oscc->oscc_lock);
                        break;
                }

                if (oscc->oscc_flags & OSCC_FLAG_RDONLY) {
                        rc = -EROFS;
                        cfs_spin_unlock(&oscc->oscc_lock);
                        break;
                }

                // Should we report -EIO error ?
                /* rc is left as returned by oscc_precreate() here */
                if (oscc->oscc_flags & OSCC_FLAG_EXITING) {
                        cfs_spin_unlock(&oscc->oscc_lock);
                        break;
                }

                /**
                 * If this is DELORPHAN process, no need create object here,
                 * otherwise this will create a gap of object id, and MDS
                 * might create some orphan log (mds_lov_update_objids), then
                 * remove objects wrongly on OST. Bug 21379.
                 */
                if (oa->o_valid & OBD_MD_FLFLAGS &&
                        oa->o_flags == OBD_FL_DELORPHAN) {
                        cfs_spin_unlock(&oscc->oscc_lock);
                        break;
                }

                /* hand out the next precreated id */
                if (oscc_has_objects_nolock(oscc, 1)) {
                        memcpy(oa, &oscc->oscc_oa, sizeof(*oa));
                        oa->o_id = oscc->oscc_next_id;
                        lsm->lsm_object_id = oscc->oscc_next_id;
                        *ea = lsm;
                        oscc->oscc_next_id++;
                        cfs_spin_unlock(&oscc->oscc_lock);

                        CDEBUG(D_RPCTRACE, "%s: set oscc_next_id = "LPU64"\n",
                               exp->exp_obd->obd_name, oscc->oscc_next_id);
                        break;
                }

                /* no object left and the OST reported it is out of space */
                if (oscc->oscc_flags & OSCC_FLAG_NOSPC) {
                        rc = -ENOSPC;
                        cfs_spin_unlock(&oscc->oscc_lock);
                        break;
                }

                /* nothing conclusive yet - wait again */
                cfs_spin_unlock(&oscc->oscc_lock);
        }

        if (rc == 0) {
                CDEBUG(D_INFO, "%s: returning objid "LPU64"\n",
                       obd2cli_tgt(oscc->oscc_obd), lsm->lsm_object_id);
        } else {
                /* free the stripe md only if it was allocated here and
                 * never handed to the caller */
                if (*ea == NULL)
                        obd_free_memmd(exp, &lsm);
                if (del_orphan != 0 && rc != -EIO)
                        /* Ignore non-IO precreate error for clear orphan */
                        rc = 0;
        }
        RETURN(rc);
}
716
717 void oscc_init(struct obd_device *obd)
718 {
719         struct osc_creator *oscc;
720
721         if (obd == NULL)
722                 return;
723
724         oscc = &obd->u.cli.cl_oscc;
725
726         memset(oscc, 0, sizeof(*oscc));
727
728         cfs_waitq_init(&oscc->oscc_waitq);
729         cfs_spin_lock_init(&oscc->oscc_lock);
730         oscc->oscc_obd = obd;
731         oscc->oscc_grow_count = OST_MIN_PRECREATE;
732         oscc->oscc_max_grow_count = OST_MAX_PRECREATE;
733
734         oscc->oscc_next_id = 2;
735         oscc->oscc_last_id = 1;
736         oscc->oscc_flags |= OSCC_FLAG_RECOVERING;
737
738         CFS_INIT_LIST_HEAD(&oscc->oscc_wait_create_list);
739
740         /* XXX the export handle should give the oscc the last object */
741         /* oed->oed_oscc.oscc_last_id = exph->....; */
742 }
743
744 void oscc_fini(struct obd_device *obd)
745 {
746         struct osc_creator *oscc = &obd->u.cli.cl_oscc;
747         ENTRY;
748
749
750         cfs_spin_lock(&oscc->oscc_lock);
751         oscc->oscc_flags &= ~OSCC_FLAG_RECOVERING;
752         oscc->oscc_flags |= OSCC_FLAG_EXITING;
753         cfs_spin_unlock(&oscc->oscc_lock);
754 }