Whamcloud - gitweb
LU-12861 libcfs: provide an scnprintf and start using it
[fs/lustre-release.git] / lustre / tests / fsx.c
1 /*
2  * Copyright (c) 1998-2001 Apple Computer, Inc. All rights reserved.
3  *
4  * Copyright (c) 2012, Intel Corporation.
5  *
6  * @APPLE_LICENSE_HEADER_START@
7  *
8  * The contents of this file constitute Original Code as defined in and
9  * are subject to the Apple Public Source License Version 1.1 (the
10  * "License").  You may not use this file except in compliance with the
11  * License.  Please obtain a copy of the License at
12  * http://www.apple.com/publicsource and read it before using this file.
13  *
14  * This Original Code and all software distributed under the License are
15  * distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY KIND, EITHER
16  * EXPRESS OR IMPLIED, AND APPLE HEREBY DISCLAIMS ALL SUCH WARRANTIES,
17  * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY,
18  * FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT.  Please see the
19  * License for the specific language governing rights and limitations
20  * under the License.
21  *
22  * @APPLE_LICENSE_HEADER_END@
23  *
24  *      File:   fsx.c
25  *      Author: Avadis Tevanian, Jr.
26  *
27  *      File system exerciser.
28  *
29  *      Rewrite and enhancements 1998-2001 Conrad Minshall -- conrad@mac.com
30  *
31  *      Various features from Joe Sokol, Pat Dirks, and Clark Warner.
32  *
33  *      Small changes to work under Linux -- davej@suse.de
34  *
35  *      Sundry porting patches from Guy Harris 12/2001
36  * $FreeBSD: src/tools/regression/fsx/fsx.c,v 1.1 2001/12/20 04:15:57 jkh Exp $
37  */
38 #include <sys/types.h>
39 #include <sys/stat.h>
40 #if defined(_UWIN) || defined(__linux__)
41 # include <sys/param.h>
42 # include <limits.h>
43 # include <time.h>
44 # include <strings.h>
45 # include <sys/time.h>
46 #endif
47 #include <fcntl.h>
48 #include <sys/mman.h>
49 #ifndef MAP_FILE
50 # define MAP_FILE 0
51 #endif
52 #include <limits.h>
53 #include <signal.h>
54 #include <stdio.h>
55 #include <stdlib.h>
56 #include <string.h>
57 #include <unistd.h>
58 #include <stdarg.h>
59 #include <errno.h>
60 #include <libcfs/util/string.h>
61
62 #define NUMPRINTCOLUMNS 32      /* # columns of data to print on each line */
63
64 /*
65  * Each test run will work with one or more separate file descriptors for the
66  * same file.  This allows testing cache coherency across multiple mountpoints
67  * of the same network filesystem on a single client.
68  */
struct test_file {
        char *path;     /* pathname passed to open() for this entry */
        int fd;         /* descriptor returned by open() for path */
} *test_files = NULL;   /* array of num_test_files entries */
73
int num_test_files;             /* number of entries in test_files */
/* How get_tf() chooses the test file for the next operation. */
enum fd_iteration_policy {
        FD_SINGLE,      /* always use test_files[0] */
        FD_ROTATE,      /* step through the files in order using fd_last */
        FD_RANDOM,      /* choose a file with random() */
};
int fd_policy = FD_RANDOM;      /* active fd_iteration_policy value */
int fd_last;                    /* counter advanced by FD_ROTATE */
82
83 /*
84  *      A log entry is an operation and a bunch of arguments.
85  */
86
struct log_entry {
        int                     operation;      /* one of the OP_* codes */
        int                     args[3];        /* meaning depends on operation */
        struct timeval          tv;             /* timestamp passed to log4() */
        const struct test_file  *tf;            /* file the operation used */
};
93
#define LOGSIZE 100000                  /* entries kept in the circular log */

struct log_entry        oplog[LOGSIZE]; /* the log */
int                     logptr = 0;     /* current position in log */
int                     logcount = 0;   /* total ops */
99
100 /*
101  *      Define operations
102  */
103
#define OP_READ         1
#define OP_WRITE        2
#define OP_TRUNCATE     3
#define OP_CLOSEOPEN    4
#define OP_MAPREAD      5
#define OP_MAPWRITE     6
/* Logged when an operation is not carried out; args[0] is the skipped OP_*. */
#define OP_SKIPPED      7
111
int page_size;
int page_mask;                          /* offset & page_mask = offset within a page */

char    *original_buf;                  /* a pointer to the original data */
char    *good_buf;                      /* a pointer to the correct data */
char    *temp_buf;                      /* a pointer to the current data */
char    *fname;                         /* name of our test file */
char    logfile[PATH_MAX];              /* name of our log file */
char    goodfile[PATH_MAX];             /* name printed by report_failure() for the saved good data */

off_t           file_size = 0;          /* size the test file is expected to have */
off_t           biggest = 0;            /* largest truncate size requested so far */
char            state[256];             /* NOTE(review): presumably random() state - confirm */
unsigned long   testcalls = 0;          /* calls to function "test" */

long    simulatedopcount = 0;           /* -b flag */
int     closeprob = 0;                  /* -c flag */
int     debug = 0;                      /* -d flag */
long    debugstart = 0;                 /* -D flag */
long    maxfilelen = 256 * 1024;        /* -l flag */
int     sizechecks = 1;                 /* -n flag disables them */
int     maxoplen = 64 * 1024;           /* -o flag */
int     quiet = 0;                      /* -q flag */
long    progressinterval = 0;           /* -p flag */
int     readbdy = 1;                    /* -r flag */
int     style = 0;                      /* -s flag */
int     truncbdy = 1;                   /* -t flag */
int     writebdy = 1;                   /* -w flag */
long    monitorstart = -1;              /* -m flag */
long    monitorend = -1;                /* -m flag */
int     lite = 0;                       /* -L flag */
long    numops = -1;                    /* -N flag */
int     randomoplen = 1;                /* -O flag disables it */
int     seed = 1;                       /* -S flag */
int     mapped_writes = 1;              /* -W flag disables */
int     mapped_reads = 1;               /* -R flag disables it */
int     fsxgoodfd = 0;                  /* fd good_buf is saved to on failure; 0 = none */
int     o_direct;                       /* -Z */
FILE *  fsxlogf = NULL;                 /* when non-NULL, prt() output is copied here */
int badoff = -1;                        /* last mismatching offset seen by check_buffers() */
152
/*
 * Print a warning on stderr in the form "fsx: <message>: <error text>".
 *
 * code - error number whose strerror() text ends the line
 * fmt  - printf-style format of the message, or NULL to print only the
 *        error text
 * ap   - argument list consumed by fmt
 *
 * Defined with a prototype rather than an old-style parameter list so that
 * callers get argument type checking.
 */
void
vwarnc(int code, const char *fmt, va_list ap)
{
        fprintf(stderr, "fsx: ");
        if (fmt != NULL) {
                vfprintf(stderr, fmt, ap);
                fprintf(stderr, ": ");
        }
        fprintf(stderr, "%s\n", strerror(code));
}
166
167
/*
 * Print a printf-style warning on stderr via vwarnc(), tagged with the
 * error text for the value errno holds on entry.
 */
void
warn(const char * fmt, ...)
{
        va_list args;
        int code = errno;

        va_start(args, fmt);
        vwarnc(code, fmt, args);
        va_end(args);
}
176
177
178 void
179 __attribute__((format(printf, 1, 2)))
180 prt(char *fmt, ...)
181 {
182         va_list args;
183
184         va_start(args, fmt);
185         vfprintf(stdout, fmt, args);
186         va_end(args);
187
188         if (fsxlogf) {
189                 va_start(args, fmt);
190                 vfprintf(fsxlogf, fmt, args);
191                 va_end(args);
192         }
193 }
194
/*
 * Print "<prefix>: <error text for errno>" through prt().
 *
 * prefix - text identifying the failed call; may be NULL, in which case only
 *          the error text is printed
 */
void
prterr(char *prefix)
{
        /* A NULL argument to %s is undefined, so substitute an empty string. */
        prt("%s%s%s\n", prefix ? prefix : "", prefix ? ": " : "",
            strerror(errno));
}
200
201
202 void
203 log4(int operation, int arg0, int arg1, int arg2, struct timeval *tv,
204         const struct test_file *tf)
205 {
206         struct log_entry *le;
207
208         le = &oplog[logptr];
209         le->operation = operation;
210         le->args[0] = arg0;
211         le->args[1] = arg1;
212         le->args[2] = arg2;
213         le->tv = *tv;
214         le->tf = tf;
215         logptr++;
216         logcount++;
217         if (logptr >= LOGSIZE)
218                 logptr = 0;
219 }
220
221 const char *
222 fill_tf_buf(const struct test_file *tf)
223 {
224         static int max_tf_len;
225         static char tf_buf[32];
226
227         if (fd_policy == FD_SINGLE)
228                 return "";
229
230         if (max_tf_len == 0)
231                 max_tf_len = scnprintf(tf_buf, sizeof(tf_buf) - 1,
232                                       "%u", num_test_files - 1);
233
234         snprintf(tf_buf, sizeof(tf_buf), "[%0*lu]", max_tf_len,
235                 (unsigned long)(tf - test_files));
236
237         return tf_buf;
238 }
239
240 void
241 logdump(void)
242 {
243         int     i, count, down;
244         struct log_entry        *lp;
245
246         prt("LOG DUMP (%d total operations):\n", logcount);
247         if (logcount < LOGSIZE) {
248                 i = 0;
249                 count = logcount;
250         } else {
251                 i = logptr;
252                 count = LOGSIZE;
253         }
254         for ( ; count > 0; count--) {
255                 int opnum;
256
257                 opnum = i+1 + (logcount/LOGSIZE)*LOGSIZE;
258                 lp = &oplog[i];
259                 prt("%d%s: %lu.%06lu ", opnum, fill_tf_buf(lp->tf),
260                     lp->tv.tv_sec, lp->tv.tv_usec);
261
262                 switch (lp->operation) {
263                 case OP_MAPREAD:
264                         prt("MAPREAD  0x%x thru 0x%x (0x%x bytes)",
265                             lp->args[0], lp->args[0] + lp->args[1] - 1,
266                             lp->args[1]);
267                         if (badoff >= lp->args[0] && badoff <
268                                                      lp->args[0] + lp->args[1])
269                                 prt("\t***RRRR***");
270                         break;
271                 case OP_MAPWRITE:
272                         prt("MAPWRITE 0x%x thru 0x%x (0x%x bytes)",
273                             lp->args[0], lp->args[0] + lp->args[1] - 1,
274                             lp->args[1]);
275                         if (badoff >= lp->args[0] && badoff <
276                                                      lp->args[0] + lp->args[1])
277                                 prt("\t******WWWW");
278                         break;
279                 case OP_READ:
280                         prt("READ     0x%x thru 0x%x (0x%x bytes)",
281                             lp->args[0], lp->args[0] + lp->args[1] - 1,
282                             lp->args[1]);
283                         if (badoff >= lp->args[0] &&
284                             badoff < lp->args[0] + lp->args[1])
285                                 prt("\t***RRRR***");
286                         break;
287                 case OP_WRITE:
288                         prt("WRITE    0x%x thru 0x%x (0x%x bytes)",
289                             lp->args[0], lp->args[0] + lp->args[1] - 1,
290                             lp->args[1]);
291                         if (lp->args[0] > lp->args[2])
292                                 prt(" HOLE");
293                         else if (lp->args[0] + lp->args[1] > lp->args[2])
294                                 prt(" EXTEND");
295                         if ((badoff >= lp->args[0] || badoff >=lp->args[2]) &&
296                             badoff < lp->args[0] + lp->args[1])
297                                 prt("\t***WWWW");
298                         break;
299                 case OP_TRUNCATE:
300                         down = lp->args[0] < lp->args[1];
301                         prt("TRUNCATE %s\tfrom 0x%x to 0x%x",
302                             down ? "DOWN" : "UP", lp->args[1], lp->args[0]);
303                         if (badoff >= lp->args[!down] &&
304                             badoff < lp->args[!!down])
305                                 prt("\t******WWWW");
306                         break;
307                 case OP_CLOSEOPEN:
308                         prt("CLOSE/OPEN");
309                         break;
310                 case OP_SKIPPED:
311                         prt("SKIPPED (no operation)");
312                         break;
313                 default:
314                         prt("BOGUS LOG ENTRY (operation code = %d)!",
315                             lp->operation);
316                 }
317                 prt("\n");
318                 i++;
319                 if (i == LOGSIZE)
320                         i = 0;
321         }
322 }
323
324
325 void
326 save_buffer(char *buffer, off_t bufferlength, int fd)
327 {
328         off_t ret;
329         ssize_t byteswritten;
330
331         if (fd <= 0 || bufferlength == 0)
332                 return;
333
334         if (bufferlength > SSIZE_MAX) {
335                 prt("fsx flaw: overflow in save_buffer\n");
336                 exit(67);
337         }
338         if (lite) {
339                 off_t size_by_seek = lseek(fd, (off_t)0, SEEK_END);
340                 if (size_by_seek == (off_t)-1)
341                         prterr("save_buffer: lseek eof");
342                 else if (bufferlength > size_by_seek) {
343                         warn("save_buffer: .fsxgood file too short... will"
344                                 "save 0x%llx bytes instead of 0x%llx\n",
345                                 (unsigned long long)size_by_seek,
346                                 (unsigned long long)bufferlength);
347                         bufferlength = size_by_seek;
348                 }
349         }
350
351         ret = lseek(fd, (off_t)0, SEEK_SET);
352         if (ret == (off_t)-1)
353                 prterr("save_buffer: lseek 0");
354
355         byteswritten = write(fd, buffer, (size_t)bufferlength);
356         if (byteswritten != bufferlength) {
357                 if (byteswritten == -1)
358                         prterr("save_buffer write");
359                 else
360                         warn("save_buffer: short write, 0x%x bytes instead"
361                                 "of 0x%llx\n",
362                              (unsigned)byteswritten,
363                              (unsigned long long)bufferlength);
364         }
365 }
366
367
368 void
369 report_failure(int status)
370 {
371         logdump();
372
373         if (fsxgoodfd) {
374                 if (good_buf) {
375                         save_buffer(good_buf, file_size, fsxgoodfd);
376                         prt("Correct content saved for comparison\n");
377                         prt("(maybe hexdump \"%s\" vs \"%s\")\n",
378                             fname, goodfile);
379                 }
380                 close(fsxgoodfd);
381         }
382         exit(status);
383 }
384
385
386 #define short_at(cp) ((unsigned short)((*((unsigned char *)(cp)) << 8) | \
387                                         *(((unsigned char *)(cp)) + 1)))
388
389 void
390 check_buffers(unsigned offset, unsigned size)
391 {
392         unsigned char c, t;
393         unsigned i = 0;
394         unsigned n = 0;
395         unsigned op = 0;
396         unsigned bad = 0;
397
398         if (memcmp(good_buf + offset, temp_buf, size) != 0) {
399                 prt("READ BAD DATA: offset = 0x%x, size = 0x%x\n",
400                     offset, size);
401                 prt("OFFSET\tGOOD\tBAD\tRANGE\n");
402                 while (size > 0) {
403                         c = good_buf[offset];
404                         t = temp_buf[i];
405                         if (c != t) {
406                                 if (n == 0) {
407                                         bad = short_at(&temp_buf[i]);
408                                         prt("%#07x\t%#06x\t%#06x", offset,
409                                             short_at(&good_buf[offset]), bad);
410                                         op = temp_buf[offset & 1 ? i+1 : i];
411                                 }
412                                 n++;
413                                 badoff = offset;
414                         }
415                         offset++;
416                         i++;
417                         size--;
418                 }
419                 if (n) {
420                         prt("\t%#7x\n", n);
421                         if (bad)
422                                 prt("operation# (mod 256) for the bad data"
423                                         "may be %u\n", ((unsigned)op & 0xff));
424                         else
425                                 prt("operation# (mod 256) for the bad data"
426                                         "unknown, check HOLE and EXTEND ops\n");
427                 } else
428                         prt("????????????????\n");
429                 report_failure(110);
430         }
431 }
432
433 struct test_file *
434 get_tf(void)
435 {
436         unsigned index = 0;
437
438         switch (fd_policy) {
439                 case FD_ROTATE:
440                         index = fd_last++;
441                         break;
442                 case FD_RANDOM:
443                         index = random();
444                         break;
445                 case FD_SINGLE:
446                         index = 0;
447                         break;
448                 default:
449                         prt("unknown policy");
450                         exit(1);
451                         break;
452         }
453         return &test_files[ index % num_test_files ];
454 }
455
456 void
457 assign_fd_policy(char *policy)
458 {
459         if (!strcmp(policy, "random"))
460                 fd_policy = FD_RANDOM;
461         else if (!strcmp(policy, "rotate"))
462                 fd_policy = FD_ROTATE;
463         else {
464                 prt("unknown -I policy: '%s'\n", policy);
465                 exit(1);
466         }
467 }
468
469 int
470 get_fd(void)
471 {
472         struct test_file *tf = get_tf();
473         return tf->fd;
474 }
475
/*
 * Return the part of path that follows its last '/', or path itself when it
 * contains no '/'.  The result points into path; nothing is allocated.
 */
static const char *my_basename(const char *path)
{
        const char *slash = strrchr(path, '/');

        /* Step past the separator; a post-increment would return the '/'. */
        return slash ? slash + 1 : path;
}
482
483 void
484 open_test_files(char **argv, int argc)
485 {
486         struct test_file *tf;
487         int i;
488
489         num_test_files = argc;
490         if (num_test_files == 1)
491                 fd_policy = FD_SINGLE;
492
493         test_files = calloc(num_test_files, sizeof(*test_files));
494         if (test_files == NULL) {
495                 prterr("reallocating space for test files");
496                 exit(1);
497         }
498
499         for (i = 0, tf = test_files; i < num_test_files; i++, tf++) {
500
501                 tf->path = argv[i];
502                 tf->fd = open(tf->path, O_RDWR|(lite ? 0 : O_CREAT|O_TRUNC)|
503                                 o_direct, 0666);
504                 if (tf->fd < 0) {
505                         prterr(tf->path);
506                         exit(91);
507                 }
508         }
509
510         if (quiet || fd_policy == FD_SINGLE)
511                 return;
512
513         for (i = 0, tf = test_files; i < num_test_files; i++, tf++)
514                 prt("fd %d: %s\n", i, tf->path);
515 }
516
517 void
518 close_test_files(void)
519 {
520         int i;
521         struct test_file *tf;
522
523         for (i = 0, tf = test_files; i < num_test_files; i++, tf++) {
524                 if (close(tf->fd)) {
525                         prterr("close");
526                         report_failure(99);
527                 }
528         }
529 }
530
531
532 void
533 check_size(void)
534 {
535         struct stat     statbuf;
536         off_t   size_by_seek;
537         int fd = get_fd();
538
539         if (fstat(fd, &statbuf)) {
540                 prterr("check_size: fstat");
541                 statbuf.st_size = -1;
542         }
543         size_by_seek = lseek(fd, (off_t)0, SEEK_END);
544         if (file_size != statbuf.st_size || file_size != size_by_seek) {
545                 prt("Size error: expected 0x%llx stat 0x%llx seek 0x%llx\n",
546                     (unsigned long long)file_size,
547                     (unsigned long long)statbuf.st_size,
548                     (unsigned long long)size_by_seek);
549                 report_failure(120);
550         }
551 }
552
553
/*
 * Check that ftruncate() can extend a file: truncate to 0, extend to
 * 100000 bytes, confirm the size with fstat(), then truncate back to 0.
 * Exits with status 1 when a truncate call fails and 130 when the file
 * was not extended.
 */
void
check_trunc_hack(void)
{
        struct stat st;
        int fd = get_fd();

        /* ftruncate(2)'s return value must be checked at every step */
        if (ftruncate(fd, (off_t)0) < 0) {
                prterr("trunc_hack: ftruncate(0)");
                exit(1);
        }
        if (ftruncate(fd, (off_t)100000) < 0) {
                prterr("trunc_hack: ftruncate(100000)");
                exit(1);
        }

        if (fstat(fd, &st) != 0) {
                prterr("trunc_hack: fstat");
                /* Make the size check below fail. */
                st.st_size = -1;
        }
        if (st.st_size != (off_t)100000) {
                prt("no extend on truncate! not posix!\n");
                exit(130);
        }

        if (ftruncate(fd, 0) < 0) {
                prterr("trunc_hack: ftruncate(0) (2nd call)");
                exit(1);
        }
}
582
583 void
584 output_line(struct test_file *tf, int op, unsigned offset,
585                 unsigned size, struct timeval *tv)
586 {
587         char *ops[] = {
588                 [OP_READ] = "read",
589                 [OP_WRITE] = "write",
590                 [OP_TRUNCATE] = "trunc from",
591                 [OP_MAPREAD] = "mapread",
592                 [OP_MAPWRITE] = "mapwrite",
593         };
594
595         /* W. */
596         if (!(!quiet && ((progressinterval &&
597                         testcalls % progressinterval == 0) ||
598                        (debug &&
599                         (monitorstart == -1 ||
600                          (offset + size > monitorstart &&
601                           (monitorend == -1 || offset <= monitorend)))))))
602                 return;
603
604         prt("%06lu%s %lu.%06lu %-10s %#08x %s %#08x\t(0x%x bytes)\n",
605                 testcalls, fill_tf_buf(tf), tv->tv_sec, tv->tv_usec,
606                 ops[op],
607                 offset, op == OP_TRUNCATE ? " to " : "thru",
608                 offset + size - 1, size);
609 }
610
611 void
612 doread(unsigned offset, unsigned size)
613 {
614         struct timeval t;
615         off_t ret;
616         unsigned iret;
617         struct test_file *tf = get_tf();
618         int fd = tf->fd;
619
620         offset -= offset % readbdy;
621         if (o_direct)
622                 size -= size % readbdy;
623         gettimeofday(&t, NULL);
624         if (size == 0) {
625                 if (!quiet && testcalls > simulatedopcount && !o_direct)
626                         prt("skipping zero size read\n");
627                 log4(OP_SKIPPED, OP_READ, offset, size, &t, tf);
628                 return;
629         }
630         if (size + offset > file_size) {
631                 if (!quiet && testcalls > simulatedopcount)
632                         prt("skipping seek/read past end of file\n");
633                 log4(OP_SKIPPED, OP_READ, offset, size, &t, tf);
634                 return;
635         }
636
637         log4(OP_READ, offset, size, 0, &t, tf);
638
639         if (testcalls <= simulatedopcount)
640                 return;
641
642         output_line(tf, OP_READ, offset, size, &t);
643
644         ret = lseek(fd, (off_t)offset, SEEK_SET);
645         if (ret == (off_t)-1) {
646                 prterr("doread: lseek");
647                 report_failure(140);
648         }
649         iret = read(fd, temp_buf, size);
650         if (!quiet && (debug > 1 &&
651                         (monitorstart == -1 ||
652                          (offset + size > monitorstart &&
653                           (monitorend == -1 || offset <= monitorend))))) {
654                 gettimeofday(&t, NULL);
655                 prt("       %lu.%06lu read done\n", t.tv_sec, t.tv_usec);
656         }
657         if (iret != size) {
658                 if (iret == -1)
659                         prterr("doread: read");
660                 else
661                         prt("short read: 0x%x bytes instead of 0x%x\n",
662                             iret, size);
663                 report_failure(141);
664         }
665         check_buffers(offset, size);
666 }
667
668
669 void
670 domapread(unsigned offset, unsigned size)
671 {
672         struct timeval t;
673         unsigned pg_offset;
674         unsigned map_size;
675         char    *p;
676         struct test_file *tf = get_tf();
677         int fd = tf->fd;
678
679         offset -= offset % readbdy;
680         gettimeofday(&t, NULL);
681         if (size == 0) {
682                 if (!quiet && testcalls > simulatedopcount)
683                         prt("skipping zero size read\n");
684                 log4(OP_SKIPPED, OP_MAPREAD, offset, size, &t, tf);
685                 return;
686         }
687         if (size + offset > file_size) {
688                 if (!quiet && testcalls > simulatedopcount)
689                         prt("skipping seek/read past end of file\n");
690                 log4(OP_SKIPPED, OP_MAPREAD, offset, size, &t, tf);
691                 return;
692         }
693
694         log4(OP_MAPREAD, offset, size, 0, &t, tf);
695
696         if (testcalls <= simulatedopcount)
697                 return;
698
699         output_line(tf, OP_MAPREAD, offset, size, &t);
700
701         pg_offset = offset & page_mask;
702         map_size  = pg_offset + size;
703
704         if ((p = mmap(0, map_size, PROT_READ, MAP_FILE | MAP_SHARED, fd,
705                       (off_t)(offset - pg_offset))) == MAP_FAILED) {
706                 prterr("domapread: mmap");
707                 report_failure(190);
708         }
709         if (!quiet && (debug > 1 &&
710                         (monitorstart == -1 ||
711                          (offset + size > monitorstart &&
712                           (monitorend == -1 || offset <= monitorend))))) {
713                 gettimeofday(&t, NULL);
714                 prt("       %lu.%06lu mmap done\n", t.tv_sec, t.tv_usec);
715         }
716         memcpy(temp_buf, p + pg_offset, size);
717         if (!quiet && (debug > 1 &&
718                         (monitorstart == -1 ||
719                          (offset + size > monitorstart &&
720                           (monitorend == -1 || offset <= monitorend))))) {
721                 gettimeofday(&t, NULL);
722                 prt("       %lu.%06lu memcpy done\n", t.tv_sec, t.tv_usec);
723         }
724         if (munmap(p, map_size) != 0) {
725                 prterr("domapread: munmap");
726                 report_failure(191);
727         }
728         if (!quiet && (debug > 1 &&
729                         (monitorstart == -1 ||
730                          (offset + size > monitorstart &&
731                           (monitorend == -1 || offset <= monitorend))))) {
732                 gettimeofday(&t, NULL);
733                 prt("       %lu.%06lu munmap done\n", t.tv_sec, t.tv_usec);
734         }
735
736         check_buffers(offset, size);
737 }
738
739
740 void
741 gendata(char *original_buf, char *good_buf, unsigned offset, unsigned size)
742 {
743         while (size--) {
744                 good_buf[offset] = testcalls % 256;
745                 if (offset % 2)
746                         good_buf[offset] += original_buf[offset];
747                 offset++;
748         }
749 }
750
751
752 void
753 dowrite(unsigned offset, unsigned size)
754 {
755         struct timeval t;
756         off_t ret;
757         unsigned iret;
758         struct test_file *tf = get_tf();
759         int fd = tf->fd;
760
761         offset -= offset % writebdy;
762         if (o_direct)
763                 size -= size % writebdy;
764         gettimeofday(&t, NULL);
765         if (size == 0) {
766                 if (!quiet && testcalls > simulatedopcount && !o_direct)
767                         prt("skipping zero size write\n");
768                 log4(OP_SKIPPED, OP_WRITE, offset, size, &t, tf);
769                 return;
770         }
771
772         log4(OP_WRITE, offset, size, file_size, &t, tf);
773
774         gendata(original_buf, good_buf, offset, size);
775         if (file_size < offset + size) {
776                 if (file_size < offset)
777                         memset(good_buf + file_size, '\0', offset - file_size);
778                 file_size = offset + size;
779                 if (lite) {
780                         warn("Lite file size bug in fsx!");
781                         report_failure(149);
782                 }
783         }
784
785         if (testcalls <= simulatedopcount)
786                 return;
787
788         output_line(tf, OP_WRITE, offset, size, &t);
789
790         ret = lseek(fd, (off_t)offset, SEEK_SET);
791         if (ret == (off_t)-1) {
792                 prterr("dowrite: lseek");
793                 report_failure(150);
794         }
795         iret = write(fd, good_buf + offset, size);
796         if (!quiet && (debug > 1 &&
797                         (monitorstart == -1 ||
798                          (offset + size > monitorstart &&
799                           (monitorend == -1 || offset <= monitorend))))) {
800                 gettimeofday(&t, NULL);
801                 prt("       %lu.%06lu write done\n", t.tv_sec, t.tv_usec);
802         }
803         if (iret != size) {
804                 if (iret == -1)
805                         prterr("dowrite: write");
806                 else
807                         prt("short write: 0x%x bytes instead of 0x%x\n",
808                             iret, size);
809                 report_failure(151);
810         }
811 }
812
813
814 void
815 domapwrite(unsigned offset, unsigned size)
816 {
817         struct timeval t;
818         unsigned pg_offset;
819         unsigned map_size;
820         off_t    cur_filesize;
821         char    *p;
822         struct test_file *tf = get_tf();
823         int fd = tf->fd;
824
825         offset -= offset % writebdy;
826         gettimeofday(&t, NULL);
827         if (size == 0) {
828                 if (!quiet && testcalls > simulatedopcount)
829                         prt("skipping zero size write\n");
830                 log4(OP_SKIPPED, OP_MAPWRITE, offset, size, &t, tf);
831                 return;
832         }
833         cur_filesize = file_size;
834
835         log4(OP_MAPWRITE, offset, size, 0, &t, tf);
836
837         gendata(original_buf, good_buf, offset, size);
838         if (file_size < offset + size) {
839                 if (file_size < offset)
840                         memset(good_buf + file_size, '\0', offset - file_size);
841                 file_size = offset + size;
842                 if (lite) {
843                         warn("Lite file size bug in fsx!");
844                         report_failure(200);
845                 }
846         }
847
848         if (testcalls <= simulatedopcount)
849                 return;
850
851         output_line(tf, OP_MAPWRITE, offset, size, &t);
852
853         if (file_size > cur_filesize) {
854                 if (ftruncate(fd, file_size) == -1) {
855                         prterr("domapwrite: ftruncate");
856                         exit(201);
857                 }
858                 if (!quiet && (debug > 1 &&
859                                (monitorstart == -1 ||
860                                 (offset + size > monitorstart &&
861                                  (monitorend == -1 || offset <= monitorend))))) {
862                         gettimeofday(&t, NULL);
863                         prt("       %lu.%06lu truncate done\n", t.tv_sec, t.tv_usec);
864         }
865         }
866         pg_offset = offset & page_mask;
867         map_size  = pg_offset + size;
868
869         if ((p = mmap(0, map_size, PROT_READ | PROT_WRITE, MAP_FILE|MAP_SHARED,
870                       fd, (off_t)(offset - pg_offset))) == MAP_FAILED) {
871                 prterr("domapwrite: mmap");
872                 report_failure(202);
873         }
874         if (!quiet && (debug > 1 &&
875                         (monitorstart == -1 ||
876                          (offset + size > monitorstart &&
877                           (monitorend == -1 || offset <= monitorend))))) {
878                 gettimeofday(&t, NULL);
879                 prt("       %lu.%06lu mmap done\n", t.tv_sec, t.tv_usec);
880         }
881         memcpy(p + pg_offset, good_buf + offset, size);
882         if (!quiet && (debug > 1 &&
883                         (monitorstart == -1 ||
884                          (offset + size > monitorstart &&
885                           (monitorend == -1 || offset <= monitorend))))) {
886                 gettimeofday(&t, NULL);
887                 prt("       %lu.%06lu memcpy done\n", t.tv_sec, t.tv_usec);
888         }
889         if (msync(p, map_size, 0) != 0) {
890                 prterr("domapwrite: msync");
891                 report_failure(203);
892         }
893         if (!quiet && (debug > 1 &&
894                         (monitorstart == -1 ||
895                          (offset + size > monitorstart &&
896                           (monitorend == -1 || offset <= monitorend))))) {
897                 gettimeofday(&t, NULL);
898                 prt("       %lu.%06lu msync done\n", t.tv_sec, t.tv_usec);
899         }
900         if (munmap(p, map_size) != 0) {
901                 prterr("domapwrite: munmap");
902                 report_failure(204);
903         }
904         if (!quiet && (debug > 1 &&
905                         (monitorstart == -1 ||
906                          (offset + size > monitorstart &&
907                           (monitorend == -1 || offset <= monitorend))))) {
908                 gettimeofday(&t, NULL);
909                 prt("       %lu.%06lu munmap done\n", t.tv_sec, t.tv_usec);
910         }
911 }
912
913
914 void
915 dotruncate(unsigned size)
916 {
917         struct timeval t;
918         int oldsize = file_size;
919         struct test_file *tf = get_tf();
920         int fd = tf->fd;
921
922         size -= size % truncbdy;
923         gettimeofday(&t, NULL);
924         if (size > biggest) {
925                 biggest = size;
926                 if (!quiet && testcalls > simulatedopcount)
927                         prt("truncating to largest ever: 0x%x\n", size);
928         }
929
930         log4(OP_TRUNCATE, size, (unsigned)file_size, 0, &t, tf);
931
932         if (size > file_size)
933                 memset(good_buf + file_size, '\0', size - file_size);
934         file_size = size;
935
936         if (testcalls <= simulatedopcount)
937                 return;
938
939         output_line(tf, OP_TRUNCATE, oldsize, size, &t);
940
941         if (ftruncate(fd, (off_t)size) == -1) {
942                 prt("ftruncate1: %x\n", size);
943                 prterr("dotruncate: ftruncate");
944                 report_failure(160);
945         }
946         if (!quiet && debug > 1) {
947                 gettimeofday(&t, NULL);
948                 prt("       %lu.%06lu trunc done\n", t.tv_sec, t.tv_usec);
949         }
950 }
951
952
953 void
954 writefileimage()
955 {
956         ssize_t iret;
957         int fd = get_fd();
958
959         if (lseek(fd, (off_t)0, SEEK_SET) == (off_t)-1) {
960                 prterr("writefileimage: lseek");
961                 report_failure(171);
962         }
963         iret = write(fd, good_buf, file_size);
964         if ((off_t)iret != file_size) {
965                 if (iret == -1)
966                         prterr("writefileimage: write");
967                 else
968                         prt("short write: 0x%lx bytes instead of 0x%llx\n",
969                             (unsigned long)iret,
970                             (unsigned long long)file_size);
971                 report_failure(172);
972         }
973         if (lite ? 0 : ftruncate(fd, file_size) == -1) {
974                 prt("ftruncate2: %llx\n", (unsigned long long)file_size);
975                 prterr("writefileimage: ftruncate");
976                 report_failure(173);
977         }
978 }
979
980
981 void
982 docloseopen(void)
983 {
984         struct timeval t;
985         struct test_file *tf = get_tf();
986
987         if (testcalls <= simulatedopcount)
988                 return;
989
990         gettimeofday(&t, NULL);
991         log4(OP_CLOSEOPEN, file_size, (unsigned)file_size, 0, &t, tf);
992
993         if (debug)
994                 prt("%06lu %lu.%06lu close/open\n", testcalls, t.tv_sec,
995                     t.tv_usec);
996         if (close(tf->fd)) {
997                 prterr("docloseopen: close");
998                 report_failure(180);
999         }
1000         if (!quiet && debug > 1) {
1001                 gettimeofday(&t, NULL);
1002                 prt("       %lu.%06lu close done\n", t.tv_sec, t.tv_usec);
1003         }
1004         tf->fd = open(tf->path, O_RDWR|o_direct, 0);
1005         if (tf->fd < 0) {
1006                 prterr("docloseopen: open");
1007                 report_failure(181);
1008         }
1009         if (!quiet && debug > 1) {
1010                 gettimeofday(&t, NULL);
1011                 prt("       %lu.%06lu open done\n", t.tv_sec, t.tv_usec);
1012         }
1013 }
1014
1015
1016 void
1017 test(void)
1018 {
1019         unsigned long   offset;
1020         unsigned long   size = maxoplen;
1021         unsigned long   rv = random();
1022         unsigned long   op = rv % (3 + !lite + mapped_writes);
1023
1024         /* turn off the map read if necessary */
1025
1026         if (op == 2 && !mapped_reads)
1027             op = 0;
1028
1029         if (simulatedopcount > 0 && testcalls == simulatedopcount)
1030                 writefileimage();
1031
1032         testcalls++;
1033
1034         if (debugstart > 0 && testcalls >= debugstart)
1035                 debug = 1;
1036
1037         if (!quiet && testcalls < simulatedopcount && testcalls % 100000 == 0)
1038                 prt("%lu...\n", testcalls);
1039
1040         /*
1041          * READ:        op = 0
1042          * WRITE:       op = 1
1043          * MAPREAD:     op = 2
1044          * TRUNCATE:    op = 3
1045          * MAPWRITE:    op = 3 or 4
1046          */
1047         if (lite ? 0 : op == 3 && (style & 1) == 0) /* vanilla truncate? */
1048                 dotruncate(random() % maxfilelen);
1049         else {
1050                 if (randomoplen)
1051                         size = random() % (maxoplen+1);
1052                 if (lite ? 0 : op == 3)
1053                         dotruncate(size);
1054                 else {
1055                         offset = random();
1056                         if (op == 1 || op == (lite ? 3 : 4)) {
1057                                 offset %= maxfilelen;
1058                                 if (offset + size > maxfilelen)
1059                                         size = maxfilelen - offset;
1060                                 if (op != 1)
1061                                         domapwrite(offset, size);
1062                                 else
1063                                         dowrite(offset, size);
1064                         } else {
1065                                 if (file_size)
1066                                         offset %= file_size;
1067                                 else
1068                                         offset = 0;
1069                                 if (offset + size > file_size)
1070                                         size = file_size - offset;
1071                                 if (op != 0)
1072                                         domapread(offset, size);
1073                                 else
1074                                         doread(offset, size);
1075                         }
1076                 }
1077         }
1078         if (sizechecks && testcalls > simulatedopcount)
1079                 check_size();
1080         if (closeprob && (rv >> 3) < (1 << 28) / closeprob)
1081                 docloseopen();
1082 }
1083
1084
1085 void
1086 cleanup(sig)
1087         int     sig;
1088 {
1089         if (sig)
1090                 prt("signal %d\n", sig);
1091         prt("testcalls = %lu\n", testcalls);
1092         exit(sig);
1093 }
1094
1095
/*
 * Print the command-line synopsis and per-option help to stdout, then
 * terminate the process with exit status 90.  Never returns.
 */
void
usage(void)
{
        fprintf(stdout, "usage: %s",
                "fsx [-dnqLOWRZ] [-b opnum] [-c Prob] [-l flen] [-m "
"start:end] [-o oplen] [-p progressinterval] [-r readbdy] [-s style] [-t "
"truncbdy] [-w writebdy] [-D startingop] [-N numops] [-P dirpath] [-S seed] "
"[ -I random|rotate ] fname [additional paths to fname..]\n"
"       -b opnum: beginning operation number (default 1)\n"
"       -c P: 1 in P chance of file close+open at each op (default infinity)\n"
"       -d: debug output for all operations [-d -d = more debugging]\n"
"       -l flen: the upper bound on file size (default 262144)\n"
"       -m start:end: monitor (print debug output) specified byte range "
"(default 0:infinity)\n"
"       -n: no verifications of file size\n"
"       -o oplen: the upper bound on operation size (default 65536)\n"
"       -p progressinterval: debug output at specified operation interval\n"
"       -q: quieter operation\n"
"       -r readbdy: 4096 would make reads page aligned (default 1)\n"
"       -s style: 1 gives smaller truncates (default 0)\n"
"       -t truncbdy: 4096 would make truncates page aligned (default 1)\n"
"       -w writebdy: 4096 would make writes page aligned (default 1)\n"
"       -D startingop: debug output starting at specified operation\n"
"       -L: fsxLite - no file creations & no file size changes\n"
"       -N numops: total # operations to do (default infinity)\n"
"       -O: use oplen (see -o flag) for every op (default random)\n"
"       -P dirpath: save .fsxlog and .fsxgood files in dirpath (default ./)\n"
"       -S seed: for random # generator (default 1) 0 gets timestamp\n"
"       -W: mapped write operations DISabled\n"
"       -R: read() system calls only (mapped reads disabled)\n"
"       -Z: O_DIRECT (use -R, -W, -r and -w too)\n"
"       -I: When multiple paths to the file are given each operation uses\n"
"           a different path.  Iterate through them in order with 'rotate'\n"
"           or choose them at 'random'.  (defaults to random)\n"
"       fname: this filename is REQUIRED (no default)\n");
        exit(90);
}
1133
1134
/*
 * Parse an integer with an optional one-letter size suffix.
 *
 * The number is read with strtol() using base 0, so decimal, octal
 * ("0...") and hexadecimal ("0x...") forms are accepted.  A directly
 * following suffix scales the value and is consumed:
 *      b/B  x 512      k/K  x 1024     m/M  x 1024*1024     w/W  x 4
 *
 * s: string to parse.
 * e: must be non-NULL; on return *e points at the first character that
 *    was not consumed (after the suffix, if one was recognized).
 *
 * Returns the scaled value.  Results that do not fit in an int are
 * clamped to INT_MAX / INT_MIN instead of being silently truncated or
 * overflowing.
 */
int
getnum(char *s, char **e)
{
        long value;
        long scale = 1;

        value = strtol(s, e, 0);

        switch (**e) {
        case 'b':
        case 'B':
                scale = 512;
                break;
        case 'k':
        case 'K':
                scale = 1024;
                break;
        case 'm':
        case 'M':
                scale = 1024 * 1024;
                break;
        case 'w':
        case 'W':
                scale = 4;
                break;
        default:
                break;
        }

        /* Only a recognized suffix is consumed. */
        if (scale != 1)
                *e = *e + 1;

        /* Range-check before multiplying so the product cannot overflow. */
        if (value > INT_MAX / scale)
                return INT_MAX;
        if (value < INT_MIN / scale)
                return INT_MIN;

        return (int)(value * scale);
}
1167
1168 int
1169 main(int argc, char **argv)
1170 {
1171         int     i, style, ch;
1172         char    *endp;
1173         int  dirpath = 0;
1174
1175         goodfile[0] = 0;
1176         logfile[0] = 0;
1177
1178         page_size = getpagesize();
1179         page_mask = page_size - 1;
1180
1181         setvbuf(stdout, (char *)0, _IOLBF, 0); /* line buffered stdout */
1182
1183         while ((ch = getopt(argc, argv,
1184                                 "b:c:dl:m:no:p:qr:s:t:w:D:I:LN:OP:RS:WZ"))
1185                != EOF)
1186                 switch (ch) {
1187                 case 'b':
1188                         simulatedopcount = getnum(optarg, &endp);
1189                         if (!quiet)
1190                                 fprintf(stdout, "Will begin at operation"
1191                                         "%ld\n",
1192                                         simulatedopcount);
1193                         if (simulatedopcount == 0)
1194                                 usage();
1195                         simulatedopcount -= 1;
1196                         break;
1197                 case 'c':
1198                         closeprob = getnum(optarg, &endp);
1199                         if (!quiet)
1200                                 fprintf(stdout,
1201                                         "Chance of close/open is 1 in %d\n",
1202                                         closeprob);
1203                         if (closeprob <= 0)
1204                                 usage();
1205                         break;
1206                 case 'd':
1207                         debug++;
1208                         break;
1209                 case 'l':
1210                         maxfilelen = getnum(optarg, &endp);
1211                         if (maxfilelen <= 0)
1212                                 usage();
1213                         break;
1214                 case 'm':
1215                         monitorstart = getnum(optarg, &endp);
1216                         if (monitorstart < 0)
1217                                 usage();
1218                         if (!endp || *endp++ != ':')
1219                                 usage();
1220                         monitorend = getnum(endp, &endp);
1221                         if (monitorend < 0)
1222                                 usage();
1223                         if (monitorend == 0)
1224                                 monitorend = -1; /* aka infinity */
1225                         debug = 1;
1226                 case 'n':
1227                         sizechecks = 0;
1228                         break;
1229                 case 'o':
1230                         maxoplen = getnum(optarg, &endp);
1231                         if (maxoplen <= 0)
1232                                 usage();
1233                         break;
1234                 case 'p':
1235                         progressinterval = getnum(optarg, &endp);
1236                         if (progressinterval < 0)
1237                                 usage();
1238                         break;
1239                 case 'q':
1240                         quiet = 1;
1241                         break;
1242                 case 'r':
1243                         readbdy = getnum(optarg, &endp);
1244                         if (readbdy <= 0)
1245                                 usage();
1246                         break;
1247                 case 's':
1248                         style = getnum(optarg, &endp);
1249                         if (style < 0 || style > 1)
1250                                 usage();
1251                         break;
1252                 case 't':
1253                         truncbdy = getnum(optarg, &endp);
1254                         if (truncbdy <= 0)
1255                                 usage();
1256                         break;
1257                 case 'w':
1258                         writebdy = getnum(optarg, &endp);
1259                         if (writebdy <= 0)
1260                                 usage();
1261                         break;
1262                 case 'D':
1263                         debugstart = getnum(optarg, &endp);
1264                         if (debugstart < 1)
1265                                 usage();
1266                         break;
1267                 case 'I':
1268                         assign_fd_policy(optarg);
1269                         break;
1270                 case 'L':
1271                         lite = 1;
1272                         break;
1273                 case 'N':
1274                         numops = getnum(optarg, &endp);
1275                         if (numops < 0)
1276                                 usage();
1277                         break;
1278                 case 'O':
1279                         randomoplen = 0;
1280                         break;
1281                 case 'P':
1282                         strncpy(goodfile, optarg, sizeof(goodfile) - 1);
1283                         strcat(goodfile, "/");
1284                         strncpy(logfile, optarg, sizeof(logfile) - 1);
1285                         strcat(logfile, "/");
1286                         dirpath = 1;
1287                         break;
1288                 case 'R':
1289                         mapped_reads = 0;
1290                         break;
1291                 case 'S':
1292                         seed = getnum(optarg, &endp);
1293                         if (seed == 0)
1294                                 seed = time(0) % 10000;
1295                         if (!quiet)
1296                                 fprintf(stdout, "Seed set to %d\n", seed);
1297                         if (seed < 0)
1298                                 usage();
1299                         break;
1300                 case 'W':
1301                         mapped_writes = 0;
1302                         if (!quiet)
1303                                 fprintf(stdout, "mapped writes DISABLED\n");
1304                         break;
1305                 case 'Z':
1306                         o_direct = O_DIRECT;
1307                         break;
1308
1309                 default:
1310                         usage();
1311                         /* NOTREACHED */
1312                 }
1313         argc -= optind;
1314         argv += optind;
1315         if (argc < 1)
1316                 usage();
1317         fname = argv[0];
1318
1319         signal(SIGHUP,  cleanup);
1320         signal(SIGINT,  cleanup);
1321         signal(SIGPIPE, cleanup);
1322         signal(SIGALRM, cleanup);
1323         signal(SIGTERM, cleanup);
1324         signal(SIGXCPU, cleanup);
1325         signal(SIGXFSZ, cleanup);
1326         signal(SIGVTALRM,       cleanup);
1327         signal(SIGUSR1, cleanup);
1328         signal(SIGUSR2, cleanup);
1329
1330         initstate(seed, state, 256);
1331         setstate(state);
1332
1333         open_test_files(argv, argc);
1334
1335         strncat(goodfile, dirpath ? my_basename(fname) : fname, 256);
1336         strcat (goodfile, ".fsxgood");
1337         fsxgoodfd = open(goodfile, O_RDWR|O_CREAT|O_TRUNC, 0666);
1338         if (fsxgoodfd < 0) {
1339                 prterr(goodfile);
1340                 exit(92);
1341         }
1342         strncat(logfile, dirpath ? my_basename(fname) : fname, 256);
1343         strcat (logfile, ".fsxlog");
1344         fsxlogf = fopen(logfile, "w");
1345         if (fsxlogf == NULL) {
1346                 prterr(logfile);
1347                 exit(93);
1348         }
1349         if (lite) {
1350                 off_t ret;
1351                 int fd = get_fd();
1352                 file_size = maxfilelen = lseek(fd, (off_t)0, SEEK_END);
1353                 if (file_size == (off_t)-1) {
1354                         prterr(fname);
1355                         warn("main: lseek eof");
1356                         exit(94);
1357                 }
1358                 ret = lseek(fd, (off_t)0, SEEK_SET);
1359                 if (ret == (off_t)-1) {
1360                         prterr(fname);
1361                         warn("main: lseek 0");
1362                         exit(95);
1363                 }
1364         }
1365         original_buf = (char *) malloc(maxfilelen);
1366         for (i = 0; i < maxfilelen; i++)
1367                 original_buf[i] = random() % 256;
1368         if (o_direct) {
1369                 int ret;
1370
1371                 ret = posix_memalign((void **)&good_buf, writebdy, maxfilelen);
1372                 if (ret) {
1373                         prt("main: posix_memalign failed: %s\n", strerror(ret));
1374                         exit(96);
1375                 }
1376
1377                 ret = posix_memalign((void **)&temp_buf, readbdy, maxoplen);
1378                 if (ret) {
1379                         prt("main: posix_memalign failed: %s\n", strerror(ret));
1380                         exit(97);
1381                 }
1382         } else {
1383                 good_buf = malloc(maxfilelen);
1384                 if (!good_buf) {
1385                         prt("malloc failed.\n");
1386                         exit(98);
1387                 }
1388
1389                 temp_buf = malloc(maxoplen);
1390                 if (!temp_buf) {
1391                         prt("malloc failed.\n");
1392                         exit(99);
1393                 }
1394         }
1395         memset(good_buf, 0, maxfilelen);
1396         memset(temp_buf, 0, maxoplen);
1397
1398         if (lite) {     /* zero entire existing file */
1399                 ssize_t written;
1400                 int fd = get_fd();
1401
1402                 written = write(fd, good_buf, (size_t)maxfilelen);
1403                 if (written != maxfilelen) {
1404                         if (written == -1) {
1405                                 prterr(fname);
1406                                 warn("main: error on write");
1407                         } else
1408                                 warn("main: short write, 0x%x bytes instead"
1409                                         "of 0x%x\n",
1410                                      (unsigned)written, maxfilelen);
1411                         exit(98);
1412                 }
1413         } else
1414                 check_trunc_hack();
1415
1416         while (numops == -1 || numops--)
1417                 test();
1418
1419         close_test_files();
1420         prt("All operations completed A-OK!\n");
1421
1422         exit(0);
1423         return 0;
1424 }