1907036eb394cf257f1960cbe5003e1b005ced93
[xfstests-dev.git] / ltp / fsx.c
1 /*
2  *      Copyright (C) 1991, NeXT Computer, Inc.  All Rights Reserverd.
3  *
4  *      File:   fsx.c
5  *      Author: Avadis Tevanian, Jr.
6  *
7  *      File system exerciser. 
8  *
9  *      Rewritten 8/98 by Conrad Minshall.
10  *
11  *      Small changes to work under Linux -- davej.
12  *
13  *      Checks for mmap last-page zero fill.
14  */
15
16 #include "global.h"
17
18 #include <limits.h>
19 #include <time.h>
20 #include <strings.h>
21 #include <sys/file.h>
22 #include <sys/mman.h>
23 #include <stdbool.h>
24 #ifdef HAVE_ERR_H
25 #include <err.h>
26 #endif
27 #include <signal.h>
28 #include <stdio.h>
29 #include <stddef.h>
30 #include <stdlib.h>
31 #include <string.h>
32 #include <stdarg.h>
33 #include <errno.h>
34 #ifdef AIO
35 #include <libaio.h>
36 #endif
37
38 #ifndef MAP_FILE
39 # define MAP_FILE 0
40 #endif
41
42 #define NUMPRINTCOLUMNS 32      /* # columns of data to print on each line */
43
44 /* Operation flags */
45
/* Bit flags attached to a log entry; they are OR-ed together in log_entry.flags. */
enum opflags {
        FL_NONE         = 0,    /* no flag set */
        FL_SKIPPED      = 1,    /* logdump() reports the entry as "SKIPPED (no operation)" */
        FL_CLOSE_OPEN   = 2,    /* added by log4()/log5() while closeopen is set */
        FL_KEEP_SIZE    = 4     /* written to the ops file as "keep_size" */
};
47
48 /*
49  *      A log entry is an operation and a bunch of arguments.
50  */
51
52 struct log_entry {
53         int     operation;
54         int     nr_args;
55         int     args[4];
56         enum opflags flags;
57 };
58
59 #define LOGSIZE 10000
60
61 struct log_entry        oplog[LOGSIZE]; /* the log */
62 int                     logptr = 0;     /* current position in log */
63 int                     logcount = 0;   /* total ops */
64
65 /*
66  * The operation matrix is complex due to conditional execution of different
67  * features. Hence when we come to deciding what operation to run, we need to
68  * be careful in how we select the different operations. The active operations
69  * are mapped to numbers as follows:
70  *
71  *                      lite    !lite   integrity
72  * READ:                0       0       0
73  * WRITE:               1       1       1
74  * MAPREAD:             2       2       2
75  * MAPWRITE:            3       3       3
76  * TRUNCATE:            -       4       4
77  * FALLOCATE:           -       5       5
78  * PUNCH HOLE:          -       6       6
79  * ZERO RANGE:          -       7       7
80  * COLLAPSE RANGE:      -       8       8
 * INSERT RANGE:        -       9       9
 * FSYNC:               -       -       10
82  *
83  * When mapped read/writes are disabled, they are simply converted to normal
84  * reads and writes. When fallocate/fpunch calls are disabled, they are
85  * skipped.
86  *
87  * Because of the "lite" version, we also need to have different "maximum
88  * operation" defines to allow the ops to be selected correctly based on the
89  * mode being run.
90  */
91
/*
 * Operation codes.  The OP_MAX_* enumerators are not operations themselves:
 * each one is the count of codes available in that mode, and the first code
 * of the next group is defined to start at the same value.
 */
enum {
        /* common operations */
        OP_READ = 0,
        OP_WRITE,
        OP_MAPREAD,
        OP_MAPWRITE,
        OP_MAX_LITE,                    /* number of "lite" operations */

        /* !lite operations */
        OP_TRUNCATE = OP_MAX_LITE,
        OP_FALLOCATE,
        OP_PUNCH_HOLE,
        OP_ZERO_RANGE,
        OP_COLLAPSE_RANGE,
        OP_INSERT_RANGE,
        OP_MAX_FULL,                    /* number of !lite operations */

        /* integrity operations */
        OP_FSYNC = OP_MAX_FULL,
        OP_MAX_INTEGRITY,               /* number of integrity-mode operations */
};
113
114 #undef PAGE_SIZE
115 #define PAGE_SIZE       getpagesize()
116 #undef PAGE_MASK
117 #define PAGE_MASK       (PAGE_SIZE - 1)
118
119 char    *original_buf;                  /* a pointer to the original data */
120 char    *good_buf;                      /* a pointer to the correct data */
121 char    *temp_buf;                      /* a pointer to the current data */
122 char    *fname;                         /* name of our test file */
123 char    *bname;                         /* basename of our test file */
124 char    *logdev;                        /* -i flag */
125 char    *logid;                         /* -j flag */
126 char    dname[1024];                    /* -P flag */
127 char    goodfile[PATH_MAX];
128 int     dirpath = 0;                    /* -P flag */
129 int     fd;                             /* fd for our test file */
130
131 blksize_t       block_size = 0;
132 off_t           file_size = 0;
133 off_t           biggest = 0;
134 unsigned long   testcalls = 0;          /* calls to function "test" */
135
136 unsigned long   simulatedopcount = 0;   /* -b flag */
137 int     closeprob = 0;                  /* -c flag */
138 int     debug = 0;                      /* -d flag */
139 unsigned long   debugstart = 0;         /* -D flag */
140 char    filldata = 0;                   /* -g flag */
141 int     flush = 0;                      /* -f flag */
142 int     do_fsync = 0;                   /* -y flag */
143 unsigned long   maxfilelen = 256 * 1024;        /* -l flag */
144 int     sizechecks = 1;                 /* -n flag disables them */
145 int     maxoplen = 64 * 1024;           /* -o flag */
146 int     quiet = 0;                      /* -q flag */
147 unsigned long progressinterval = 0;     /* -p flag */
148 int     readbdy = 1;                    /* -r flag */
149 int     style = 0;                      /* -s flag */
150 int     prealloc = 0;                   /* -x flag */
151 int     truncbdy = 1;                   /* -t flag */
152 int     writebdy = 1;                   /* -w flag */
153 long    monitorstart = -1;              /* -m flag */
154 long    monitorend = -1;                /* -m flag */
155 int     lite = 0;                       /* -L flag */
156 long    numops = -1;                    /* -N flag */
157 int     randomoplen = 1;                /* -O flag disables it */
158 int     seed = 1;                       /* -S flag */
159 int     mapped_writes = 1;              /* -W flag disables */
160 int     fallocate_calls = 1;            /* -F flag disables */
161 int     keep_size_calls = 1;            /* -K flag disables */
162 int     punch_hole_calls = 1;           /* -H flag disables */
163 int     zero_range_calls = 1;           /* -z flag disables */
164 int     collapse_range_calls = 1;       /* -C flag disables */
165 int     insert_range_calls = 1;         /* -I flag disables */
166 int     mapped_reads = 1;               /* -R flag disables it */
167 int     check_file = 0;                 /* -X flag enables */
168 int     integrity = 0;                  /* -i flag */
169 int     fsxgoodfd = 0;
170 int     o_direct;                       /* -Z */
171 int     aio = 0;
172 int     mark_nr = 0;
173
174 int page_size;
175 int page_mask;
176 int mmap_mask;
177 #ifdef AIO
178 int aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset);
179 #define READ 0
180 #define WRITE 1
181 #define fsxread(a,b,c,d)        aio_rw(READ, a,b,c,d)
182 #define fsxwrite(a,b,c,d)       aio_rw(WRITE, a,b,c,d)
183 #else
184 #define fsxread(a,b,c,d)        read(a,b,c)
185 #define fsxwrite(a,b,c,d)       write(a,b,c)
186 #endif
187
188 const char *replayops = NULL;
189 const char *recordops = NULL;
190 FILE *  fsxlogf = NULL;
191 FILE *  replayopsf = NULL;
192 char opsfile[PATH_MAX];
193 int badoff = -1;
194 int closeopen = 0;
195
/*
 * Round ptr up to the next multiple of align, then add offset bytes.
 * The mask arithmetic only yields a true multiple when align is a power
 * of two.
 */
static void *round_ptr_up(void *ptr, unsigned long align, unsigned long offset)
{
        unsigned long mask = align - 1;
        unsigned long addr = (unsigned long)ptr;

        addr = (addr + mask) & ~mask;
        return (void *)(addr + offset);
}
204
205 void
206 vwarnc(int code, const char *fmt, va_list ap)
207 {
208         if (logid)
209                 fprintf(stderr, "%s: ", logid);
210         fprintf(stderr, "fsx: ");
211         if (fmt != NULL) {
212                 vfprintf(stderr, fmt, ap);
213                 fprintf(stderr, ": ");
214         }
215         fprintf(stderr, "%s\n", strerror(code));
216 }
217
/*
 * printf-style warning on stderr; the description of the current errno
 * is appended by vwarnc().
 */
void
warn(const char * fmt, ...)
{
        va_list args;

        va_start(args, fmt);
        vwarnc(errno, fmt, args);
        va_end(args);
}
225
226 void
227 prt(const char *fmt, ...)
228 {
229         va_list args;
230
231         if (logid)
232                 fprintf(stdout, "%s: ", logid);
233         va_start(args, fmt);
234         vfprintf(stdout, fmt, args);
235         va_end(args);
236         if (fsxlogf) {
237                 va_start(args, fmt);
238                 vfprintf(fsxlogf, fmt, args);
239                 va_end(args);
240         }
241 }
242
/*
 * Report the current errno through prt() as "<prefix>: <strerror>\n".
 *
 * prefix may be NULL, in which case only the error text is printed.  The
 * NULL case is handled with its own format string because handing a null
 * pointer to a "%s" conversion is undefined behaviour.
 */
void
prterr(const char *prefix)
{
        if (prefix != NULL)
                prt("%s: %s\n", prefix, strerror(errno));
        else
                prt("%s\n", strerror(errno));
}
248
249
250 static const char *op_names[] = {
251         [OP_READ] = "read",
252         [OP_WRITE] = "write",
253         [OP_MAPREAD] = "mapread",
254         [OP_MAPWRITE] = "mapwrite",
255         [OP_TRUNCATE] = "truncate",
256         [OP_FALLOCATE] = "fallocate",
257         [OP_PUNCH_HOLE] = "punch_hole",
258         [OP_ZERO_RANGE] = "zero_range",
259         [OP_COLLAPSE_RANGE] = "collapse_range",
260         [OP_INSERT_RANGE] = "insert_range",
261         [OP_FSYNC] = "fsync",
262 };
263
264 static const char *op_name(int operation)
265 {
266         if (operation >= 0 &&
267             operation < sizeof(op_names) / sizeof(op_names[0]))
268                 return op_names[operation];
269         return NULL;
270 }
271
272 static int op_code(const char *name)
273 {
274         int i;
275
276         for (i = 0; i < sizeof(op_names) / sizeof(op_names[0]); i++)
277                 if (op_names[i] && strcmp(name, op_names[i]) == 0)
278                         return i;
279         return -1;
280 }
281
282 void
283 log5(int operation, int arg0, int arg1, int arg2, enum opflags flags)
284 {
285         struct log_entry *le;
286
287         le = &oplog[logptr];
288         le->operation = operation;
289         if (closeopen)
290                 flags |= FL_CLOSE_OPEN;
291         le->args[0] = arg0;
292         le->args[1] = arg1;
293         le->args[2] = arg2;
294         le->args[3] = file_size;
295         le->nr_args = 4;
296         le->flags = flags;
297         logptr++;
298         logcount++;
299         if (logptr >= LOGSIZE)
300                 logptr = 0;
301 }
302
303 void
304 log4(int operation, int arg0, int arg1, enum opflags flags)
305 {
306         struct log_entry *le;
307
308         le = &oplog[logptr];
309         le->operation = operation;
310         if (closeopen)
311                 flags |= FL_CLOSE_OPEN;
312         le->args[0] = arg0;
313         le->args[1] = arg1;
314         le->args[2] = file_size;
315         le->nr_args = 3;
316         le->flags = flags;
317         logptr++;
318         logcount++;
319         if (logptr >= LOGSIZE)
320                 logptr = 0;
321 }
322
323
324 void
325 logdump(void)
326 {
327         FILE    *logopsf;
328         int     i, count, down;
329         struct log_entry        *lp;
330
331         prt("LOG DUMP (%d total operations):\n", logcount);
332
333         logopsf = fopen(opsfile, "w");
334         if (!logopsf)
335                 prterr(opsfile);
336
337         if (logcount < LOGSIZE) {
338                 i = 0;
339                 count = logcount;
340         } else {
341                 i = logptr;
342                 count = LOGSIZE;
343         }
344         for ( ; count > 0; count--) {
345                 bool overlap;
346                 int opnum;
347
348                 opnum = i+1 + (logcount/LOGSIZE)*LOGSIZE;
349                 prt("%d(%3d mod 256): ", opnum, opnum%256);
350                 lp = &oplog[i];
351
352                 overlap = badoff >= lp->args[0] &&
353                           badoff < lp->args[0] + lp->args[1];
354
355                 if (lp->flags & FL_SKIPPED) {
356                         prt("SKIPPED (no operation)");
357                         goto skipped;
358                 }
359
360                 switch (lp->operation) {
361                 case OP_MAPREAD:
362                         prt("MAPREAD  0x%x thru 0x%x\t(0x%x bytes)",
363                             lp->args[0], lp->args[0] + lp->args[1] - 1,
364                             lp->args[1]);
365                         if (overlap)
366                                 prt("\t***RRRR***");
367                         break;
368                 case OP_MAPWRITE:
369                         prt("MAPWRITE 0x%x thru 0x%x\t(0x%x bytes)",
370                             lp->args[0], lp->args[0] + lp->args[1] - 1,
371                             lp->args[1]);
372                         if (overlap)
373                                 prt("\t******WWWW");
374                         break;
375                 case OP_READ:
376                         prt("READ     0x%x thru 0x%x\t(0x%x bytes)",
377                             lp->args[0], lp->args[0] + lp->args[1] - 1,
378                             lp->args[1]);
379                         if (overlap)
380                                 prt("\t***RRRR***");
381                         break;
382                 case OP_WRITE:
383                         prt("WRITE    0x%x thru 0x%x\t(0x%x bytes)",
384                             lp->args[0], lp->args[0] + lp->args[1] - 1,
385                             lp->args[1]);
386                         if (lp->args[0] > lp->args[2])
387                                 prt(" HOLE");
388                         else if (lp->args[0] + lp->args[1] > lp->args[2])
389                                 prt(" EXTEND");
390                         overlap = (badoff >= lp->args[0] ||
391                                    badoff >=lp->args[2]) &&
392                                   badoff < lp->args[0] + lp->args[1];
393                         if (overlap)
394                                 prt("\t***WWWW");
395                         break;
396                 case OP_TRUNCATE:
397                         down = lp->args[1] < lp->args[2];
398                         prt("TRUNCATE %s\tfrom 0x%x to 0x%x",
399                             down ? "DOWN" : "UP", lp->args[2], lp->args[1]);
400                         overlap = badoff >= lp->args[1 + !down] &&
401                                   badoff < lp->args[1 + !!down];
402                         if (overlap)
403                                 prt("\t******WWWW");
404                         break;
405                 case OP_FALLOCATE:
406                         /* 0: offset 1: length 2: where alloced */
407                         prt("FALLOC   0x%x thru 0x%x\t(0x%x bytes) ",
408                                 lp->args[0], lp->args[0] + lp->args[1],
409                                 lp->args[1]);
410                         if (lp->args[0] + lp->args[1] <= lp->args[2])
411                                 prt("INTERIOR");
412                         else if (lp->flags & FL_KEEP_SIZE)
413                                 prt("PAST_EOF");
414                         else
415                                 prt("EXTENDING");
416                         if (overlap)
417                                 prt("\t******FFFF");
418                         break;
419                 case OP_PUNCH_HOLE:
420                         prt("PUNCH    0x%x thru 0x%x\t(0x%x bytes)",
421                             lp->args[0], lp->args[0] + lp->args[1] - 1,
422                             lp->args[1]);
423                         if (overlap)
424                                 prt("\t******PPPP");
425                         break;
426                 case OP_ZERO_RANGE:
427                         prt("ZERO     0x%x thru 0x%x\t(0x%x bytes)",
428                             lp->args[0], lp->args[0] + lp->args[1] - 1,
429                             lp->args[1]);
430                         if (overlap)
431                                 prt("\t******ZZZZ");
432                         break;
433                 case OP_COLLAPSE_RANGE:
434                         prt("COLLAPSE 0x%x thru 0x%x\t(0x%x bytes)",
435                             lp->args[0], lp->args[0] + lp->args[1] - 1,
436                             lp->args[1]);
437                         if (overlap)
438                                 prt("\t******CCCC");
439                         break;
440                 case OP_INSERT_RANGE:
441                         prt("INSERT 0x%x thru 0x%x\t(0x%x bytes)",
442                             lp->args[0], lp->args[0] + lp->args[1] - 1,
443                             lp->args[1]);
444                         if (overlap)
445                                 prt("\t******IIII");
446                         break;
447                 case OP_FSYNC:
448                         prt("FSYNC");
449                         break;
450                 default:
451                         prt("BOGUS LOG ENTRY (operation code = %d)!",
452                             lp->operation);
453                         continue;
454                 }
455
456             skipped:
457                 if (lp->flags & FL_CLOSE_OPEN)
458                         prt("\n\t\tCLOSE/OPEN");
459                 prt("\n");
460                 i++;
461                 if (i == LOGSIZE)
462                         i = 0;
463
464                 if (logopsf) {
465                         int j;
466
467                         if (lp->flags & FL_SKIPPED)
468                                 fprintf(logopsf, "skip ");
469                         fprintf(logopsf, "%s", op_name(lp->operation));
470                         for (j = 0; j < lp->nr_args; j++)
471                                 fprintf(logopsf, " 0x%x", lp->args[j]);
472                         if (lp->flags & FL_KEEP_SIZE)
473                                 fprintf(logopsf, " keep_size");
474                         if (lp->flags & FL_CLOSE_OPEN)
475                                 fprintf(logopsf, " close_open");
476                         if (overlap)
477                                 fprintf(logopsf, " *");
478                         fprintf(logopsf, "\n");
479                 }
480         }
481
482         if (logopsf) {
483                 if (fclose(logopsf) != 0)
484                         prterr(opsfile);
485                 else
486                         prt("Log of operations saved to \"%s\"; "
487                             "replay with --replay-ops\n",
488                             opsfile);
489         }
490 }
491
492
493 void
494 save_buffer(char *buffer, off_t bufferlength, int fd)
495 {
496         off_t ret;
497         ssize_t byteswritten;
498
499         if (fd <= 0 || bufferlength == 0)
500                 return;
501
502         if (bufferlength > SSIZE_MAX) {
503                 prt("fsx flaw: overflow in save_buffer\n");
504                 exit(67);
505         }
506         if (lite) {
507                 off_t size_by_seek = lseek(fd, (off_t)0, SEEK_END);
508                 if (size_by_seek == (off_t)-1)
509                         prterr("save_buffer: lseek eof");
510                 else if (bufferlength > size_by_seek) {
511                         warn("save_buffer: .fsxgood file too short... will save 0x%llx bytes instead of 0x%llx\n", (unsigned long long)size_by_seek,
512                              (unsigned long long)bufferlength);
513                         bufferlength = size_by_seek;
514                 }
515         }
516
517         ret = lseek(fd, (off_t)0, SEEK_SET);
518         if (ret == (off_t)-1)
519                 prterr("save_buffer: lseek 0");
520         
521         byteswritten = write(fd, buffer, (size_t)bufferlength);
522         if (byteswritten != bufferlength) {
523                 if (byteswritten == -1)
524                         prterr("save_buffer write");
525                 else
526                         warn("save_buffer: short write, 0x%x bytes instead of 0x%llx\n",
527                              (unsigned)byteswritten,
528                              (unsigned long long)bufferlength);
529         }
530 }
531
532
533 void
534 report_failure(int status)
535 {
536         logdump();
537         
538         if (fsxgoodfd) {
539                 if (good_buf) {
540                         save_buffer(good_buf, file_size, fsxgoodfd);
541                         prt("Correct content saved for comparison\n");
542                         prt("(maybe hexdump \"%s\" vs \"%s\")\n",
543                             fname, goodfile);
544                 }
545                 close(fsxgoodfd);
546         }
547         exit(status);
548 }
549
550
/*
 * 16-bit value built from the two bytes at cp, first byte most significant.
 * cp is cast to a byte pointer, so an integer address is accepted too.
 * Note that the byte at cp + 1 is always read.
 */
#define short_at(cp) \
        ((unsigned short)((((unsigned char *)(cp))[0] << 8) | \
                          ((unsigned char *)(cp))[1]))
553
554 void
555 mark_log(void)
556 {
557         char command[256];
558         int ret;
559
560         snprintf(command, 256, "dmsetup message %s 0 mark %s.mark%d", logdev,
561                  bname, mark_nr);
562         ret = system(command);
563         if (ret) {
564                 prterr("dmsetup mark failed");
565                 exit(211);
566         }
567 }
568
569 void
570 dump_fsync_buffer(void)
571 {
572         char fname_buffer[PATH_MAX];
573         int good_fd;
574
575         if (!good_buf)
576                 return;
577
578         snprintf(fname_buffer, sizeof(fname_buffer), "%s%s.mark%d", dname,
579                  bname, mark_nr);
580         good_fd = open(fname_buffer, O_WRONLY|O_CREAT|O_TRUNC, 0666);
581         if (good_fd < 0) {
582                 prterr(fname_buffer);
583                 exit(212);
584         }
585
586         save_buffer(good_buf, file_size, good_fd);
587         close(good_fd);
588         prt("Dumped fsync buffer to %s\n", fname_buffer + dirpath);
589 }
590
591 void
592 check_buffers(char *buf, unsigned offset, unsigned size)
593 {
594         unsigned char c, t;
595         unsigned i = 0;
596         unsigned n = 0;
597         unsigned op = 0;
598         unsigned bad = 0;
599
600         if (memcmp(good_buf + offset, buf, size) != 0) {
601                 prt("READ BAD DATA: offset = 0x%x, size = 0x%x, fname = %s\n",
602                     offset, size, fname);
603                 prt("OFFSET\tGOOD\tBAD\tRANGE\n");
604                 while (size > 0) {
605                         c = good_buf[offset];
606                         t = buf[i];
607                         if (c != t) {
608                                 if (n < 16) {
609                                         bad = short_at(&buf[i]);
610                                         prt("0x%05x\t0x%04x\t0x%04x", offset,
611                                             short_at(&good_buf[offset]), bad);
612                                         op = buf[offset & 1 ? i+1 : i];
613                                         prt("\t0x%05x\n", n);
614                                         if (op)
615                                                 prt("operation# (mod 256) for "
616                                                   "the bad data may be %u\n",
617                                                 ((unsigned)op & 0xff));
618                                         else
619                                                 prt("operation# (mod 256) for "
620                                                   "the bad data unknown, check"
621                                                   " HOLE and EXTEND ops\n");
622                                 }
623                                 n++;
624                                 badoff = offset;
625                         }
626                         offset++;
627                         i++;
628                         size--;
629                 }
630                 report_failure(110);
631         }
632 }
633
634
635 void
636 check_size(void)
637 {
638         struct stat     statbuf;
639         off_t   size_by_seek;
640
641         if (fstat(fd, &statbuf)) {
642                 prterr("check_size: fstat");
643                 statbuf.st_size = -1;
644         }
645         size_by_seek = lseek(fd, (off_t)0, SEEK_END);
646         if (file_size != statbuf.st_size || file_size != size_by_seek) {
647                 prt("Size error: expected 0x%llx stat 0x%llx seek 0x%llx\n",
648                     (unsigned long long)file_size,
649                     (unsigned long long)statbuf.st_size,
650                     (unsigned long long)size_by_seek);
651                 report_failure(120);
652         }
653 }
654
655
656 void
657 check_trunc_hack(void)
658 {
659         struct stat statbuf;
660         off_t offset = file_size + (off_t)100000;
661
662         if (ftruncate(fd, file_size))
663                 goto ftruncate_err;
664         if (ftruncate(fd, offset))
665                 goto ftruncate_err;
666         fstat(fd, &statbuf);
667         if (statbuf.st_size != offset) {
668                 prt("no extend on truncate! not posix!\n");
669                 exit(130);
670         }
671         if (ftruncate(fd, file_size)) {
672 ftruncate_err:
673                 prterr("check_trunc_hack: ftruncate");
674                 exit(131);
675         }
676 }
677
678 void
679 doflush(unsigned offset, unsigned size)
680 {
681         unsigned pg_offset;
682         unsigned map_size;
683         char    *p;
684
685         if (o_direct == O_DIRECT)
686                 return;
687
688         pg_offset = offset & mmap_mask;
689         map_size  = pg_offset + size;
690
691         if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
692                               MAP_FILE | MAP_SHARED, fd,
693                               (off_t)(offset - pg_offset))) == (char *)-1) {
694                 prterr("doflush: mmap");
695                 report_failure(202);
696         }
697         if (msync(p, map_size, MS_INVALIDATE) != 0) {
698                 prterr("doflush: msync");
699                 report_failure(203);
700         }
701         if (munmap(p, map_size) != 0) {
702                 prterr("doflush: munmap");
703                 report_failure(204);
704         }
705 }
706
707 void
708 doread(unsigned offset, unsigned size)
709 {
710         off_t ret;
711         unsigned iret;
712
713         offset -= offset % readbdy;
714         if (o_direct)
715                 size -= size % readbdy;
716         if (size == 0) {
717                 if (!quiet && testcalls > simulatedopcount && !o_direct)
718                         prt("skipping zero size read\n");
719                 log4(OP_READ, offset, size, FL_SKIPPED);
720                 return;
721         }
722         if (size + offset > file_size) {
723                 if (!quiet && testcalls > simulatedopcount)
724                         prt("skipping seek/read past end of file\n");
725                 log4(OP_READ, offset, size, FL_SKIPPED);
726                 return;
727         }
728
729         log4(OP_READ, offset, size, FL_NONE);
730
731         if (testcalls <= simulatedopcount)
732                 return;
733
734         if (!quiet &&
735                 ((progressinterval && testcalls % progressinterval == 0)  ||
736                 (debug &&
737                        (monitorstart == -1 ||
738                         (offset + size > monitorstart &&
739                         (monitorend == -1 || offset <= monitorend))))))
740                 prt("%lu read\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
741                     offset, offset + size - 1, size);
742         ret = lseek(fd, (off_t)offset, SEEK_SET);
743         if (ret == (off_t)-1) {
744                 prterr("doread: lseek");
745                 report_failure(140);
746         }
747         iret = fsxread(fd, temp_buf, size, offset);
748         if (iret != size) {
749                 if (iret == -1)
750                         prterr("doread: read");
751                 else
752                         prt("short read: 0x%x bytes instead of 0x%x\n",
753                             iret, size);
754                 report_failure(141);
755         }
756         check_buffers(temp_buf, offset, size);
757 }
758
759 void
760 check_eofpage(char *s, unsigned offset, char *p, int size)
761 {
762         unsigned long last_page, should_be_zero;
763
764         if (offset + size <= (file_size & ~page_mask))
765                 return;
766         /*
767          * we landed in the last page of the file
768          * test to make sure the VM system provided 0's 
769          * beyond the true end of the file mapping
770          * (as required by mmap def in 1996 posix 1003.1)
771          */
772         last_page = ((unsigned long)p + (offset & page_mask) + size) & ~page_mask;
773
774         for (should_be_zero = last_page + (file_size & page_mask);
775              should_be_zero < last_page + page_size;
776              should_be_zero++)
777                 if (*(char *)should_be_zero) {
778                         prt("Mapped %s: non-zero data past EOF (0x%llx) page offset 0x%x is 0x%04x\n",
779                             s, file_size - 1, should_be_zero & page_mask,
780                             short_at(should_be_zero));
781                         report_failure(205);
782                 }
783 }
784
785 void
786 check_contents(void)
787 {
788         static char *check_buf;
789         unsigned offset = 0;
790         unsigned size = file_size;
791         unsigned map_offset;
792         unsigned map_size;
793         char *p;
794         off_t ret;
795         unsigned iret;
796
797         if (!check_buf) {
798                 check_buf = (char *) malloc(maxfilelen + writebdy);
799                 assert(check_buf != NULL);
800                 check_buf = round_ptr_up(check_buf, writebdy, 0);
801                 memset(check_buf, '\0', maxfilelen);
802         }
803
804         if (o_direct)
805                 size -= size % readbdy;
806         if (size == 0)
807                 return;
808
809         ret = lseek(fd, (off_t)offset, SEEK_SET);
810         if (ret == (off_t)-1) {
811                 prterr("doread: lseek");
812                 report_failure(140);
813         }
814
815         iret = fsxread(fd, check_buf, size, offset);
816         if (iret != size) {
817                 if (iret == -1)
818                         prterr("check_contents: read");
819                 else
820                         prt("short check read: 0x%x bytes instead of 0x%x\n",
821                             iret, size);
822                 report_failure(141);
823         }
824         check_buffers(check_buf, offset, size);
825
826         /* Map eof page, check it */
827         map_offset = size - (size & PAGE_MASK);
828         if (map_offset == size)
829                 map_offset -= PAGE_SIZE;
830         map_size  = size - map_offset;
831
832         p = mmap(0, map_size, PROT_READ, MAP_SHARED, fd, map_offset);
833         if (p == MAP_FAILED) {
834                 prterr("check_contents: mmap");
835                 report_failure(190);
836         }
837         check_eofpage("check_contents", map_offset, p, map_size);
838
839         if (munmap(p, map_size) != 0) {
840                 prterr("check_contents: munmap");
841                 report_failure(191);
842         }
843 }
844
845 void
846 domapread(unsigned offset, unsigned size)
847 {
848         unsigned pg_offset;
849         unsigned map_size;
850         char    *p;
851
852         offset -= offset % readbdy;
853         if (size == 0) {
854                 if (!quiet && testcalls > simulatedopcount)
855                         prt("skipping zero size read\n");
856                 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
857                 return;
858         }
859         if (size + offset > file_size) {
860                 if (!quiet && testcalls > simulatedopcount)
861                         prt("skipping seek/read past end of file\n");
862                 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
863                 return;
864         }
865
866         log4(OP_MAPREAD, offset, size, FL_NONE);
867
868         if (testcalls <= simulatedopcount)
869                 return;
870
871         if (!quiet &&
872                 ((progressinterval && testcalls % progressinterval == 0) ||
873                        (debug &&
874                        (monitorstart == -1 ||
875                         (offset + size > monitorstart &&
876                         (monitorend == -1 || offset <= monitorend))))))
877                 prt("%lu mapread\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
878                     offset, offset + size - 1, size);
879
880         pg_offset = offset & PAGE_MASK;
881         map_size  = pg_offset + size;
882
883         if ((p = (char *)mmap(0, map_size, PROT_READ, MAP_SHARED, fd,
884                               (off_t)(offset - pg_offset))) == (char *)-1) {
885                 prterr("domapread: mmap");
886                 report_failure(190);
887         }
888         memcpy(temp_buf, p + pg_offset, size);
889
890         check_eofpage("Read", offset, p, size);
891
892         if (munmap(p, map_size) != 0) {
893                 prterr("domapread: munmap");
894                 report_failure(191);
895         }
896
897         check_buffers(temp_buf, offset, size);
898 }
899
900
901 void
902 gendata(char *original_buf, char *good_buf, unsigned offset, unsigned size)
903 {
904         while (size--) {
905                 if (filldata) {
906                         good_buf[offset] = filldata;
907                 } else {
908                         good_buf[offset] = testcalls % 256;
909                         if (offset % 2)
910                                 good_buf[offset] += original_buf[offset];
911                 }
912                 offset++;
913         }
914 }
915
916
917 void
918 dowrite(unsigned offset, unsigned size)
919 {
920         off_t ret;
921         unsigned iret;
922
923         offset -= offset % writebdy;
924         if (o_direct)
925                 size -= size % writebdy;
926         if (size == 0) {
927                 if (!quiet && testcalls > simulatedopcount && !o_direct)
928                         prt("skipping zero size write\n");
929                 log4(OP_WRITE, offset, size, FL_SKIPPED);
930                 return;
931         }
932
933         log4(OP_WRITE, offset, size, FL_NONE);
934
935         gendata(original_buf, good_buf, offset, size);
936         if (file_size < offset + size) {
937                 if (file_size < offset)
938                         memset(good_buf + file_size, '\0', offset - file_size);
939                 file_size = offset + size;
940                 if (lite) {
941                         warn("Lite file size bug in fsx!");
942                         report_failure(149);
943                 }
944         }
945
946         if (testcalls <= simulatedopcount)
947                 return;
948
949         if (!quiet &&
950                 ((progressinterval && testcalls % progressinterval == 0) ||
951                        (debug &&
952                        (monitorstart == -1 ||
953                         (offset + size > monitorstart &&
954                         (monitorend == -1 || offset <= monitorend))))))
955                 prt("%lu write\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
956                     offset, offset + size - 1, size);
957         ret = lseek(fd, (off_t)offset, SEEK_SET);
958         if (ret == (off_t)-1) {
959                 prterr("dowrite: lseek");
960                 report_failure(150);
961         }
962         iret = fsxwrite(fd, good_buf + offset, size, offset);
963         if (iret != size) {
964                 if (iret == -1)
965                         prterr("dowrite: write");
966                 else
967                         prt("short write: 0x%x bytes instead of 0x%x\n",
968                             iret, size);
969                 report_failure(151);
970         }
971         if (do_fsync) {
972                 if (fsync(fd)) {
973                         prt("fsync() failed: %s\n", strerror(errno));
974                         report_failure(152);
975                 }
976         }
977         if (flush) {
978                 doflush(offset, size);
979         }
980 }
981
982
983 void
984 domapwrite(unsigned offset, unsigned size)
985 {
986         unsigned pg_offset;
987         unsigned map_size;
988         off_t    cur_filesize;
989         char    *p;
990
991         offset -= offset % writebdy;
992         if (size == 0) {
993                 if (!quiet && testcalls > simulatedopcount)
994                         prt("skipping zero size write\n");
995                 log4(OP_MAPWRITE, offset, size, FL_SKIPPED);
996                 return;
997         }
998         cur_filesize = file_size;
999
1000         log4(OP_MAPWRITE, offset, size, FL_NONE);
1001
1002         gendata(original_buf, good_buf, offset, size);
1003         if (file_size < offset + size) {
1004                 if (file_size < offset)
1005                         memset(good_buf + file_size, '\0', offset - file_size);
1006                 file_size = offset + size;
1007                 if (lite) {
1008                         warn("Lite file size bug in fsx!");
1009                         report_failure(200);
1010                 }
1011         }
1012
1013         if (testcalls <= simulatedopcount)
1014                 return;
1015
1016         if (!quiet &&
1017                 ((progressinterval && testcalls % progressinterval == 0) ||
1018                        (debug &&
1019                        (monitorstart == -1 ||
1020                         (offset + size > monitorstart &&
1021                         (monitorend == -1 || offset <= monitorend))))))
1022                 prt("%lu mapwrite\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
1023                     offset, offset + size - 1, size);
1024
1025         if (file_size > cur_filesize) {
1026                 if (ftruncate(fd, file_size) == -1) {
1027                         prterr("domapwrite: ftruncate");
1028                         exit(201);
1029                 }
1030         }
1031         pg_offset = offset & PAGE_MASK;
1032         map_size  = pg_offset + size;
1033
1034         if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
1035                               MAP_FILE | MAP_SHARED, fd,
1036                               (off_t)(offset - pg_offset))) == (char *)-1) {
1037                 prterr("domapwrite: mmap");
1038                 report_failure(202);
1039         }
1040         memcpy(p + pg_offset, good_buf + offset, size);
1041         if (msync(p, map_size, MS_SYNC) != 0) {
1042                 prterr("domapwrite: msync");
1043                 report_failure(203);
1044         }
1045
1046         check_eofpage("Write", offset, p, size);
1047
1048         if (munmap(p, map_size) != 0) {
1049                 prterr("domapwrite: munmap");
1050                 report_failure(204);
1051         }
1052 }
1053
1054
1055 void
1056 dotruncate(unsigned size)
1057 {
1058         int oldsize = file_size;
1059
1060         size -= size % truncbdy;
1061         if (size > biggest) {
1062                 biggest = size;
1063                 if (!quiet && testcalls > simulatedopcount)
1064                         prt("truncating to largest ever: 0x%x\n", size);
1065         }
1066
1067         log4(OP_TRUNCATE, 0, size, FL_NONE);
1068
1069         if (size > file_size)
1070                 memset(good_buf + file_size, '\0', size - file_size);
1071         file_size = size;
1072
1073         if (testcalls <= simulatedopcount)
1074                 return;
1075         
1076         if ((progressinterval && testcalls % progressinterval == 0) ||
1077             (debug && (monitorstart == -1 || monitorend == -1 ||
1078                       size <= monitorend)))
1079                 prt("%lu trunc\tfrom 0x%x to 0x%x\n", testcalls, oldsize, size);
1080         if (ftruncate(fd, (off_t)size) == -1) {
1081                 prt("ftruncate1: %x\n", size);
1082                 prterr("dotruncate: ftruncate");
1083                 report_failure(160);
1084         }
1085 }
1086
1087 #ifdef FALLOC_FL_PUNCH_HOLE
1088 void
1089 do_punch_hole(unsigned offset, unsigned length)
1090 {
1091         unsigned end_offset;
1092         int max_offset = 0;
1093         int max_len = 0;
1094         int mode = FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE;
1095
1096         if (length == 0) {
1097                 if (!quiet && testcalls > simulatedopcount)
1098                         prt("skipping zero length punch hole\n");
1099                 log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
1100                 return;
1101         }
1102
1103         if (file_size <= (loff_t)offset) {
1104                 if (!quiet && testcalls > simulatedopcount)
1105                         prt("skipping hole punch off the end of the file\n");
1106                 log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
1107                 return;
1108         }
1109
1110         end_offset = offset + length;
1111
1112         log4(OP_PUNCH_HOLE, offset, length, FL_NONE);
1113
1114         if (testcalls <= simulatedopcount)
1115                 return;
1116
1117         if ((progressinterval && testcalls % progressinterval == 0) ||
1118             (debug && (monitorstart == -1 || monitorend == -1 ||
1119                       end_offset <= monitorend))) {
1120                 prt("%lu punch\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1121                         offset, offset+length, length);
1122         }
1123         if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1124                 prt("punch hole: 0x%x to 0x%x\n", offset, offset + length);
1125                 prterr("do_punch_hole: fallocate");
1126                 report_failure(161);
1127         }
1128
1129
1130         max_offset = offset < file_size ? offset : file_size;
1131         max_len = max_offset + length <= file_size ? length :
1132                         file_size - max_offset;
1133         memset(good_buf + max_offset, '\0', max_len);
1134 }
1135
1136 #else
1137 void
1138 do_punch_hole(unsigned offset, unsigned length)
1139 {
1140         return;
1141 }
1142 #endif
1143
1144 #ifdef FALLOC_FL_ZERO_RANGE
1145 void
1146 do_zero_range(unsigned offset, unsigned length, int keep_size)
1147 {
1148         unsigned end_offset;
1149         int mode = FALLOC_FL_ZERO_RANGE;
1150
1151         if (length == 0) {
1152                 if (!quiet && testcalls > simulatedopcount)
1153                         prt("skipping zero length zero range\n");
1154                 log4(OP_ZERO_RANGE, offset, length, FL_SKIPPED |
1155                      (keep_size ? FL_KEEP_SIZE : FL_NONE));
1156                 return;
1157         }
1158
1159         end_offset = keep_size ? 0 : offset + length;
1160
1161         if (end_offset > biggest) {
1162                 biggest = end_offset;
1163                 if (!quiet && testcalls > simulatedopcount)
1164                         prt("zero_range to largest ever: 0x%x\n", end_offset);
1165         }
1166
1167         /*
1168          * last arg matches fallocate string array index in logdump:
1169          *      0: allocate past EOF
1170          *      1: extending prealloc
1171          *      2: interior prealloc
1172          */
1173         log4(OP_ZERO_RANGE, offset, length,
1174              keep_size ? FL_KEEP_SIZE : FL_NONE);
1175
1176         if (testcalls <= simulatedopcount)
1177                 return;
1178
1179         if ((progressinterval && testcalls % progressinterval == 0) ||
1180             (debug && (monitorstart == -1 || monitorend == -1 ||
1181                       end_offset <= monitorend))) {
1182                 prt("%lu zero\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1183                         offset, offset+length, length);
1184         }
1185         if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1186                 prt("zero range: 0x%x to 0x%x\n", offset, offset + length);
1187                 prterr("do_zero_range: fallocate");
1188                 report_failure(161);
1189         }
1190
1191         memset(good_buf + offset, '\0', length);
1192 }
1193
1194 #else
1195 void
1196 do_zero_range(unsigned offset, unsigned length, int keep_size)
1197 {
1198         return;
1199 }
1200 #endif
1201
1202 #ifdef FALLOC_FL_COLLAPSE_RANGE
1203 void
1204 do_collapse_range(unsigned offset, unsigned length)
1205 {
1206         unsigned end_offset;
1207         int mode = FALLOC_FL_COLLAPSE_RANGE;
1208
1209         if (length == 0) {
1210                 if (!quiet && testcalls > simulatedopcount)
1211                         prt("skipping zero length collapse range\n");
1212                 log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
1213                 return;
1214         }
1215
1216         end_offset = offset + length;
1217         if ((loff_t)end_offset >= file_size) {
1218                 if (!quiet && testcalls > simulatedopcount)
1219                         prt("skipping collapse range behind EOF\n");
1220                 log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
1221                 return;
1222         }
1223
1224         log4(OP_COLLAPSE_RANGE, offset, length, FL_NONE);
1225
1226         if (testcalls <= simulatedopcount)
1227                 return;
1228
1229         if ((progressinterval && testcalls % progressinterval == 0) ||
1230             (debug && (monitorstart == -1 || monitorend == -1 ||
1231                       end_offset <= monitorend))) {
1232                 prt("%lu collapse\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1233                         offset, offset+length, length);
1234         }
1235         if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1236                 prt("collapse range: 0x%x to 0x%x\n", offset, offset + length);
1237                 prterr("do_collapse_range: fallocate");
1238                 report_failure(161);
1239         }
1240
1241         memmove(good_buf + offset, good_buf + end_offset,
1242                 file_size - end_offset);
1243         file_size -= length;
1244 }
1245
1246 #else
1247 void
1248 do_collapse_range(unsigned offset, unsigned length)
1249 {
1250         return;
1251 }
1252 #endif
1253
1254 #ifdef FALLOC_FL_INSERT_RANGE
1255 void
1256 do_insert_range(unsigned offset, unsigned length)
1257 {
1258         unsigned end_offset;
1259         int mode = FALLOC_FL_INSERT_RANGE;
1260
1261         if (length == 0) {
1262                 if (!quiet && testcalls > simulatedopcount)
1263                         prt("skipping zero length insert range\n");
1264                 log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
1265                 return;
1266         }
1267
1268         if ((loff_t)offset >= file_size) {
1269                 if (!quiet && testcalls > simulatedopcount)
1270                         prt("skipping insert range behind EOF\n");
1271                 log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
1272                 return;
1273         }
1274
1275         log4(OP_INSERT_RANGE, offset, length, FL_NONE);
1276
1277         if (testcalls <= simulatedopcount)
1278                 return;
1279
1280         end_offset = offset + length;
1281         if ((progressinterval && testcalls % progressinterval == 0) ||
1282             (debug && (monitorstart == -1 || monitorend == -1 ||
1283                       end_offset <= monitorend))) {
1284                 prt("%lu insert\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1285                         offset, offset+length, length);
1286         }
1287         if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1288                 prt("insert range: 0x%x to 0x%x\n", offset, offset + length);
1289                 prterr("do_insert_range: fallocate");
1290                 report_failure(161);
1291         }
1292
1293         memmove(good_buf + end_offset, good_buf + offset,
1294                 file_size - offset);
1295         memset(good_buf + offset, '\0', length);
1296         file_size += length;
1297 }
1298
1299 #else
1300 void
1301 do_insert_range(unsigned offset, unsigned length)
1302 {
1303         return;
1304 }
1305 #endif
1306
#ifdef HAVE_LINUX_FALLOC_H
/*
 * Preallocate `length` bytes at `offset` with fallocate().
 *
 * With keep_size set, FALLOC_FL_KEEP_SIZE is passed and the expected file
 * size is left alone.  Otherwise a range ending past file_size extends the
 * expected image: the new bytes are zeroed in good_buf and file_size moves
 * to the end of the range.  A zero-length request is only logged as
 * skipped, and the syscall is not issued while
 * testcalls <= simulatedopcount.
 */
void
do_preallocate(unsigned offset, unsigned length, int keep_size)
{
	const int	log_keep = keep_size ? FL_KEEP_SIZE : FL_NONE;
	const int	mode = keep_size ? FALLOC_FL_KEEP_SIZE : 0;
	unsigned	end_offset;
	int		announce;

	if (length == 0) {
		if (!quiet && testcalls > simulatedopcount)
			prt("skipping zero length fallocate\n");
		log4(OP_FALLOCATE, offset, length, FL_SKIPPED | log_keep);
		return;
	}

	/* With keep_size the file cannot grow, so treat its end as 0. */
	end_offset = keep_size ? 0 : offset + length;

	if (end_offset > biggest) {
		biggest = end_offset;
		if (!quiet && testcalls > simulatedopcount)
			prt("fallocating to largest ever: 0x%x\n", end_offset);
	}

	log4(OP_FALLOCATE, offset, length, log_keep);

	if (end_offset > file_size) {
		memset(good_buf + file_size, '\0', end_offset - file_size);
		file_size = end_offset;
	}

	if (testcalls <= simulatedopcount)
		return;

	announce = (progressinterval && testcalls % progressinterval == 0) ||
		   (debug && (monitorstart == -1 || monitorend == -1 ||
			      end_offset <= monitorend));
	if (announce)
		prt("%lu falloc\tfrom 0x%x to 0x%x (0x%x bytes)\n", testcalls,
				offset, offset + length, length);

	if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
		prt("fallocate: 0x%x to 0x%x\n", offset, offset + length);
		prterr("do_preallocate: fallocate");
		report_failure(161);
	}
}
#else
/* Stub used when HAVE_LINUX_FALLOC_H is not defined: does nothing. */
void
do_preallocate(unsigned offset, unsigned length, int keep_size)
{
}
#endif
1365
1366 void
1367 writefileimage()
1368 {
1369         ssize_t iret;
1370
1371         if (lseek(fd, (off_t)0, SEEK_SET) == (off_t)-1) {
1372                 prterr("writefileimage: lseek");
1373                 report_failure(171);
1374         }
1375         iret = write(fd, good_buf, file_size);
1376         if ((off_t)iret != file_size) {
1377                 if (iret == -1)
1378                         prterr("writefileimage: write");
1379                 else
1380                         prt("short write: 0x%x bytes instead of 0x%llx\n",
1381                             iret, (unsigned long long)file_size);
1382                 report_failure(172);
1383         }
1384         if (lite ? 0 : ftruncate(fd, file_size) == -1) {
1385                 prt("ftruncate2: %llx\n", (unsigned long long)file_size);
1386                 prterr("writefileimage: ftruncate");
1387                 report_failure(173);
1388         }
1389 }
1390
1391
1392 void
1393 docloseopen(void)
1394
1395         if (testcalls <= simulatedopcount)
1396                 return;
1397
1398         if (debug)
1399                 prt("%lu close/open\n", testcalls);
1400         if (close(fd)) {
1401                 prterr("docloseopen: close");
1402                 report_failure(180);
1403         }
1404         fd = open(fname, O_RDWR|o_direct, 0);
1405         if (fd < 0) {
1406                 prterr("docloseopen: open");
1407                 report_failure(181);
1408         }
1409 }
1410
1411 void
1412 dofsync(void)
1413 {
1414         int ret;
1415
1416         if (testcalls <= simulatedopcount)
1417                 return;
1418         if (debug)
1419                 prt("%lu fsync\n", testcalls);
1420         log4(OP_FSYNC, 0, 0, 0);
1421         ret = fsync(fd);
1422         if (ret < 0) {
1423                 prterr("dofsync");
1424                 report_failure(210);
1425         }
1426         mark_log();
1427         dump_fsync_buffer();
1428         mark_nr++;
1429 }
1430
/* Reduce off modulo size; a zero size forces off to 0. */
#define TRIM_OFF(off, size)				\
do {							\
	(off) = (size) ? (off) % (size) : 0;		\
} while (0)

/* Shorten len so that off + len does not exceed size. */
#define TRIM_LEN(off, len, size)			\
do {							\
	if ((off) + (len) > (size)) {			\
		(len) = (size) - (off);			\
	}						\
} while (0)

/* TRIM_OFF followed by TRIM_LEN against the same size. */
#define TRIM_OFF_LEN(off, len, size)			\
do {							\
	TRIM_OFF(off, size);				\
	TRIM_LEN(off, len, size);			\
} while (0)
1450
1451 void
1452 cleanup(int sig)
1453 {
1454         if (sig)
1455                 prt("signal %d\n", sig);
1456         prt("testcalls = %lu\n", testcalls);
1457         exit(sig);
1458 }
1459
/*
 * Number of numeric arguments that follow an operation name in a replay
 * log line.  Every operation currently takes three.
 */
static int
op_args_count(int operation)
{
	int nr_args = 3;

	switch (operation) {
	default:
		break;
	}

	return nr_args;
}
1468
1469 static int
1470 read_op(struct log_entry *log_entry)
1471 {
1472         char line[256];
1473
1474         memset(log_entry, 0, sizeof(*log_entry));
1475         log_entry->operation = -1;
1476
1477         while (log_entry->operation == -1) {
1478                 char *str;
1479                 int i;
1480
1481                 do {
1482                         if (!fgets(line, sizeof(line), replayopsf)) {
1483                                 if (feof(replayopsf)) {
1484                                         replayopsf = NULL;
1485                                         return 0;
1486                                 }
1487                                 goto fail;
1488                         }
1489                         str = strtok(line, " \t\n");
1490                 } while (!str || str[0] == '#');
1491
1492                 if (strcmp(str, "skip") == 0) {
1493                         log_entry->flags |= FL_SKIPPED;
1494                         str = strtok(NULL, " \t\n");
1495                         if (!str)
1496                                 goto fail;
1497                 }
1498                 log_entry->operation = op_code(str);
1499                 if (log_entry->operation == -1)
1500                         goto fail;
1501                 log_entry->nr_args = op_args_count(log_entry->operation);
1502                 for (i = 0; i < log_entry->nr_args; i++) {
1503                         char *end;
1504
1505                         str = strtok(NULL, " \t\n");
1506                         if (!str)
1507                                 goto fail;
1508                         log_entry->args[i] = strtoul(str, &end, 0);
1509                         if (*end)
1510                                 goto fail;
1511                 }
1512                 while ((str = strtok(NULL, " \t\n"))) {
1513                         if (strcmp(str, "keep_size") == 0)
1514                                 log_entry->flags |= FL_KEEP_SIZE;
1515                         else if (strcmp(str, "close_open") == 0)
1516                                 log_entry->flags |= FL_CLOSE_OPEN;
1517                         else if (strcmp(str, "*") == 0)
1518                                 ;  /* overlap marker; ignore */
1519                         else
1520                                 goto fail;
1521                 }
1522         }
1523         return 1;
1524
1525 fail:
1526         fprintf(stderr, "%s: parse error\n", replayops);
1527         fclose(replayopsf);
1528         replayopsf = NULL;
1529         cleanup(100);  /* doesn't return */
1530         return 0;
1531 }
1532
1533
1534 int
1535 test(void)
1536 {
1537         unsigned long   offset;
1538         unsigned long   size;
1539         unsigned long   rv;
1540         unsigned long   op;
1541         int             keep_size = 0;
1542
1543         if (simulatedopcount > 0 && testcalls == simulatedopcount)
1544                 writefileimage();
1545
1546         testcalls++;
1547
1548         if (debugstart > 0 && testcalls >= debugstart)
1549                 debug = 1;
1550
1551         if (!quiet && testcalls < simulatedopcount && testcalls % 100000 == 0)
1552                 prt("%lu...\n", testcalls);
1553
1554         if (replayopsf) {
1555                 struct log_entry log_entry;
1556
1557                 while (read_op(&log_entry)) {
1558                         if (log_entry.flags & FL_SKIPPED) {
1559                                 log4(log_entry.operation,
1560                                      log_entry.args[0], log_entry.args[1],
1561                                      log_entry.flags);
1562                                 continue;
1563                         }
1564
1565                         op = log_entry.operation;
1566                         offset = log_entry.args[0];
1567                         size = log_entry.args[1];
1568                         closeopen = !!(log_entry.flags & FL_CLOSE_OPEN);
1569                         keep_size = !!(log_entry.flags & FL_KEEP_SIZE);
1570                         goto have_op;
1571                 }
1572                 return 0;
1573         }
1574
1575         rv = random();
1576         if (closeprob)
1577                 closeopen = (rv >> 3) < (1 << 28) / closeprob;
1578
1579         offset = random();
1580         size = maxoplen;
1581         if (randomoplen)
1582                 size = random() % (maxoplen + 1);
1583
1584         /* calculate appropriate op to run */
1585         if (lite)
1586                 op = rv % OP_MAX_LITE;
1587         else if (!integrity)
1588                 op = rv % OP_MAX_FULL;
1589         else
1590                 op = rv % OP_MAX_INTEGRITY;
1591
1592         switch(op) {
1593         case OP_TRUNCATE:
1594                 if (!style)
1595                         size = random() % maxfilelen;
1596                 break;
1597         case OP_FALLOCATE:
1598                 if (fallocate_calls && size && keep_size_calls)
1599                         keep_size = random() % 2;
1600                 break;
1601         case OP_ZERO_RANGE:
1602                 if (zero_range_calls && size && keep_size_calls)
1603                         keep_size = random() % 2;
1604                 break;
1605         }
1606
1607 have_op:
1608
1609         switch (op) {
1610         case OP_MAPREAD:
1611                 if (!mapped_reads)
1612                         op = OP_READ;
1613                 break;
1614         case OP_MAPWRITE:
1615                 if (!mapped_writes)
1616                         op = OP_WRITE;
1617                 break;
1618         case OP_FALLOCATE:
1619                 if (!fallocate_calls) {
1620                         log4(OP_FALLOCATE, offset, size, FL_SKIPPED);
1621                         goto out;
1622                 }
1623                 break;
1624         case OP_PUNCH_HOLE:
1625                 if (!punch_hole_calls) {
1626                         log4(OP_PUNCH_HOLE, offset, size, FL_SKIPPED);
1627                         goto out;
1628                 }
1629                 break;
1630         case OP_ZERO_RANGE:
1631                 if (!zero_range_calls) {
1632                         log4(OP_ZERO_RANGE, offset, size, FL_SKIPPED);
1633                         goto out;
1634                 }
1635                 break;
1636         case OP_COLLAPSE_RANGE:
1637                 if (!collapse_range_calls) {
1638                         log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
1639                         goto out;
1640                 }
1641                 break;
1642         case OP_INSERT_RANGE:
1643                 if (!insert_range_calls) {
1644                         log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
1645                         goto out;
1646                 }
1647                 break;
1648         }
1649
1650         switch (op) {
1651         case OP_READ:
1652                 TRIM_OFF_LEN(offset, size, file_size);
1653                 doread(offset, size);
1654                 break;
1655
1656         case OP_WRITE:
1657                 TRIM_OFF_LEN(offset, size, maxfilelen);
1658                 dowrite(offset, size);
1659                 break;
1660
1661         case OP_MAPREAD:
1662                 TRIM_OFF_LEN(offset, size, file_size);
1663                 domapread(offset, size);
1664                 break;
1665
1666         case OP_MAPWRITE:
1667                 TRIM_OFF_LEN(offset, size, maxfilelen);
1668                 domapwrite(offset, size);
1669                 break;
1670
1671         case OP_TRUNCATE:
1672                 dotruncate(size);
1673                 break;
1674
1675         case OP_FALLOCATE:
1676                 TRIM_OFF_LEN(offset, size, maxfilelen);
1677                 do_preallocate(offset, size, keep_size);
1678                 break;
1679
1680         case OP_PUNCH_HOLE:
1681                 TRIM_OFF_LEN(offset, size, file_size);
1682                 do_punch_hole(offset, size);
1683                 break;
1684         case OP_ZERO_RANGE:
1685                 TRIM_OFF_LEN(offset, size, file_size);
1686                 do_zero_range(offset, size, keep_size);
1687                 break;
1688         case OP_COLLAPSE_RANGE:
1689                 TRIM_OFF_LEN(offset, size, file_size - 1);
1690                 offset = offset & ~(block_size - 1);
1691                 size = size & ~(block_size - 1);
1692                 if (size == 0) {
1693                         log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
1694                         goto out;
1695                 }
1696                 do_collapse_range(offset, size);
1697                 break;
1698         case OP_INSERT_RANGE:
1699                 TRIM_OFF(offset, file_size);
1700                 TRIM_LEN(file_size, size, maxfilelen);
1701                 offset = offset & ~(block_size - 1);
1702                 size = size & ~(block_size - 1);
1703                 if (size == 0) {
1704                         log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
1705                         goto out;
1706                 }
1707                 if (file_size + size > maxfilelen) {
1708                         log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
1709                         goto out;
1710                 }
1711
1712                 do_insert_range(offset, size);
1713                 break;
1714         case OP_FSYNC:
1715                 dofsync();
1716                 break;
1717         default:
1718                 prterr("test: unknown operation");
1719                 report_failure(42);
1720                 break;
1721         }
1722
1723         if (check_file && testcalls > simulatedopcount)
1724                 check_contents();
1725
1726 out:
1727         if (sizechecks && testcalls > simulatedopcount)
1728                 check_size();
1729         if (closeopen)
1730                 docloseopen();
1731         return 1;
1732 }
1733
1734
/*
 * Print the command-line synopsis and the per-option help text to stdout,
 * then terminate the process with exit status 90.  Does not return.
 *
 * Help lines for optional features are compiled in only when the matching
 * macro (AIO, HAVE_LINUX_FALLOC_H, FALLOC_FL_*) is defined.
 */
void
usage(void)
{
	/*
	 * The text lives in its own object so that no preprocessor directive
	 * appears inside the argument list of fprintf(), which is allowed to
	 * be a macro.
	 */
	static const char help[] =
"fsx [-dfknqxyzACFHIKLORWXZ] [-b opnum] [-c Prob] [-g filldata] [-i logdev] [-j logid] [-l flen] [-m start:end] [-o oplen] [-p progressinterval] [-r readbdy] [-s style] [-t truncbdy] [-w writebdy] [-D startingop] [-N numops] [-P dirpath] [-S seed] fname\n"
"\t-b opnum: beginning operation number (default 1)\n"
"\t-c P: 1 in P chance of file close+open at each op (default infinity)\n"
"\t-d: debug output for all operations\n"
"\t-f flush and invalidate cache after I/O\n"
"\t-g X: write character X instead of random generated data\n"
"\t-i logdev: do integrity testing, logdev is the dm log writes device\n"
"\t-j logid: prefix debug log messages with this id\n"
"\t-k: do not truncate existing file and use its size as upper bound on file size\n"
"\t-l flen: the upper bound on file size (default 262144)\n"
"\t-m startop:endop: monitor (print debug output) specified byte range (default 0:infinity)\n"
"\t-n: no verifications of file size\n"
"\t-o oplen: the upper bound on operation size (default 65536)\n"
"\t-p progressinterval: debug output at specified operation interval\n"
"\t-q: quieter operation\n"
"\t-r readbdy: 4096 would make reads page aligned (default 1)\n"
"\t-s style: 1 gives smaller truncates (default 0)\n"
"\t-t truncbdy: 4096 would make truncates page aligned (default 1)\n"
"\t-w writebdy: 4096 would make writes page aligned (default 1)\n"
"\t-x: preallocate file space before starting, XFS only (default 0)\n"
"\t-y synchronize changes to a file\n"
#ifdef AIO
"\t-A: Use the AIO system calls\n"
#endif
"\t-D startingop: debug output starting at specified operation\n"
#ifdef HAVE_LINUX_FALLOC_H
"\t-F: Do not use fallocate (preallocation) calls\n"
#endif
#ifdef FALLOC_FL_PUNCH_HOLE
"\t-H: Do not use punch hole calls\n"
#endif
#ifdef FALLOC_FL_ZERO_RANGE
"\t-z: Do not use zero range calls\n"
#endif
#ifdef FALLOC_FL_COLLAPSE_RANGE
"\t-C: Do not use collapse range calls\n"
#endif
#ifdef FALLOC_FL_INSERT_RANGE
"\t-I: Do not use insert range calls\n"
#endif
#ifdef FALLOC_FL_KEEP_SIZE
"\t-K: Do not use keep size calls\n"
#endif
"\t-L: fsxLite - no file creations & no file size changes\n"
"\t-N numops: total # operations to do (default infinity)\n"
"\t-O: use oplen (see -o flag) for every op (default random)\n"
"\t-P dirpath: save .fsxlog .fsxops and .fsxgood files in dirpath (default ./)\n"
"\t-S seed: for random # generator (default 1) 0 gets timestamp\n"
"\t-W: mapped write operations DISabled\n"
"\t-X: Read file and compare to good buffer after every operation.\n"
"\t-R: read() system calls only (mapped reads disabled)\n"
"\t-Z: O_DIRECT (use -R, -W, -r and -w too)\n"
"\t--replay-ops opsfile: replay ops from recorded .fsxops file\n"
"\t--record-ops[=opsfile]: dump ops file also on success. optionally specify ops file name\n"
"\tfname: this filename is REQUIRED (no default)\n";

	fprintf(stdout, "usage: %s", help);
	exit(90);
}
1794
1795
/*
 * Parse a number with an optional one-letter size suffix.
 *
 * The numeric part is parsed by strtol() with base 0, so decimal, octal
 * (leading 0) and hexadecimal (leading 0x) are accepted.  A single suffix
 * character directly after the number scales the value:
 *
 *	b/B  x 512
 *	k/K  x 1024
 *	m/M  x 1024*1024
 *	w/W  x 4
 *
 * s: string to parse.
 * e: must not be NULL; on return *e points at the first character that was
 *    not consumed (just past the suffix, if one was recognised).
 *
 * Returns the scaled value.  A result that does not fit in an int is
 * saturated to INT_MAX / INT_MIN and errno is set to ERANGE, mirroring what
 * strtol() does for long, instead of overflowing a signed int.
 */
int
getnum(char *s, char **e)
{
	long long value;
	long long scale = 1;
	int clamped = 0;

	value = strtol(s, e, 0);

	/* Bound the raw number first so the multiplication cannot overflow. */
	if (value > INT_MAX) {
		value = INT_MAX;
		clamped = 1;
	} else if (value < INT_MIN) {
		value = INT_MIN;
		clamped = 1;
	}

	switch (**e) {
	case 'b':
	case 'B':
		scale = 512;
		break;
	case 'k':
	case 'K':
		scale = 1024;
		break;
	case 'm':
	case 'M':
		scale = 1024 * 1024;
		break;
	case 'w':
	case 'W':
		scale = 4;
		break;
	default:
		break;
	}

	if (scale != 1) {
		*e = *e + 1;		/* step over the suffix letter */
		value *= scale;
		if (value > INT_MAX) {
			value = INT_MAX;
			clamped = 1;
		} else if (value < INT_MIN) {
			value = INT_MIN;
			clamped = 1;
		}
	}

	if (clamped)
		errno = ERANGE;

	return (int)value;
}
1828
1829 #ifdef AIO
1830
1831 #define QSZ     1024
1832 io_context_t    io_ctx;
1833 struct iocb     iocb;
1834
1835 int aio_setup()
1836 {
1837         int ret;
1838         ret = io_queue_init(QSZ, &io_ctx);
1839         if (ret != 0) {
1840                 fprintf(stderr, "aio_setup: io_queue_init failed: %s\n",
1841                         strerror(ret));
1842                 return(-1);
1843         }
1844         return(0);
1845 }
1846
1847 int
1848 __aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
1849 {
1850         struct io_event event;
1851         static struct timespec ts;
1852         struct iocb *iocbs[] = { &iocb };
1853         int ret;
1854         long res;
1855
1856         if (rw == READ) {
1857                 io_prep_pread(&iocb, fd, buf, len, offset);
1858         } else {
1859                 io_prep_pwrite(&iocb, fd, buf, len, offset);
1860         }
1861
1862         ts.tv_sec = 30;
1863         ts.tv_nsec = 0;
1864         ret = io_submit(io_ctx, 1, iocbs);
1865         if (ret != 1) {
1866                 fprintf(stderr, "errcode=%d\n", ret);
1867                 fprintf(stderr, "aio_rw: io_submit failed: %s\n",
1868                                 strerror(ret));
1869                 goto out_error;
1870         }
1871
1872         ret = io_getevents(io_ctx, 1, 1, &event, &ts);
1873         if (ret != 1) {
1874                 if (ret == 0)
1875                         fprintf(stderr, "aio_rw: no events available\n");
1876                 else {
1877                         fprintf(stderr, "errcode=%d\n", -ret);
1878                         fprintf(stderr, "aio_rw: io_getevents failed: %s\n",
1879                                         strerror(-ret));
1880                 }
1881                 goto out_error;
1882         }
1883         if (len != event.res) {
1884                 /*
1885                  * The b0rked libaio defines event.res as unsigned.
1886                  * However the kernel strucuture has it signed,
1887                  * and it's used to pass negated error value.
1888                  * Till the library is fixed use the temp var.
1889                  */
1890                 res = (long)event.res;
1891                 if (res >= 0)
1892                         fprintf(stderr, "bad io length: %lu instead of %u\n",
1893                                         res, len);
1894                 else {
1895                         fprintf(stderr, "errcode=%ld\n", -res);
1896                         fprintf(stderr, "aio_rw: async io failed: %s\n",
1897                                         strerror(-res));
1898                         ret = res;
1899                         goto out_error;
1900                 }
1901
1902         }
1903         return event.res;
1904
1905 out_error:
1906         /*
1907          * The caller expects error return in traditional libc
1908          * convention, i.e. -1 and the errno set to error.
1909          */
1910         errno = -ret;
1911         return -1;
1912 }
1913
1914 int aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
1915 {
1916         int ret;
1917
1918         if (aio) {
1919                 ret = __aio_rw(rw, fd, buf, len, offset);
1920         } else {
1921                 if (rw == READ)
1922                         ret = read(fd, buf, len);
1923                 else
1924                         ret = write(fd, buf, len);
1925         }
1926         return ret;
1927 }
1928
1929 #endif
1930
1931 #define test_fallocate(mode) __test_fallocate(mode, #mode)
1932
/*
 * Probe whether fallocate() with the given mode can be used on the test
 * file (global fd).  Normally invoked through the test_fallocate() macro,
 * which supplies mode_str as the stringified mode expression.
 *
 * mode:     fallocate() mode flags to try.
 * mode_str: text used for that mode in the diagnostic message.
 *
 * Returns 1 if the mode should stay enabled, 0 if it must be disabled.
 * The result is 0 when running in lite mode, when the probe fails with
 * EOPNOTSUPP, or when the program was built without HAVE_LINUX_FALLOC_H.
 * Any other probe outcome counts as "supported".
 */
int
__test_fallocate(int mode, const char *mode_str)
{
	int ret = 0;

#ifdef HAVE_LINUX_FALLOC_H
	if (!lite) {
		/* Probe with a one-byte range starting at the current EOF. */
		if (fallocate(fd, mode, file_size, 1) && errno == EOPNOTSUPP) {
			if(!quiet)
				fprintf(stderr,
					"main: filesystem does not support "
					"fallocate mode %s, disabling!\n",
					mode_str);
		} else {
			ret = 1;
			/*
			 * Set the length back to file_size, presumably to
			 * undo any size change made by the probe.
			 */
			if (ftruncate(fd, file_size)) {
				warn("main: ftruncate");
				exit(132);
			}
		}
	}
#else
	/* No fallocate support compiled in: report every mode as unusable. */
	(void)mode;
	(void)mode_str;
#endif
	return ret;
}
1956
/*
 * Long options understood by main().  The `val` numbers are what
 * getopt_long() returns for each option and must stay in step with the
 * matching `case` labels in main()'s option switch.
 */
static struct option longopts[] = {
	{ "replay-ops", required_argument, NULL, 256 },
	{ "record-ops", optional_argument, NULL, 255 },
	{ NULL, 0, NULL, 0 }	/* terminator required by getopt_long() */
};
1962
1963 int
1964 main(int argc, char **argv)
1965 {
1966         int     i, style, ch;
1967         char    *endp, *tmp;
1968         char logfile[PATH_MAX];
1969         struct stat statbuf;
1970         int o_flags = O_RDWR|O_CREAT|O_TRUNC;
1971
1972         logfile[0] = 0;
1973         dname[0] = 0;
1974
1975         page_size = getpagesize();
1976         page_mask = page_size - 1;
1977         mmap_mask = page_mask;
1978         
1979
1980         setvbuf(stdout, (char *)0, _IOLBF, 0); /* line buffered stdout */
1981
1982         while ((ch = getopt_long(argc, argv,
1983                                  "b:c:dfg:i:j:kl:m:no:p:qr:s:t:w:xyAD:FKHzCILN:OP:RS:WXZ",
1984                                  longopts, NULL)) != EOF)
1985                 switch (ch) {
1986                 case 'b':
1987                         simulatedopcount = getnum(optarg, &endp);
1988                         if (!quiet)
1989                                 prt("Will begin at operation %ld\n", simulatedopcount);
1990                         if (simulatedopcount == 0)
1991                                 usage();
1992                         simulatedopcount -= 1;
1993                         break;
1994                 case 'c':
1995                         closeprob = getnum(optarg, &endp);
1996                         if (!quiet)
1997                                 prt("Chance of close/open is 1 in %d\n", closeprob);
1998                         if (closeprob <= 0)
1999                                 usage();
2000                         break;
2001                 case 'd':
2002                         debug = 1;
2003                         break;
2004                 case 'f':
2005                         flush = 1;
2006                         break;
2007                 case 'g':
2008                         filldata = *optarg;
2009                         break;
2010                 case 'i':
2011                         integrity = 1;
2012                         logdev = strdup(optarg);
2013                         if (!logdev) {
2014                                 prterr("strdup");
2015                                 exit(101);
2016                         }
2017                         break;
2018                 case 'j':
2019                         logid = strdup(optarg);
2020                         if (!logid) {
2021                                 prterr("strdup");
2022                                 exit(101);
2023                         }
2024                         break;
2025                 case 'k':
2026                         o_flags &= ~O_TRUNC;
2027                         break;
2028                 case 'l':
2029                         maxfilelen = getnum(optarg, &endp);
2030                         if (maxfilelen <= 0)
2031                                 usage();
2032                         break;
2033                 case 'm':
2034                         monitorstart = getnum(optarg, &endp);
2035                         if (monitorstart < 0)
2036                                 usage();
2037                         if (!endp || *endp++ != ':')
2038                                 usage();
2039                         monitorend = getnum(endp, &endp);
2040                         if (monitorend < 0)
2041                                 usage();
2042                         if (monitorend == 0)
2043                                 monitorend = -1; /* aka infinity */
2044                         debug = 1;
2045                 case 'n':
2046                         sizechecks = 0;
2047                         break;
2048                 case 'o':
2049                         maxoplen = getnum(optarg, &endp);
2050                         if (maxoplen <= 0)
2051                                 usage();
2052                         break;
2053                 case 'p':
2054                         progressinterval = getnum(optarg, &endp);
2055                         if (progressinterval == 0)
2056                                 usage();
2057                         break;
2058                 case 'q':
2059                         quiet = 1;
2060                         break;
2061                 case 'r':
2062                         readbdy = getnum(optarg, &endp);
2063                         if (readbdy <= 0)
2064                                 usage();
2065                         break;
2066                 case 's':
2067                         style = getnum(optarg, &endp);
2068                         if (style < 0 || style > 1)
2069                                 usage();
2070                         break;
2071                 case 't':
2072                         truncbdy = getnum(optarg, &endp);
2073                         if (truncbdy <= 0)
2074                                 usage();
2075                         break;
2076                 case 'w':
2077                         writebdy = getnum(optarg, &endp);
2078                         if (writebdy <= 0)
2079                                 usage();
2080                         break;
2081                 case 'x':
2082                         prealloc = 1;
2083                         break;
2084                 case 'y':
2085                         do_fsync = 1;
2086                         break;
2087                 case 'A':
2088                         aio = 1;
2089                         break;
2090                 case 'D':
2091                         debugstart = getnum(optarg, &endp);
2092                         if (debugstart < 1)
2093                                 usage();
2094                         break;
2095                 case 'F':
2096                         fallocate_calls = 0;
2097                         break;
2098                 case 'K':
2099                         keep_size_calls = 0;
2100                         break;
2101                 case 'H':
2102                         punch_hole_calls = 0;
2103                         break;
2104                 case 'z':
2105                         zero_range_calls = 0;
2106                         break;
2107                 case 'C':
2108                         collapse_range_calls = 0;
2109                         break;
2110                 case 'I':
2111                         insert_range_calls = 0;
2112                         break;
2113                 case 'L':
2114                         lite = 1;
2115                         o_flags &= ~(O_CREAT|O_TRUNC);
2116                         break;
2117                 case 'N':
2118                         numops = getnum(optarg, &endp);
2119                         if (numops < 0)
2120                                 usage();
2121                         break;
2122                 case 'O':
2123                         randomoplen = 0;
2124                         break;
2125                 case 'P':
2126                         strncpy(dname, optarg, sizeof(dname));
2127                         strcat(dname, "/");
2128                         dirpath = strlen(dname);
2129                         break;
2130                 case 'R':
2131                         mapped_reads = 0;
2132                         break;
2133                 case 'S':
2134                         seed = getnum(optarg, &endp);
2135                         if (seed == 0) {
2136                                 seed = time(0) % 10000;
2137                                 seed += (int)getpid();
2138                         }
2139                         if (seed < 0)
2140                                 usage();
2141                         break;
2142                 case 'W':
2143                         mapped_writes = 0;
2144                         if (!quiet)
2145                                 prt("mapped writes DISABLED\n");
2146                         break;
2147                 case 'X':
2148                         check_file = 1;
2149                         break;
2150                 case 'Z':
2151                         o_direct = O_DIRECT;
2152                         o_flags |= O_DIRECT;
2153                         break;
2154                 case 255:  /* --record-ops */
2155                         if (optarg)
2156                                 strncpy(opsfile, optarg, sizeof(opsfile));
2157                         recordops = opsfile;
2158                         break;
2159                 case 256:  /* --replay-ops */
2160                         replayops = optarg;
2161                         break;
2162                 default:
2163                         usage();
2164                         /* NOTREACHED */
2165                 }
2166         argc -= optind;
2167         argv += optind;
2168         if (argc != 1)
2169                 usage();
2170
2171         if (integrity && !dirpath) {
2172                 fprintf(stderr, "option -i <logdev> requires -P <dirpath>\n");
2173                 usage();
2174         }
2175
2176         fname = argv[0];
2177         tmp = strdup(fname);
2178         if (!tmp) {
2179                 prterr("strdup");
2180                 exit(101);
2181         }
2182         bname = basename(tmp);
2183
2184         signal(SIGHUP,  cleanup);
2185         signal(SIGINT,  cleanup);
2186         signal(SIGPIPE, cleanup);
2187         signal(SIGALRM, cleanup);
2188         signal(SIGTERM, cleanup);
2189         signal(SIGXCPU, cleanup);
2190         signal(SIGXFSZ, cleanup);
2191         signal(SIGVTALRM,       cleanup);
2192         signal(SIGUSR1, cleanup);
2193         signal(SIGUSR2, cleanup);
2194
2195         if (!quiet && seed)
2196                 prt("Seed set to %d\n", seed);
2197         srandom(seed);
2198         fd = open(fname, o_flags, 0666);
2199         if (fd < 0) {
2200                 prterr(fname);
2201                 exit(91);
2202         }
2203         if (fstat(fd, &statbuf)) {
2204                 prterr("check_size: fstat");
2205                 exit(91);
2206         }
2207         block_size = statbuf.st_blksize;
2208 #ifdef XFS
2209         if (prealloc) {
2210                 xfs_flock64_t   resv = { 0 };
2211 #ifdef HAVE_XFS_PLATFORM_DEFS_H
2212                 if (!platform_test_xfs_fd(fd)) {
2213                         prterr(fname);
2214                         fprintf(stderr, "main: cannot prealloc, non XFS\n");
2215                         exit(96);
2216                 }
2217 #endif
2218                 resv.l_len = maxfilelen;
2219                 if ((xfsctl(fname, fd, XFS_IOC_RESVSP, &resv)) < 0) {
2220                         prterr(fname);
2221                         exit(97);
2222                 }
2223         }
2224 #endif
2225
2226         if (dirpath) {
2227                 snprintf(goodfile, sizeof(goodfile), "%s%s.fsxgood", dname, bname);
2228                 snprintf(logfile, sizeof(logfile), "%s%s.fsxlog", dname, bname);
2229                 if (!*opsfile)
2230                         snprintf(opsfile, sizeof(opsfile), "%s%s.fsxops", dname, bname);
2231         } else {
2232                 snprintf(goodfile, sizeof(goodfile), "%s.fsxgood", fname);
2233                 snprintf(logfile, sizeof(logfile), "%s.fsxlog", fname);
2234                 if (!*opsfile)
2235                         snprintf(opsfile, sizeof(opsfile), "%s.fsxops", fname);
2236         }
2237         fsxgoodfd = open(goodfile, O_RDWR|O_CREAT|O_TRUNC, 0666);
2238         if (fsxgoodfd < 0) {
2239                 prterr(goodfile);
2240                 exit(92);
2241         }
2242         fsxlogf = fopen(logfile, "w");
2243         if (fsxlogf == NULL) {
2244                 prterr(logfile);
2245                 exit(93);
2246         }
2247         unlink(opsfile);
2248
2249         if (replayops) {
2250                 replayopsf = fopen(replayops, "r");
2251                 if (!replayopsf) {
2252                         prterr(replayops);
2253                         exit(93);
2254                 }
2255         }
2256
2257 #ifdef AIO
2258         if (aio) 
2259                 aio_setup();
2260 #endif
2261
2262         if (!(o_flags & O_TRUNC)) {
2263                 off_t ret;
2264                 file_size = maxfilelen = biggest = lseek(fd, (off_t)0, SEEK_END);
2265                 if (file_size == (off_t)-1) {
2266                         prterr(fname);
2267                         warn("main: lseek eof");
2268                         exit(94);
2269                 }
2270                 ret = lseek(fd, (off_t)0, SEEK_SET);
2271                 if (ret == (off_t)-1) {
2272                         prterr(fname);
2273                         warn("main: lseek 0");
2274                         exit(95);
2275                 }
2276         }
2277         original_buf = (char *) malloc(maxfilelen);
2278         for (i = 0; i < maxfilelen; i++)
2279                 original_buf[i] = random() % 256;
2280         good_buf = (char *) malloc(maxfilelen + writebdy);
2281         good_buf = round_ptr_up(good_buf, writebdy, 0);
2282         memset(good_buf, '\0', maxfilelen);
2283         temp_buf = (char *) malloc(maxoplen + readbdy);
2284         temp_buf = round_ptr_up(temp_buf, readbdy, 0);
2285         memset(temp_buf, '\0', maxoplen);
2286         if (lite) {     /* zero entire existing file */
2287                 ssize_t written;
2288
2289                 written = write(fd, good_buf, (size_t)maxfilelen);
2290                 if (written != maxfilelen) {
2291                         if (written == -1) {
2292                                 prterr(fname);
2293                                 warn("main: error on write");
2294                         } else
2295                                 warn("main: short write, 0x%x bytes instead "
2296                                         "of 0x%lx\n",
2297                                         (unsigned)written,
2298                                         maxfilelen);
2299                         exit(98);
2300                 }
2301         } else {
2302                 ssize_t ret, len = file_size;
2303                 off_t off = 0;
2304
2305                 while (len > 0) {
2306                         ret = read(fd, good_buf + off, len);
2307                         if (ret == -1) {
2308                                 prterr(fname);
2309                                 warn("main: error on read");
2310                                 exit(98);
2311                         }
2312                         len -= ret;
2313                         off += ret;
2314                 }
2315
2316                 check_trunc_hack();
2317         }
2318
2319         if (fallocate_calls)
2320                 fallocate_calls = test_fallocate(0);
2321         if (keep_size_calls)
2322                 keep_size_calls = test_fallocate(FALLOC_FL_KEEP_SIZE);
2323         if (punch_hole_calls)
2324                 punch_hole_calls = test_fallocate(FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE);
2325         if (zero_range_calls)
2326                 zero_range_calls = test_fallocate(FALLOC_FL_ZERO_RANGE);
2327         if (collapse_range_calls)
2328                 collapse_range_calls = test_fallocate(FALLOC_FL_COLLAPSE_RANGE);
2329         if (insert_range_calls)
2330                 insert_range_calls = test_fallocate(FALLOC_FL_INSERT_RANGE);
2331
2332         while (numops == -1 || numops--)
2333                 if (!test())
2334                         break;
2335
2336         free(tmp);
2337         if (close(fd)) {
2338                 prterr("close");
2339                 report_failure(99);
2340         }
2341         prt("All %lu operations completed A-OK!\n", testcalls);
2342         if (recordops)
2343                 logdump();
2344
2345         exit(0);
2346         return 0;
2347 }