5601c70c1b89abe4b43d84ca580df0eee215a7ba
[xfstests-dev.git] / ltp / fsx.c
1 /*
2  *      Copyright (C) 1991, NeXT Computer, Inc.  All Rights Reserverd.
3  *
4  *      File:   fsx.c
5  *      Author: Avadis Tevanian, Jr.
6  *
7  *      File system exerciser. 
8  *
9  *      Rewritten 8/98 by Conrad Minshall.
10  *
11  *      Small changes to work under Linux -- davej.
12  *
13  *      Checks for mmap last-page zero fill.
14  */
15
16 #include "global.h"
17
18 #include <limits.h>
19 #include <time.h>
20 #include <strings.h>
21 #include <sys/file.h>
22 #include <sys/mman.h>
23 #include <stdbool.h>
24 #ifdef HAVE_ERR_H
25 #include <err.h>
26 #endif
27 #include <signal.h>
28 #include <stdio.h>
29 #include <stddef.h>
30 #include <stdlib.h>
31 #include <string.h>
32 #include <stdarg.h>
33 #include <errno.h>
34 #ifdef AIO
35 #include <libaio.h>
36 #endif
37
38 #ifndef MAP_FILE
39 # define MAP_FILE 0
40 #endif
41
#define NUMPRINTCOLUMNS	32	/* # columns of data to print on each line */

/*
 * Operation flags.  These are bit values; several may be OR-ed together in
 * the flags word of a log entry.
 */
enum opflags {
	FL_NONE		= 0,	/* no qualifier */
	FL_SKIPPED	= 1,	/* operation was logged but not carried out */
	FL_CLOSE_OPEN	= 2,	/* logged while "closeopen" was set */
	FL_KEEP_SIZE	= 4	/* shown as "keep_size" in the saved ops file */
};
47
48 /*
49  *      A log entry is an operation and a bunch of arguments.
50  */
51
52 struct log_entry {
53         int     operation;
54         int     args[3];
55         enum opflags flags;
56 };
57
58 #define LOGSIZE 10000
59
60 struct log_entry        oplog[LOGSIZE]; /* the log */
61 int                     logptr = 0;     /* current position in log */
62 int                     logcount = 0;   /* total ops */
63
/*
 * The operation matrix is complex due to conditional execution of different
 * features. Hence when we come to deciding what operation to run, we need to
 * be careful in how we select the different operations. The active operations
 * are mapped to numbers as follows:
 *
 *                      lite    !lite   integrity
 * READ:                0       0       0
 * WRITE:               1       1       1
 * MAPREAD:             2       2       2
 * MAPWRITE:            3       3       3
 * TRUNCATE:            -       4       4
 * FALLOCATE:           -       5       5
 * PUNCH HOLE:          -       6       6
 * ZERO RANGE:          -       7       7
 * COLLAPSE RANGE:      -       8       8
 * INSERT RANGE:        -       9       9
 * FSYNC:               -       -       10
 *
 * When mapped read/writes are disabled, they are simply converted to normal
 * reads and writes. When fallocate/fpunch calls are disabled, they are
 * skipped.
 *
 * Because of the "lite" version, we also need to have different "maximum
 * operation" defines to allow the ops to be selected correctly based on the
 * mode being run.
 */
90
/* Operations common to every mode; OP_MAX_LITE is one past the last of them. */
#define OP_READ			0
#define OP_WRITE		1
#define OP_MAPREAD		2
#define OP_MAPWRITE		3
#define OP_MAX_LITE		4

/* Operations added when not running "lite"; OP_MAX_FULL is one past the last. */
#define OP_TRUNCATE		4
#define OP_FALLOCATE		5
#define OP_PUNCH_HOLE		6
#define OP_ZERO_RANGE		7
#define OP_COLLAPSE_RANGE	8
#define OP_INSERT_RANGE		9
#define OP_MAX_FULL		10

/* Operations added in integrity mode; OP_MAX_INTEGRITY is one past the last. */
#define OP_FSYNC		10
#define OP_MAX_INTEGRITY	11

/*
 * Replace any PAGE_SIZE/PAGE_MASK already defined by a header with values
 * taken from getpagesize() each time the macro is expanded.
 */
#undef PAGE_SIZE
#define PAGE_SIZE	getpagesize()
#undef PAGE_MASK
#define PAGE_MASK	(PAGE_SIZE - 1)
115
/* Data buffers */
char *original_buf;		/* a pointer to the original data */
char *good_buf;			/* a pointer to the correct data */
char *temp_buf;			/* a pointer to the current data */

/* Names and paths */
char *fname;			/* name of our test file */
char *bname;			/* basename of our test file */
char *logdev;			/* -i flag */
char *logid;			/* -j flag */
char dname[1024];		/* -P flag */
char goodfile[PATH_MAX];
int dirpath = 0;		/* -P flag */

int fd;				/* fd for our test file */
127
blksize_t block_size = 0;
off_t file_size = 0;		/* the size fsx expects the test file to have */
off_t biggest = 0;
unsigned long testcalls = 0;	/* calls to function "test" */
132
/*
 * Run-time settings.  The flag noted beside a variable is the command-line
 * switch the original comments associate with it.
 */
unsigned long simulatedopcount = 0;	/* -b flag */
int closeprob = 0;			/* -c flag */
int debug = 0;				/* -d flag */
unsigned long debugstart = 0;		/* -D flag */
char filldata = 0;			/* -g flag */
int flush = 0;				/* -f flag */
int do_fsync = 0;			/* -y flag */
unsigned long maxfilelen = 256 * 1024;	/* -l flag */
int sizechecks = 1;			/* -n flag disables them */
int maxoplen = 64 * 1024;		/* -o flag */
int quiet = 0;				/* -q flag */
unsigned long progressinterval = 0;	/* -p flag */
int readbdy = 1;			/* -r flag */
int style = 0;				/* -s flag */
int prealloc = 0;			/* -x flag */
int truncbdy = 1;			/* -t flag */
int writebdy = 1;			/* -w flag */
long monitorstart = -1;			/* -m flag */
long monitorend = -1;			/* -m flag */
int lite = 0;				/* -L flag */
long numops = -1;			/* -N flag */
int randomoplen = 1;			/* -O flag disables it */
int seed = 1;				/* -S flag */
int mapped_writes = 1;			/* -W flag disables */
int fallocate_calls = 1;		/* -F flag disables */
int keep_size_calls = 1;		/* -K flag disables */
int punch_hole_calls = 1;		/* -H flag disables */
int zero_range_calls = 1;		/* -z flag disables */
int collapse_range_calls = 1;		/* -C flag disables */
int insert_range_calls = 1;		/* -I flag disables */
int mapped_reads = 1;			/* -R flag disables it */
int integrity = 0;			/* -i flag */
int fsxgoodfd = 0;			/* 0 means "no good-data file open" */
int o_direct;				/* -Z */
int aio = 0;
int mark_nr = 0;

int page_size;
int page_mask;
int mmap_mask;
/*
 * fsxread()/fsxwrite() take (fd, buffer, length, offset).  Without AIO they
 * expand to plain read()/write() and the offset argument is dropped; with
 * AIO all four arguments are handed to aio_rw().
 */
#ifndef AIO
#define fsxread(a,b,c,d)	read(a,b,c)
#define fsxwrite(a,b,c,d)	write(a,b,c)
#else
int aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset);
#define READ 0
#define WRITE 1
#define fsxread(a,b,c,d)	aio_rw(READ, a,b,c,d)
#define fsxwrite(a,b,c,d)	aio_rw(WRITE, a,b,c,d)
#endif
183
const char *replayops = NULL;
const char *recordops = NULL;
FILE *fsxlogf = NULL;		/* when set, prt() copies its output here */
FILE *replayopsf = NULL;
char opsfile[PATH_MAX];		/* logdump() writes the operation log here */
int badoff = -1;		/* offset of the last mismatching byte found */
int closeopen = 0;		/* when set, log4() adds FL_CLOSE_OPEN */
191
/*
 * Round ptr up to the next multiple of align, then add offset bytes.
 *
 * The rounding is done with a bit mask, so it is only meaningful when align
 * is a power of two.  A pointer that is already aligned is not moved by the
 * rounding step.
 */
static void *round_ptr_up(void *ptr, unsigned long align, unsigned long offset)
{
	unsigned long mask = align - 1;
	unsigned long addr = (unsigned long)ptr;

	addr += mask;
	addr &= ~mask;
	return (void *)(addr + offset);
}
200
201 void
202 vwarnc(int code, const char *fmt, va_list ap)
203 {
204         if (logid)
205                 fprintf(stderr, "%s: ", logid);
206         fprintf(stderr, "fsx: ");
207         if (fmt != NULL) {
208                 vfprintf(stderr, fmt, ap);
209                 fprintf(stderr, ": ");
210         }
211         fprintf(stderr, "%s\n", strerror(code));
212 }
213
/*
 * Print a printf-style warning on stderr, followed by the description of the
 * errno value that was current when warn() was called (see vwarnc()).
 */
void
warn(const char * fmt, ...)
{
	int code = errno;
	va_list ap;

	va_start(ap, fmt);
	vwarnc(code, fmt, ap);
	va_end(ap);
}
221
222 void
223 prt(const char *fmt, ...)
224 {
225         va_list args;
226
227         if (logid)
228                 fprintf(stdout, "%s: ", logid);
229         va_start(args, fmt);
230         vfprintf(stdout, fmt, args);
231         va_end(args);
232         if (fsxlogf) {
233                 va_start(args, fmt);
234                 vfprintf(fsxlogf, fmt, args);
235                 va_end(args);
236         }
237 }
238
/*
 * Report the current errno through prt() as "prefix: <error text>".
 *
 * prefix - text to print before the error description, or NULL to print the
 *          description alone.
 *
 * The original passed a NULL prefix straight to "%s" (undefined behaviour)
 * even though it already guarded the ": " separator against NULL; both
 * pieces are now guarded.
 */
void
prterr(const char *prefix)
{
	prt("%s%s%s\n", prefix ? prefix : "", prefix ? ": " : "",
	    strerror(errno));
}
244
245
246 static const char *op_names[] = {
247         [OP_READ] = "read",
248         [OP_WRITE] = "write",
249         [OP_MAPREAD] = "mapread",
250         [OP_MAPWRITE] = "mapwrite",
251         [OP_TRUNCATE] = "truncate",
252         [OP_FALLOCATE] = "fallocate",
253         [OP_PUNCH_HOLE] = "punch_hole",
254         [OP_ZERO_RANGE] = "zero_range",
255         [OP_COLLAPSE_RANGE] = "collapse_range",
256         [OP_INSERT_RANGE] = "insert_range",
257         [OP_FSYNC] = "fsync",
258 };
259
260 static const char *op_name(int operation)
261 {
262         if (operation >= 0 &&
263             operation < sizeof(op_names) / sizeof(op_names[0]))
264                 return op_names[operation];
265         return NULL;
266 }
267
268 static int op_code(const char *name)
269 {
270         int i;
271
272         for (i = 0; i < sizeof(op_names) / sizeof(op_names[0]); i++)
273                 if (op_names[i] && strcmp(name, op_names[i]) == 0)
274                         return i;
275         return -1;
276 }
277
278 void
279 log4(int operation, int arg0, int arg1, enum opflags flags)
280 {
281         struct log_entry *le;
282
283         le = &oplog[logptr];
284         le->operation = operation;
285         if (closeopen)
286                 flags |= FL_CLOSE_OPEN;
287         le->args[0] = arg0;
288         le->args[1] = arg1;
289         le->args[2] = file_size;
290         le->flags = flags;
291         logptr++;
292         logcount++;
293         if (logptr >= LOGSIZE)
294                 logptr = 0;
295 }
296
297
298 void
299 logdump(void)
300 {
301         FILE    *logopsf;
302         int     i, count, down;
303         struct log_entry        *lp;
304
305         prt("LOG DUMP (%d total operations):\n", logcount);
306
307         logopsf = fopen(opsfile, "w");
308         if (!logopsf)
309                 prterr(opsfile);
310
311         if (logcount < LOGSIZE) {
312                 i = 0;
313                 count = logcount;
314         } else {
315                 i = logptr;
316                 count = LOGSIZE;
317         }
318         for ( ; count > 0; count--) {
319                 bool overlap;
320                 int opnum;
321
322                 opnum = i+1 + (logcount/LOGSIZE)*LOGSIZE;
323                 prt("%d(%3d mod 256): ", opnum, opnum%256);
324                 lp = &oplog[i];
325
326                 overlap = badoff >= lp->args[0] &&
327                           badoff < lp->args[0] + lp->args[1];
328
329                 if (lp->flags & FL_SKIPPED) {
330                         prt("SKIPPED (no operation)");
331                         goto skipped;
332                 }
333
334                 switch (lp->operation) {
335                 case OP_MAPREAD:
336                         prt("MAPREAD  0x%x thru 0x%x\t(0x%x bytes)",
337                             lp->args[0], lp->args[0] + lp->args[1] - 1,
338                             lp->args[1]);
339                         if (overlap)
340                                 prt("\t***RRRR***");
341                         break;
342                 case OP_MAPWRITE:
343                         prt("MAPWRITE 0x%x thru 0x%x\t(0x%x bytes)",
344                             lp->args[0], lp->args[0] + lp->args[1] - 1,
345                             lp->args[1]);
346                         if (overlap)
347                                 prt("\t******WWWW");
348                         break;
349                 case OP_READ:
350                         prt("READ     0x%x thru 0x%x\t(0x%x bytes)",
351                             lp->args[0], lp->args[0] + lp->args[1] - 1,
352                             lp->args[1]);
353                         if (overlap)
354                                 prt("\t***RRRR***");
355                         break;
356                 case OP_WRITE:
357                         prt("WRITE    0x%x thru 0x%x\t(0x%x bytes)",
358                             lp->args[0], lp->args[0] + lp->args[1] - 1,
359                             lp->args[1]);
360                         if (lp->args[0] > lp->args[2])
361                                 prt(" HOLE");
362                         else if (lp->args[0] + lp->args[1] > lp->args[2])
363                                 prt(" EXTEND");
364                         overlap = (badoff >= lp->args[0] ||
365                                    badoff >=lp->args[2]) &&
366                                   badoff < lp->args[0] + lp->args[1];
367                         if (overlap)
368                                 prt("\t***WWWW");
369                         break;
370                 case OP_TRUNCATE:
371                         down = lp->args[1] < lp->args[2];
372                         prt("TRUNCATE %s\tfrom 0x%x to 0x%x",
373                             down ? "DOWN" : "UP", lp->args[2], lp->args[1]);
374                         overlap = badoff >= lp->args[1 + !down] &&
375                                   badoff < lp->args[1 + !!down];
376                         if (overlap)
377                                 prt("\t******WWWW");
378                         break;
379                 case OP_FALLOCATE:
380                         /* 0: offset 1: length 2: where alloced */
381                         prt("FALLOC   0x%x thru 0x%x\t(0x%x bytes) ",
382                                 lp->args[0], lp->args[0] + lp->args[1],
383                                 lp->args[1]);
384                         if (lp->args[0] + lp->args[1] <= lp->args[2])
385                                 prt("INTERIOR");
386                         else if (lp->flags & FL_KEEP_SIZE)
387                                 prt("PAST_EOF");
388                         else
389                                 prt("EXTENDING");
390                         if (overlap)
391                                 prt("\t******FFFF");
392                         break;
393                 case OP_PUNCH_HOLE:
394                         prt("PUNCH    0x%x thru 0x%x\t(0x%x bytes)",
395                             lp->args[0], lp->args[0] + lp->args[1] - 1,
396                             lp->args[1]);
397                         if (overlap)
398                                 prt("\t******PPPP");
399                         break;
400                 case OP_ZERO_RANGE:
401                         prt("ZERO     0x%x thru 0x%x\t(0x%x bytes)",
402                             lp->args[0], lp->args[0] + lp->args[1] - 1,
403                             lp->args[1]);
404                         if (overlap)
405                                 prt("\t******ZZZZ");
406                         break;
407                 case OP_COLLAPSE_RANGE:
408                         prt("COLLAPSE 0x%x thru 0x%x\t(0x%x bytes)",
409                             lp->args[0], lp->args[0] + lp->args[1] - 1,
410                             lp->args[1]);
411                         if (overlap)
412                                 prt("\t******CCCC");
413                         break;
414                 case OP_INSERT_RANGE:
415                         prt("INSERT 0x%x thru 0x%x\t(0x%x bytes)",
416                             lp->args[0], lp->args[0] + lp->args[1] - 1,
417                             lp->args[1]);
418                         if (overlap)
419                                 prt("\t******IIII");
420                         break;
421                 case OP_FSYNC:
422                         prt("FSYNC");
423                         break;
424                 default:
425                         prt("BOGUS LOG ENTRY (operation code = %d)!",
426                             lp->operation);
427                         continue;
428                 }
429
430             skipped:
431                 if (lp->flags & FL_CLOSE_OPEN)
432                         prt("\n\t\tCLOSE/OPEN");
433                 prt("\n");
434                 i++;
435                 if (i == LOGSIZE)
436                         i = 0;
437
438                 if (logopsf) {
439                         if (lp->flags & FL_SKIPPED)
440                                 fprintf(logopsf, "skip ");
441                         fprintf(logopsf, "%s 0x%x 0x%x 0x%x",
442                                 op_name(lp->operation),
443                                 lp->args[0], lp->args[1], lp->args[2]);
444                         if (lp->flags & FL_KEEP_SIZE)
445                                 fprintf(logopsf, " keep_size");
446                         if (lp->flags & FL_CLOSE_OPEN)
447                                 fprintf(logopsf, " close_open");
448                         if (overlap)
449                                 fprintf(logopsf, " *");
450                         fprintf(logopsf, "\n");
451                 }
452         }
453
454         if (logopsf) {
455                 if (fclose(logopsf) != 0)
456                         prterr(opsfile);
457                 else
458                         prt("Log of operations saved to \"%s\"; "
459                             "replay with --replay-ops\n",
460                             opsfile);
461         }
462 }
463
464
465 void
466 save_buffer(char *buffer, off_t bufferlength, int fd)
467 {
468         off_t ret;
469         ssize_t byteswritten;
470
471         if (fd <= 0 || bufferlength == 0)
472                 return;
473
474         if (bufferlength > SSIZE_MAX) {
475                 prt("fsx flaw: overflow in save_buffer\n");
476                 exit(67);
477         }
478         if (lite) {
479                 off_t size_by_seek = lseek(fd, (off_t)0, SEEK_END);
480                 if (size_by_seek == (off_t)-1)
481                         prterr("save_buffer: lseek eof");
482                 else if (bufferlength > size_by_seek) {
483                         warn("save_buffer: .fsxgood file too short... will save 0x%llx bytes instead of 0x%llx\n", (unsigned long long)size_by_seek,
484                              (unsigned long long)bufferlength);
485                         bufferlength = size_by_seek;
486                 }
487         }
488
489         ret = lseek(fd, (off_t)0, SEEK_SET);
490         if (ret == (off_t)-1)
491                 prterr("save_buffer: lseek 0");
492         
493         byteswritten = write(fd, buffer, (size_t)bufferlength);
494         if (byteswritten != bufferlength) {
495                 if (byteswritten == -1)
496                         prterr("save_buffer write");
497                 else
498                         warn("save_buffer: short write, 0x%x bytes instead of 0x%llx\n",
499                              (unsigned)byteswritten,
500                              (unsigned long long)bufferlength);
501         }
502 }
503
504
505 void
506 report_failure(int status)
507 {
508         logdump();
509         
510         if (fsxgoodfd) {
511                 if (good_buf) {
512                         save_buffer(good_buf, file_size, fsxgoodfd);
513                         prt("Correct content saved for comparison\n");
514                         prt("(maybe hexdump \"%s\" vs \"%s\")\n",
515                             fname, goodfile);
516                 }
517                 close(fsxgoodfd);
518         }
519         exit(status);
520 }
521
522
/*
 * The two bytes at cp read as one 16-bit value, first byte most significant.
 * The bytes are read as unsigned char regardless of the type of cp.
 */
#define short_at(cp) \
	((unsigned short)((((unsigned char *)(cp))[0] << 8) | \
			  ((unsigned char *)(cp))[1]))
525
526 void
527 mark_log(void)
528 {
529         char command[256];
530         int ret;
531
532         snprintf(command, 256, "dmsetup message %s 0 mark %s.mark%d", logdev,
533                  bname, mark_nr);
534         ret = system(command);
535         if (ret) {
536                 prterr("dmsetup mark failed");
537                 exit(211);
538         }
539 }
540
541 void
542 dump_fsync_buffer(void)
543 {
544         char fname_buffer[PATH_MAX];
545         int good_fd;
546
547         if (!good_buf)
548                 return;
549
550         snprintf(fname_buffer, sizeof(fname_buffer), "%s%s.mark%d", dname,
551                  bname, mark_nr);
552         good_fd = open(fname_buffer, O_WRONLY|O_CREAT|O_TRUNC, 0666);
553         if (good_fd < 0) {
554                 prterr(fname_buffer);
555                 exit(212);
556         }
557
558         save_buffer(good_buf, file_size, good_fd);
559         close(good_fd);
560         prt("Dumped fsync buffer to %s\n", fname_buffer + dirpath);
561 }
562
563 void
564 check_buffers(unsigned offset, unsigned size)
565 {
566         unsigned char c, t;
567         unsigned i = 0;
568         unsigned n = 0;
569         unsigned op = 0;
570         unsigned bad = 0;
571
572         if (memcmp(good_buf + offset, temp_buf, size) != 0) {
573                 prt("READ BAD DATA: offset = 0x%x, size = 0x%x, fname = %s\n",
574                     offset, size, fname);
575                 prt("OFFSET\tGOOD\tBAD\tRANGE\n");
576                 while (size > 0) {
577                         c = good_buf[offset];
578                         t = temp_buf[i];
579                         if (c != t) {
580                                 if (n < 16) {
581                                         bad = short_at(&temp_buf[i]);
582                                         prt("0x%05x\t0x%04x\t0x%04x", offset,
583                                             short_at(&good_buf[offset]), bad);
584                                         op = temp_buf[offset & 1 ? i+1 : i];
585                                         prt("\t0x%05x\n", n);
586                                         if (op)
587                                                 prt("operation# (mod 256) for "
588                                                   "the bad data may be %u\n",
589                                                 ((unsigned)op & 0xff));
590                                         else
591                                                 prt("operation# (mod 256) for "
592                                                   "the bad data unknown, check"
593                                                   " HOLE and EXTEND ops\n");
594                                 }
595                                 n++;
596                                 badoff = offset;
597                         }
598                         offset++;
599                         i++;
600                         size--;
601                 }
602                 report_failure(110);
603         }
604 }
605
606
607 void
608 check_size(void)
609 {
610         struct stat     statbuf;
611         off_t   size_by_seek;
612
613         if (fstat(fd, &statbuf)) {
614                 prterr("check_size: fstat");
615                 statbuf.st_size = -1;
616         }
617         size_by_seek = lseek(fd, (off_t)0, SEEK_END);
618         if (file_size != statbuf.st_size || file_size != size_by_seek) {
619                 prt("Size error: expected 0x%llx stat 0x%llx seek 0x%llx\n",
620                     (unsigned long long)file_size,
621                     (unsigned long long)statbuf.st_size,
622                     (unsigned long long)size_by_seek);
623                 report_failure(120);
624         }
625 }
626
627
628 void
629 check_trunc_hack(void)
630 {
631         struct stat statbuf;
632         off_t offset = file_size + (off_t)100000;
633
634         if (ftruncate(fd, file_size))
635                 goto ftruncate_err;
636         if (ftruncate(fd, offset))
637                 goto ftruncate_err;
638         fstat(fd, &statbuf);
639         if (statbuf.st_size != offset) {
640                 prt("no extend on truncate! not posix!\n");
641                 exit(130);
642         }
643         if (ftruncate(fd, file_size)) {
644 ftruncate_err:
645                 prterr("check_trunc_hack: ftruncate");
646                 exit(131);
647         }
648 }
649
650 void
651 doflush(unsigned offset, unsigned size)
652 {
653         unsigned pg_offset;
654         unsigned map_size;
655         char    *p;
656
657         if (o_direct == O_DIRECT)
658                 return;
659
660         pg_offset = offset & mmap_mask;
661         map_size  = pg_offset + size;
662
663         if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
664                               MAP_FILE | MAP_SHARED, fd,
665                               (off_t)(offset - pg_offset))) == (char *)-1) {
666                 prterr("doflush: mmap");
667                 report_failure(202);
668         }
669         if (msync(p, map_size, MS_INVALIDATE) != 0) {
670                 prterr("doflush: msync");
671                 report_failure(203);
672         }
673         if (munmap(p, map_size) != 0) {
674                 prterr("doflush: munmap");
675                 report_failure(204);
676         }
677 }
678
679 void
680 doread(unsigned offset, unsigned size)
681 {
682         off_t ret;
683         unsigned iret;
684
685         offset -= offset % readbdy;
686         if (o_direct)
687                 size -= size % readbdy;
688         if (size == 0) {
689                 if (!quiet && testcalls > simulatedopcount && !o_direct)
690                         prt("skipping zero size read\n");
691                 log4(OP_READ, offset, size, FL_SKIPPED);
692                 return;
693         }
694         if (size + offset > file_size) {
695                 if (!quiet && testcalls > simulatedopcount)
696                         prt("skipping seek/read past end of file\n");
697                 log4(OP_READ, offset, size, FL_SKIPPED);
698                 return;
699         }
700
701         log4(OP_READ, offset, size, FL_NONE);
702
703         if (testcalls <= simulatedopcount)
704                 return;
705
706         if (!quiet &&
707                 ((progressinterval && testcalls % progressinterval == 0)  ||
708                 (debug &&
709                        (monitorstart == -1 ||
710                         (offset + size > monitorstart &&
711                         (monitorend == -1 || offset <= monitorend))))))
712                 prt("%lu read\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
713                     offset, offset + size - 1, size);
714         ret = lseek(fd, (off_t)offset, SEEK_SET);
715         if (ret == (off_t)-1) {
716                 prterr("doread: lseek");
717                 report_failure(140);
718         }
719         iret = fsxread(fd, temp_buf, size, offset);
720         if (iret != size) {
721                 if (iret == -1)
722                         prterr("doread: read");
723                 else
724                         prt("short read: 0x%x bytes instead of 0x%x\n",
725                             iret, size);
726                 report_failure(141);
727         }
728         check_buffers(offset, size);
729 }
730
731
732 void
733 check_eofpage(char *s, unsigned offset, char *p, int size)
734 {
735         unsigned long last_page, should_be_zero;
736
737         if (offset + size <= (file_size & ~page_mask))
738                 return;
739         /*
740          * we landed in the last page of the file
741          * test to make sure the VM system provided 0's 
742          * beyond the true end of the file mapping
743          * (as required by mmap def in 1996 posix 1003.1)
744          */
745         last_page = ((unsigned long)p + (offset & page_mask) + size) & ~page_mask;
746
747         for (should_be_zero = last_page + (file_size & page_mask);
748              should_be_zero < last_page + page_size;
749              should_be_zero++)
750                 if (*(char *)should_be_zero) {
751                         prt("Mapped %s: non-zero data past EOF (0x%llx) page offset 0x%x is 0x%04x\n",
752                             s, file_size - 1, should_be_zero & page_mask,
753                             short_at(should_be_zero));
754                         report_failure(205);
755                 }
756 }
757
758
759 void
760 domapread(unsigned offset, unsigned size)
761 {
762         unsigned pg_offset;
763         unsigned map_size;
764         char    *p;
765
766         offset -= offset % readbdy;
767         if (size == 0) {
768                 if (!quiet && testcalls > simulatedopcount)
769                         prt("skipping zero size read\n");
770                 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
771                 return;
772         }
773         if (size + offset > file_size) {
774                 if (!quiet && testcalls > simulatedopcount)
775                         prt("skipping seek/read past end of file\n");
776                 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
777                 return;
778         }
779
780         log4(OP_MAPREAD, offset, size, FL_NONE);
781
782         if (testcalls <= simulatedopcount)
783                 return;
784
785         if (!quiet &&
786                 ((progressinterval && testcalls % progressinterval == 0) ||
787                        (debug &&
788                        (monitorstart == -1 ||
789                         (offset + size > monitorstart &&
790                         (monitorend == -1 || offset <= monitorend))))))
791                 prt("%lu mapread\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
792                     offset, offset + size - 1, size);
793
794         pg_offset = offset & PAGE_MASK;
795         map_size  = pg_offset + size;
796
797         if ((p = (char *)mmap(0, map_size, PROT_READ, MAP_SHARED, fd,
798                               (off_t)(offset - pg_offset))) == (char *)-1) {
799                 prterr("domapread: mmap");
800                 report_failure(190);
801         }
802         memcpy(temp_buf, p + pg_offset, size);
803
804         check_eofpage("Read", offset, p, size);
805
806         if (munmap(p, map_size) != 0) {
807                 prterr("domapread: munmap");
808                 report_failure(191);
809         }
810
811         check_buffers(offset, size);
812 }
813
814
815 void
816 gendata(char *original_buf, char *good_buf, unsigned offset, unsigned size)
817 {
818         while (size--) {
819                 if (filldata) {
820                         good_buf[offset] = filldata;
821                 } else {
822                         good_buf[offset] = testcalls % 256;
823                         if (offset % 2)
824                                 good_buf[offset] += original_buf[offset];
825                 }
826                 offset++;
827         }
828 }
829
830
831 void
832 dowrite(unsigned offset, unsigned size)
833 {
834         off_t ret;
835         unsigned iret;
836
837         offset -= offset % writebdy;
838         if (o_direct)
839                 size -= size % writebdy;
840         if (size == 0) {
841                 if (!quiet && testcalls > simulatedopcount && !o_direct)
842                         prt("skipping zero size write\n");
843                 log4(OP_WRITE, offset, size, FL_SKIPPED);
844                 return;
845         }
846
847         log4(OP_WRITE, offset, size, FL_NONE);
848
849         gendata(original_buf, good_buf, offset, size);
850         if (file_size < offset + size) {
851                 if (file_size < offset)
852                         memset(good_buf + file_size, '\0', offset - file_size);
853                 file_size = offset + size;
854                 if (lite) {
855                         warn("Lite file size bug in fsx!");
856                         report_failure(149);
857                 }
858         }
859
860         if (testcalls <= simulatedopcount)
861                 return;
862
863         if (!quiet &&
864                 ((progressinterval && testcalls % progressinterval == 0) ||
865                        (debug &&
866                        (monitorstart == -1 ||
867                         (offset + size > monitorstart &&
868                         (monitorend == -1 || offset <= monitorend))))))
869                 prt("%lu write\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
870                     offset, offset + size - 1, size);
871         ret = lseek(fd, (off_t)offset, SEEK_SET);
872         if (ret == (off_t)-1) {
873                 prterr("dowrite: lseek");
874                 report_failure(150);
875         }
876         iret = fsxwrite(fd, good_buf + offset, size, offset);
877         if (iret != size) {
878                 if (iret == -1)
879                         prterr("dowrite: write");
880                 else
881                         prt("short write: 0x%x bytes instead of 0x%x\n",
882                             iret, size);
883                 report_failure(151);
884         }
885         if (do_fsync) {
886                 if (fsync(fd)) {
887                         prt("fsync() failed: %s\n", strerror(errno));
888                         report_failure(152);
889                 }
890         }
891         if (flush) {
892                 doflush(offset, size);
893         }
894 }
895
896
897 void
898 domapwrite(unsigned offset, unsigned size)
899 {
900         unsigned pg_offset;
901         unsigned map_size;
902         off_t    cur_filesize;
903         char    *p;
904
905         offset -= offset % writebdy;
906         if (size == 0) {
907                 if (!quiet && testcalls > simulatedopcount)
908                         prt("skipping zero size write\n");
909                 log4(OP_MAPWRITE, offset, size, FL_SKIPPED);
910                 return;
911         }
912         cur_filesize = file_size;
913
914         log4(OP_MAPWRITE, offset, size, FL_NONE);
915
916         gendata(original_buf, good_buf, offset, size);
917         if (file_size < offset + size) {
918                 if (file_size < offset)
919                         memset(good_buf + file_size, '\0', offset - file_size);
920                 file_size = offset + size;
921                 if (lite) {
922                         warn("Lite file size bug in fsx!");
923                         report_failure(200);
924                 }
925         }
926
927         if (testcalls <= simulatedopcount)
928                 return;
929
930         if (!quiet &&
931                 ((progressinterval && testcalls % progressinterval == 0) ||
932                        (debug &&
933                        (monitorstart == -1 ||
934                         (offset + size > monitorstart &&
935                         (monitorend == -1 || offset <= monitorend))))))
936                 prt("%lu mapwrite\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
937                     offset, offset + size - 1, size);
938
939         if (file_size > cur_filesize) {
940                 if (ftruncate(fd, file_size) == -1) {
941                         prterr("domapwrite: ftruncate");
942                         exit(201);
943                 }
944         }
945         pg_offset = offset & PAGE_MASK;
946         map_size  = pg_offset + size;
947
948         if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
949                               MAP_FILE | MAP_SHARED, fd,
950                               (off_t)(offset - pg_offset))) == (char *)-1) {
951                 prterr("domapwrite: mmap");
952                 report_failure(202);
953         }
954         memcpy(p + pg_offset, good_buf + offset, size);
955         if (msync(p, map_size, MS_SYNC) != 0) {
956                 prterr("domapwrite: msync");
957                 report_failure(203);
958         }
959
960         check_eofpage("Write", offset, p, size);
961
962         if (munmap(p, map_size) != 0) {
963                 prterr("domapwrite: munmap");
964                 report_failure(204);
965         }
966 }
967
968
969 void
970 dotruncate(unsigned size)
971 {
972         int oldsize = file_size;
973
974         size -= size % truncbdy;
975         if (size > biggest) {
976                 biggest = size;
977                 if (!quiet && testcalls > simulatedopcount)
978                         prt("truncating to largest ever: 0x%x\n", size);
979         }
980
981         log4(OP_TRUNCATE, 0, size, FL_NONE);
982
983         if (size > file_size)
984                 memset(good_buf + file_size, '\0', size - file_size);
985         file_size = size;
986
987         if (testcalls <= simulatedopcount)
988                 return;
989         
990         if ((progressinterval && testcalls % progressinterval == 0) ||
991             (debug && (monitorstart == -1 || monitorend == -1 ||
992                       size <= monitorend)))
993                 prt("%lu trunc\tfrom 0x%x to 0x%x\n", testcalls, oldsize, size);
994         if (ftruncate(fd, (off_t)size) == -1) {
995                 prt("ftruncate1: %x\n", size);
996                 prterr("dotruncate: ftruncate");
997                 report_failure(160);
998         }
999 }
1000
#ifdef FALLOC_FL_PUNCH_HOLE
/*
 * Punch a hole of length bytes at offset with
 * fallocate(FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE) and zero the part of
 * good_buf that lies inside the file.
 *
 * Zero length requests and requests starting at or beyond file_size are
 * logged as skipped. Simulated operations (testcalls <= simulatedopcount)
 * are logged only.
 */
void
do_punch_hole(unsigned offset, unsigned length)
{
        unsigned hole_end;
        int zero_from = 0;
        int zero_bytes = 0;
        int show_progress;
        int show_monitor;

        if (!length) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping zero length punch hole\n");
                log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
                return;
        }

        if ((loff_t)offset >= file_size) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping hole punch off the end of the file\n");
                log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
                return;
        }

        hole_end = offset + length;

        log4(OP_PUNCH_HOLE, offset, length, FL_NONE);

        if (testcalls <= simulatedopcount)
                return;

        show_progress = progressinterval && testcalls % progressinterval == 0;
        show_monitor = debug &&
                       (monitorstart == -1 || monitorend == -1 ||
                        hole_end <= monitorend);
        if (show_progress || show_monitor) {
                prt("%lu punch\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
                        offset, hole_end, length);
        }

        if (fallocate(fd, FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE,
                      (loff_t)offset, (loff_t)length) == -1) {
                prt("punch hole: 0x%x to 0x%x\n", offset, hole_end);
                prterr("do_punch_hole: fallocate");
                report_failure(161);
        }

        /* Only the part of the hole below file_size is zeroed in good_buf. */
        zero_from = offset < file_size ? offset : file_size;
        zero_bytes = zero_from + length <= file_size ? length :
                        file_size - zero_from;
        memset(good_buf + zero_from, '\0', zero_bytes);
}

#else
/* FALLOC_FL_PUNCH_HOLE is not defined: punching holes does nothing. */
void
do_punch_hole(unsigned offset, unsigned length)
{
}
#endif
1057
#ifdef FALLOC_FL_ZERO_RANGE
/*
 * Zero length bytes at offset with fallocate(FALLOC_FL_ZERO_RANGE) and zero
 * the same range in good_buf.
 *
 * offset, length: byte range to zero.
 * keep_size: when non-zero, FALLOC_FL_KEEP_SIZE is added to the fallocate
 *            mode and FL_KEEP_SIZE is recorded in the log entry.
 *
 * A zero length request is logged as skipped. Simulated operations
 * (testcalls <= simulatedopcount) are logged only. A failing fallocate() is
 * reported through report_failure().
 */
void
do_zero_range(unsigned offset, unsigned length, int keep_size)
{
        unsigned end_offset;
        int mode = FALLOC_FL_ZERO_RANGE;

        if (length == 0) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping zero length zero range\n");
                log4(OP_ZERO_RANGE, offset, length, FL_SKIPPED |
                     (keep_size ? FL_KEEP_SIZE : FL_NONE));
                return;
        }

        /*
         * Pass the keep_size request on to the kernel; previously it was
         * only logged and the syscall never saw FALLOC_FL_KEEP_SIZE.
         */
        if (keep_size)
                mode |= FALLOC_FL_KEEP_SIZE;

        /* With keep_size the operation cannot produce a new largest size. */
        end_offset = keep_size ? 0 : offset + length;

        if (end_offset > biggest) {
                biggest = end_offset;
                if (!quiet && testcalls > simulatedopcount)
                        prt("zero_range to largest ever: 0x%x\n", end_offset);
        }

        /* The last argument carries the flags stored with the log entry. */
        log4(OP_ZERO_RANGE, offset, length,
             keep_size ? FL_KEEP_SIZE : FL_NONE);

        if (testcalls <= simulatedopcount)
                return;

        if ((progressinterval && testcalls % progressinterval == 0) ||
            (debug && (monitorstart == -1 || monitorend == -1 ||
                      end_offset <= monitorend))) {
                prt("%lu zero\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
                        offset, offset+length, length);
        }
        if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
                prt("zero range: 0x%x to 0x%x\n", offset, offset + length);
                prterr("do_zero_range: fallocate");
                report_failure(161);
        }

        memset(good_buf + offset, '\0', length);
}

#else
/* FALLOC_FL_ZERO_RANGE is not defined: zero range does nothing. */
void
do_zero_range(unsigned offset, unsigned length, int keep_size)
{
        return;
}
#endif
1115
#ifdef FALLOC_FL_COLLAPSE_RANGE
/*
 * Remove length bytes at offset with fallocate(FALLOC_FL_COLLAPSE_RANGE),
 * then shift the tail of good_buf down and shrink file_size accordingly.
 *
 * Zero length requests and requests whose end reaches file_size are logged
 * as skipped. Simulated operations (testcalls <= simulatedopcount) are
 * logged only.
 */
void
do_collapse_range(unsigned offset, unsigned length)
{
        unsigned range_end;
        int show_progress;
        int show_monitor;

        if (!length) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping zero length collapse range\n");
                log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
                return;
        }

        range_end = offset + length;
        if (file_size <= (loff_t)range_end) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping collapse range behind EOF\n");
                log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
                return;
        }

        log4(OP_COLLAPSE_RANGE, offset, length, FL_NONE);

        if (testcalls <= simulatedopcount)
                return;

        show_progress = progressinterval && testcalls % progressinterval == 0;
        show_monitor = debug &&
                       (monitorstart == -1 || monitorend == -1 ||
                        range_end <= monitorend);
        if (show_progress || show_monitor) {
                prt("%lu collapse\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
                        offset, range_end, length);
        }

        if (fallocate(fd, FALLOC_FL_COLLAPSE_RANGE, (loff_t)offset,
                      (loff_t)length) == -1) {
                prt("collapse range: 0x%x to 0x%x\n", offset, range_end);
                prterr("do_collapse_range: fallocate");
                report_failure(161);
        }

        /* Everything after the removed range moves down to offset. */
        memmove(good_buf + offset, good_buf + range_end,
                file_size - range_end);
        file_size -= length;
}

#else
/* FALLOC_FL_COLLAPSE_RANGE is not defined: collapse range does nothing. */
void
do_collapse_range(unsigned offset, unsigned length)
{
}
#endif
1167
#ifdef FALLOC_FL_INSERT_RANGE
/*
 * Insert length bytes at offset with fallocate(FALLOC_FL_INSERT_RANGE),
 * then shift the tail of good_buf up, zero the inserted range and grow
 * file_size accordingly.
 *
 * Zero length requests and requests starting at or beyond file_size are
 * logged as skipped. Simulated operations (testcalls <= simulatedopcount)
 * are logged only.
 */
void
do_insert_range(unsigned offset, unsigned length)
{
        unsigned range_end;
        int show_progress;
        int show_monitor;

        if (!length) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping zero length insert range\n");
                log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
                return;
        }

        if (file_size <= (loff_t)offset) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping insert range behind EOF\n");
                log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
                return;
        }

        log4(OP_INSERT_RANGE, offset, length, FL_NONE);

        if (testcalls <= simulatedopcount)
                return;

        range_end = offset + length;

        show_progress = progressinterval && testcalls % progressinterval == 0;
        show_monitor = debug &&
                       (monitorstart == -1 || monitorend == -1 ||
                        range_end <= monitorend);
        if (show_progress || show_monitor) {
                prt("%lu insert\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
                        offset, range_end, length);
        }

        if (fallocate(fd, FALLOC_FL_INSERT_RANGE, (loff_t)offset,
                      (loff_t)length) == -1) {
                prt("insert range: 0x%x to 0x%x\n", offset, range_end);
                prterr("do_insert_range: fallocate");
                report_failure(161);
        }

        /* Old data from offset onwards moves up; the gap reads as zeroes. */
        memmove(good_buf + range_end, good_buf + offset,
                file_size - offset);
        memset(good_buf + offset, '\0', length);
        file_size += length;
}

#else
/* FALLOC_FL_INSERT_RANGE is not defined: insert range does nothing. */
void
do_insert_range(unsigned offset, unsigned length)
{
}
#endif
1220
#ifdef HAVE_LINUX_FALLOC_H
/*
 * Preallocate length bytes at offset with fallocate().
 *
 * Without keep_size the call may extend the file: good_buf is zero filled
 * from the old file_size up to offset + length and file_size is raised.
 * With keep_size, FALLOC_FL_KEEP_SIZE is passed and file_size is left alone.
 * Zero length requests are logged as skipped; simulated operations
 * (testcalls <= simulatedopcount) update the in-memory state only.
 */
void
do_preallocate(unsigned offset, unsigned length, int keep_size)
{
        unsigned new_end;
        int mode;
        int show_progress;
        int show_monitor;

        if (!length) {
                if (!quiet && testcalls > simulatedopcount)
                        prt("skipping zero length fallocate\n");
                log4(OP_FALLOCATE, offset, length, FL_SKIPPED |
                     (keep_size ? FL_KEEP_SIZE : FL_NONE));
                return;
        }

        /* With keep_size the file can never grow, so treat the end as 0. */
        if (keep_size)
                new_end = 0;
        else
                new_end = offset + length;

        if (new_end > biggest) {
                biggest = new_end;
                if (!quiet && testcalls > simulatedopcount)
                        prt("fallocating to largest ever: 0x%x\n", new_end);
        }

        /* The last argument carries the flags stored with the log entry. */
        log4(OP_FALLOCATE, offset, length,
             keep_size ? FL_KEEP_SIZE : FL_NONE);

        if (new_end > file_size) {
                memset(good_buf + file_size, '\0', new_end - file_size);
                file_size = new_end;
        }

        if (testcalls <= simulatedopcount)
                return;

        show_progress = progressinterval && testcalls % progressinterval == 0;
        show_monitor = debug &&
                       (monitorstart == -1 || monitorend == -1 ||
                        new_end <= monitorend);
        if (show_progress || show_monitor)
                prt("%lu falloc\tfrom 0x%x to 0x%x (0x%x bytes)\n", testcalls,
                                offset, offset + length, length);

        mode = keep_size ? FALLOC_FL_KEEP_SIZE : 0;
        if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
                prt("fallocate: 0x%x to 0x%x\n", offset, offset + length);
                prterr("do_preallocate: fallocate");
                report_failure(161);
        }
}
#else
/* HAVE_LINUX_FALLOC_H is not defined: preallocation does nothing. */
void
do_preallocate(unsigned offset, unsigned length, int keep_size)
{
}
#endif
1279
1280 void
1281 writefileimage()
1282 {
1283         ssize_t iret;
1284
1285         if (lseek(fd, (off_t)0, SEEK_SET) == (off_t)-1) {
1286                 prterr("writefileimage: lseek");
1287                 report_failure(171);
1288         }
1289         iret = write(fd, good_buf, file_size);
1290         if ((off_t)iret != file_size) {
1291                 if (iret == -1)
1292                         prterr("writefileimage: write");
1293                 else
1294                         prt("short write: 0x%x bytes instead of 0x%llx\n",
1295                             iret, (unsigned long long)file_size);
1296                 report_failure(172);
1297         }
1298         if (lite ? 0 : ftruncate(fd, file_size) == -1) {
1299                 prt("ftruncate2: %llx\n", (unsigned long long)file_size);
1300                 prterr("writefileimage: ftruncate");
1301                 report_failure(173);
1302         }
1303 }
1304
1305
1306 void
1307 docloseopen(void)
1308
1309         if (testcalls <= simulatedopcount)
1310                 return;
1311
1312         if (debug)
1313                 prt("%lu close/open\n", testcalls);
1314         if (close(fd)) {
1315                 prterr("docloseopen: close");
1316                 report_failure(180);
1317         }
1318         fd = open(fname, O_RDWR|o_direct, 0);
1319         if (fd < 0) {
1320                 prterr("docloseopen: open");
1321                 report_failure(181);
1322         }
1323 }
1324
1325 void
1326 dofsync(void)
1327 {
1328         int ret;
1329
1330         if (testcalls <= simulatedopcount)
1331                 return;
1332         if (debug)
1333                 prt("%lu fsync\n", testcalls);
1334         log4(OP_FSYNC, 0, 0, 0);
1335         ret = fsync(fd);
1336         if (ret < 0) {
1337                 prterr("dofsync");
1338                 report_failure(210);
1339         }
1340         mark_log();
1341         dump_fsync_buffer();
1342         mark_nr++;
1343 }
1344
/*
 * TRIM_OFF: reduce (off) modulo (size); a zero size forces (off) to 0 so
 * that no division by zero can happen.
 */
#define TRIM_OFF(off, size)                     \
do {                                            \
        if (!(size))                            \
                (off) = 0;                      \
        else                                    \
                (off) %= (size);                \
} while (0)

/*
 * TRIM_LEN: shorten (len) so that (off) + (len) does not exceed (size).
 */
#define TRIM_LEN(off, len, size)                \
do {                                            \
        if ((size) < (off) + (len))             \
                (len) = (size) - (off);         \
} while (0)

/*
 * TRIM_OFF_LEN: apply TRIM_OFF, then TRIM_LEN with the trimmed offset.
 */
#define TRIM_OFF_LEN(off, len, size)            \
do {                                            \
        TRIM_OFF(off, size);                    \
        TRIM_LEN(off, len, size);               \
} while (0)
1364
1365 void
1366 cleanup(int sig)
1367 {
1368         if (sig)
1369                 prt("signal %d\n", sig);
1370         prt("testcalls = %lu\n", testcalls);
1371         exit(sig);
1372 }
1373
1374 static int
1375 read_op(struct log_entry *log_entry)
1376 {
1377         char line[256];
1378
1379         memset(log_entry, 0, sizeof(*log_entry));
1380         log_entry->operation = -1;
1381
1382         while (log_entry->operation == -1) {
1383                 char *str;
1384                 int i;
1385
1386                 do {
1387                         if (!fgets(line, sizeof(line), replayopsf)) {
1388                                 if (feof(replayopsf)) {
1389                                         replayopsf = NULL;
1390                                         return 0;
1391                                 }
1392                                 goto fail;
1393                         }
1394                         str = strtok(line, " \t\n");
1395                 } while (!str || str[0] == '#');
1396
1397                 if (strcmp(str, "skip") == 0) {
1398                         log_entry->flags |= FL_SKIPPED;
1399                         str = strtok(NULL, " \t\n");
1400                         if (!str)
1401                                 goto fail;
1402                 }
1403                 log_entry->operation = op_code(str);
1404                 if (log_entry->operation == -1)
1405                         goto fail;
1406                 for (i = 0; i < 3; i++) {
1407                         char *end;
1408
1409                         str = strtok(NULL, " \t\n");
1410                         if (!str)
1411                                 goto fail;
1412                         log_entry->args[i] = strtoul(str, &end, 0);
1413                         if (*end)
1414                                 goto fail;
1415                 }
1416                 while ((str = strtok(NULL, " \t\n"))) {
1417                         if (strcmp(str, "keep_size") == 0)
1418                                 log_entry->flags |= FL_KEEP_SIZE;
1419                         else if (strcmp(str, "close_open") == 0)
1420                                 log_entry->flags |= FL_CLOSE_OPEN;
1421                         else if (strcmp(str, "*") == 0)
1422                                 ;  /* overlap marker; ignore */
1423                         else
1424                                 goto fail;
1425                 }
1426         }
1427         return 1;
1428
1429 fail:
1430         fprintf(stderr, "%s: parse error\n", replayops);
1431         fclose(replayopsf);
1432         replayopsf = NULL;
1433         cleanup(100);  /* doesn't return */
1434         return 0;
1435 }
1436
1437
/*
 * Run one test step: either the next non-skipped entry of the replay file
 * or a randomly chosen operation.
 *
 * Returns 1 after an operation was dispatched (or logged as skipped) and 0
 * when replaying and read_op() has no further entry.
 */
int
test(void)
{
        unsigned long   offset;
        unsigned long   size;
        unsigned long   rv;
        unsigned long   op;
        int             keep_size = 0;

        /*
         * The simulated operations are complete: write the image built up
         * in good_buf to the file before the first real operation.
         */
        if (simulatedopcount > 0 && testcalls == simulatedopcount)
                writefileimage();

        testcalls++;

        if (debugstart > 0 && testcalls >= debugstart)
                debug = 1;

        if (!quiet && testcalls < simulatedopcount && testcalls % 100000 == 0)
                prt("%lu...\n", testcalls);

        if (replayopsf) {
                struct log_entry log_entry;

                /*
                 * Entries marked as skipped are only logged again; the
                 * first other entry supplies op, offset, size and flags.
                 */
                while (read_op(&log_entry)) {
                        if (log_entry.flags & FL_SKIPPED) {
                                log4(log_entry.operation,
                                     log_entry.args[0], log_entry.args[1],
                                     log_entry.flags);
                                continue;
                        }

                        op = log_entry.operation;
                        offset = log_entry.args[0];
                        size = log_entry.args[1];
                        closeopen = !!(log_entry.flags & FL_CLOSE_OPEN);
                        keep_size = !!(log_entry.flags & FL_KEEP_SIZE);
                        goto have_op;
                }
                return 0;
        }

        /* rv selects both the close/open decision and the operation. */
        rv = random();
        if (closeprob)
                closeopen = (rv >> 3) < (1 << 28) / closeprob;

        offset = random();
        size = maxoplen;
        if (randomoplen)
                size = random() % (maxoplen + 1);

        /* calculate appropriate op to run */
        if (lite)
                op = rv % OP_MAX_LITE;
        else if (!integrity)
                op = rv % OP_MAX_FULL;
        else
                op = rv % OP_MAX_INTEGRITY;

        /* Operation specific random parameters. */
        switch(op) {
        case OP_TRUNCATE:
                if (!style)
                        size = random() % maxfilelen;
                break;
        case OP_FALLOCATE:
                if (fallocate_calls && size && keep_size_calls)
                        keep_size = random() % 2;
                break;
        case OP_ZERO_RANGE:
                if (zero_range_calls && size && keep_size_calls)
                        keep_size = random() % 2;
                break;
        }

have_op:

        /*
         * Handle disabled operations: mapped I/O falls back to read/write,
         * the fallocate based operations are logged as skipped.
         */
        switch (op) {
        case OP_MAPREAD:
                if (!mapped_reads)
                        op = OP_READ;
                break;
        case OP_MAPWRITE:
                if (!mapped_writes)
                        op = OP_WRITE;
                break;
        case OP_FALLOCATE:
                if (!fallocate_calls) {
                        log4(OP_FALLOCATE, offset, size, FL_SKIPPED);
                        goto out;
                }
                break;
        case OP_PUNCH_HOLE:
                if (!punch_hole_calls) {
                        log4(OP_PUNCH_HOLE, offset, size, FL_SKIPPED);
                        goto out;
                }
                break;
        case OP_ZERO_RANGE:
                if (!zero_range_calls) {
                        log4(OP_ZERO_RANGE, offset, size, FL_SKIPPED);
                        goto out;
                }
                break;
        case OP_COLLAPSE_RANGE:
                if (!collapse_range_calls) {
                        log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
                        goto out;
                }
                break;
        case OP_INSERT_RANGE:
                if (!insert_range_calls) {
                        log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
                        goto out;
                }
                break;
        }

        /*
         * Trim offset and size to the limit that applies to the operation
         * (file_size or maxfilelen) and dispatch it.
         */
        switch (op) {
        case OP_READ:
                TRIM_OFF_LEN(offset, size, file_size);
                doread(offset, size);
                break;

        case OP_WRITE:
                TRIM_OFF_LEN(offset, size, maxfilelen);
                dowrite(offset, size);
                break;

        case OP_MAPREAD:
                TRIM_OFF_LEN(offset, size, file_size);
                domapread(offset, size);
                break;

        case OP_MAPWRITE:
                TRIM_OFF_LEN(offset, size, maxfilelen);
                domapwrite(offset, size);
                break;

        case OP_TRUNCATE:
                dotruncate(size);
                break;

        case OP_FALLOCATE:
                TRIM_OFF_LEN(offset, size, maxfilelen);
                do_preallocate(offset, size, keep_size);
                break;

        case OP_PUNCH_HOLE:
                TRIM_OFF_LEN(offset, size, file_size);
                do_punch_hole(offset, size);
                break;
        case OP_ZERO_RANGE:
                TRIM_OFF_LEN(offset, size, file_size);
                do_zero_range(offset, size, keep_size);
                break;
        case OP_COLLAPSE_RANGE:
                TRIM_OFF_LEN(offset, size, file_size - 1);
                /* mask both values with ~(block_size - 1) */
                offset = offset & ~(block_size - 1);
                size = size & ~(block_size - 1);
                if (size == 0) {
                        log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
                        goto out;
                }
                do_collapse_range(offset, size);
                break;
        case OP_INSERT_RANGE:
                TRIM_OFF(offset, file_size);
                /* limit size so that file_size + size stays within maxfilelen */
                TRIM_LEN(file_size, size, maxfilelen);
                offset = offset & ~(block_size - 1);
                size = size & ~(block_size - 1);
                if (size == 0) {
                        log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
                        goto out;
                }
                if (file_size + size > maxfilelen) {
                        log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
                        goto out;
                }

                do_insert_range(offset, size);
                break;
        case OP_FSYNC:
                dofsync();
                break;
        default:
                prterr("test: unknown operation");
                report_failure(42);
                break;
        }

out:
        /* Optional size check and close/open after every real operation. */
        if (sizechecks && testcalls > simulatedopcount)
                check_size();
        if (closeopen)
                docloseopen();
        return 1;
}
1634
1635
/*
 * Print the command line synopsis and option descriptions to stdout and
 * exit with status 90. Options that depend on a build-time feature (AIO,
 * HAVE_LINUX_FALLOC_H and the FALLOC_FL_* modes) are listed only when that
 * feature macro is defined.
 */
void
usage(void)
{
        fprintf(stdout, "usage: %s",
                "fsx [-dknqxAFLOWZ] [-b opnum] [-c Prob] [-g filldata] [-i logdev] [-j logid] [-l flen] [-m start:end] [-o oplen] [-p progressinterval] [-r readbdy] [-s style] [-t truncbdy] [-w writebdy] [-D startingop] [-N numops] [-P dirpath] [-S seed] fname\n\
        -b opnum: beginning operation number (default 1)\n\
        -c P: 1 in P chance of file close+open at each op (default infinity)\n\
        -d: debug output for all operations\n\
        -f flush and invalidate cache after I/O\n\
        -g X: write character X instead of random generated data\n\
        -i logdev: do integrity testing, logdev is the dm log writes device\n\
        -j logid: prefix debug log messsages with this id\n\
        -k: do not truncate existing file and use its size as upper bound on file size\n\
        -l flen: the upper bound on file size (default 262144)\n\
        -m startop:endop: monitor (print debug output) specified byte range (default 0:infinity)\n\
        -n: no verifications of file size\n\
        -o oplen: the upper bound on operation size (default 65536)\n\
        -p progressinterval: debug output at specified operation interval\n\
        -q: quieter operation\n\
        -r readbdy: 4096 would make reads page aligned (default 1)\n\
        -s style: 1 gives smaller truncates (default 0)\n\
        -t truncbdy: 4096 would make truncates page aligned (default 1)\n\
        -w writebdy: 4096 would make writes page aligned (default 1)\n\
        -x: preallocate file space before starting, XFS only (default 0)\n\
        -y synchronize changes to a file\n"

#ifdef AIO
"       -A: Use the AIO system calls\n"
#endif
"       -D startingop: debug output starting at specified operation\n"
#ifdef HAVE_LINUX_FALLOC_H
"       -F: Do not use fallocate (preallocation) calls\n"
#endif
#ifdef FALLOC_FL_PUNCH_HOLE
"       -H: Do not use punch hole calls\n"
#endif
#ifdef FALLOC_FL_ZERO_RANGE
"       -z: Do not use zero range calls\n"
#endif
#ifdef FALLOC_FL_COLLAPSE_RANGE
"       -C: Do not use collapse range calls\n"
#endif
#ifdef FALLOC_FL_INSERT_RANGE
"       -I: Do not use insert range calls\n"
#endif
"       -L: fsxLite - no file creations & no file size changes\n\
        -N numops: total # operations to do (default infinity)\n\
        -O: use oplen (see -o flag) for every op (default random)\n\
        -P: save .fsxlog .fsxops and .fsxgood files in dirpath (default ./)\n\
        -S seed: for random # generator (default 1) 0 gets timestamp\n\
        -W: mapped write operations DISabled\n\
        -R: read() system calls only (mapped reads disabled)\n\
        -Z: O_DIRECT (use -R, -W, -r and -w too)\n\
        --replay-ops opsfile: replay ops from recorded .fsxops file\n\
        --record-ops[=opsfile]: dump ops file also on success. optionally specify ops file name\n\
        fname: this filename is REQUIRED (no default)\n");
        exit(90);
}
1694
1695
/*
 * Parse a number with an optional one-letter size suffix.
 *
 * s: string to parse; the number is read by strtol() with base 0, so
 *    decimal, octal (leading 0) and hexadecimal (leading 0x) are accepted.
 * e: receives a pointer to the first character that was not consumed. A
 *    recognised suffix is consumed as well:
 *        b/B  multiply by 512
 *        k/K  multiply by 1024
 *        m/M  multiply by 1024 * 1024
 *        w/W  multiply by 4
 *
 * Returns the scaled value. A result that does not fit in an int is clamped
 * to INT_MAX or INT_MIN instead of overflowing.
 */
int
getnum(char *s, char **e)
{
        long long value;
        long long scale = 1;

        *e = (char *) 0;
        value = strtol(s, e, 0);
        if (*e) {
                switch (**e) {
                case 'b':
                case 'B':
                        scale = 512;
                        break;
                case 'k':
                case 'K':
                        scale = 1024;
                        break;
                case 'm':
                case 'M':
                        scale = 1024 * 1024;
                        break;
                case 'w':
                case 'W':
                        scale = 4;
                        break;
                default:
                        break;
                }
                /* step over a recognised suffix */
                if (scale != 1)
                        *e = *e + 1;
        }

        /* Check the range before multiplying so nothing can overflow. */
        if (value > INT_MAX / scale)
                return INT_MAX;
        if (value < INT_MIN / scale)
                return INT_MIN;
        return (int)(value * scale);
}
1728
1729 #ifdef AIO
1730
/* Queue size handed to io_queue_init() by aio_setup(). */
#define QSZ     1024
/* libaio context initialised by aio_setup() and used by __aio_rw(). */
io_context_t    io_ctx;
/* The single I/O control block that __aio_rw() prepares and submits. */
struct iocb     iocb;
1734
1735 int aio_setup()
1736 {
1737         int ret;
1738         ret = io_queue_init(QSZ, &io_ctx);
1739         if (ret != 0) {
1740                 fprintf(stderr, "aio_setup: io_queue_init failed: %s\n",
1741                         strerror(ret));
1742                 return(-1);
1743         }
1744         return(0);
1745 }
1746
1747 int
1748 __aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
1749 {
1750         struct io_event event;
1751         static struct timespec ts;
1752         struct iocb *iocbs[] = { &iocb };
1753         int ret;
1754         long res;
1755
1756         if (rw == READ) {
1757                 io_prep_pread(&iocb, fd, buf, len, offset);
1758         } else {
1759                 io_prep_pwrite(&iocb, fd, buf, len, offset);
1760         }
1761
1762         ts.tv_sec = 30;
1763         ts.tv_nsec = 0;
1764         ret = io_submit(io_ctx, 1, iocbs);
1765         if (ret != 1) {
1766                 fprintf(stderr, "errcode=%d\n", ret);
1767                 fprintf(stderr, "aio_rw: io_submit failed: %s\n",
1768                                 strerror(ret));
1769                 goto out_error;
1770         }
1771
1772         ret = io_getevents(io_ctx, 1, 1, &event, &ts);
1773         if (ret != 1) {
1774                 if (ret == 0)
1775                         fprintf(stderr, "aio_rw: no events available\n");
1776                 else {
1777                         fprintf(stderr, "errcode=%d\n", -ret);
1778                         fprintf(stderr, "aio_rw: io_getevents failed: %s\n",
1779                                         strerror(-ret));
1780                 }
1781                 goto out_error;
1782         }
1783         if (len != event.res) {
1784                 /*
1785                  * The b0rked libaio defines event.res as unsigned.
1786                  * However the kernel strucuture has it signed,
1787                  * and it's used to pass negated error value.
1788                  * Till the library is fixed use the temp var.
1789                  */
1790                 res = (long)event.res;
1791                 if (res >= 0)
1792                         fprintf(stderr, "bad io length: %lu instead of %u\n",
1793                                         res, len);
1794                 else {
1795                         fprintf(stderr, "errcode=%ld\n", -res);
1796                         fprintf(stderr, "aio_rw: async io failed: %s\n",
1797                                         strerror(-res));
1798                         ret = res;
1799                         goto out_error;
1800                 }
1801
1802         }
1803         return event.res;
1804
1805 out_error:
1806         /*
1807          * The caller expects error return in traditional libc
1808          * convention, i.e. -1 and the errno set to error.
1809          */
1810         errno = -ret;
1811         return -1;
1812 }
1813
1814 int aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
1815 {
1816         int ret;
1817
1818         if (aio) {
1819                 ret = __aio_rw(rw, fd, buf, len, offset);
1820         } else {
1821                 if (rw == READ)
1822                         ret = read(fd, buf, len);
1823                 else
1824                         ret = write(fd, buf, len);
1825         }
1826         return ret;
1827 }
1828
1829 #endif
1830
/*
 * Convenience wrapper: passes the mode expression both as a value and,
 * stringified, as the name used in the diagnostic message.
 */
#define test_fallocate(mode) __test_fallocate(mode, #mode)

/*
 * Probe whether the test file's filesystem accepts fallocate() with the
 * given mode.
 *
 * mode      flags handed to fallocate()
 * mode_str  printable form of mode, used only in the "disabling" message
 *
 * Returns 1 if the mode should stay enabled, 0 if it must be disabled.
 * The mode is disabled when running in lite mode, when fallocate() fails
 * with EOPNOTSUPP, or when the build has no fallocate support at all.
 * Any other fallocate() outcome leaves the mode enabled, and the file is
 * truncated back to file_size to undo a possible size change from the
 * probe.  A failing ftruncate() terminates the program with status 132.
 */
int
__test_fallocate(int mode, const char *mode_str)
{
#ifdef HAVE_LINUX_FALLOC_H
	int ret = 0;
	if (!lite) {
		if (fallocate(fd, mode, file_size, 1) && errno == EOPNOTSUPP) {
			if(!quiet)
				fprintf(stderr,
					"main: filesystem does not support "
					"fallocate mode %s, disabling!\n",
					mode_str);
		} else {
			ret = 1;
			if (ftruncate(fd, file_size)) {
				warn("main: ftruncate");
				exit(132);
			}
		}
	}
	return ret;
#else
	/*
	 * No fallocate support compiled in: report every mode as
	 * unavailable rather than falling off the end of a non-void
	 * function, whose result the callers store.
	 */
	(void)mode;
	(void)mode_str;
	return 0;
#endif
}
1856
/*
 * Long-only options understood by getopt_long() in main().  They have no
 * single-letter form, so each returns a value outside the char range.
 */
static struct option longopts[] = {
	{ "replay-ops", required_argument, NULL, 256 },
	{ "record-ops", optional_argument, NULL, 255 },
	{ NULL, 0, NULL, 0 }	/* end-of-table marker */
};
1862
1863 int
1864 main(int argc, char **argv)
1865 {
1866         int     i, style, ch;
1867         char    *endp, *tmp;
1868         char logfile[PATH_MAX];
1869         struct stat statbuf;
1870         int o_flags = O_RDWR|O_CREAT|O_TRUNC;
1871
1872         logfile[0] = 0;
1873         dname[0] = 0;
1874
1875         page_size = getpagesize();
1876         page_mask = page_size - 1;
1877         mmap_mask = page_mask;
1878         
1879
1880         setvbuf(stdout, (char *)0, _IOLBF, 0); /* line buffered stdout */
1881
1882         while ((ch = getopt_long(argc, argv,
1883                                  "b:c:dfg:i:j:kl:m:no:p:qr:s:t:w:xyAD:FKHzCILN:OP:RS:WZ",
1884                                  longopts, NULL)) != EOF)
1885                 switch (ch) {
1886                 case 'b':
1887                         simulatedopcount = getnum(optarg, &endp);
1888                         if (!quiet)
1889                                 prt("Will begin at operation %ld\n", simulatedopcount);
1890                         if (simulatedopcount == 0)
1891                                 usage();
1892                         simulatedopcount -= 1;
1893                         break;
1894                 case 'c':
1895                         closeprob = getnum(optarg, &endp);
1896                         if (!quiet)
1897                                 prt("Chance of close/open is 1 in %d\n", closeprob);
1898                         if (closeprob <= 0)
1899                                 usage();
1900                         break;
1901                 case 'd':
1902                         debug = 1;
1903                         break;
1904                 case 'f':
1905                         flush = 1;
1906                         break;
1907                 case 'g':
1908                         filldata = *optarg;
1909                         break;
1910                 case 'i':
1911                         integrity = 1;
1912                         logdev = strdup(optarg);
1913                         if (!logdev) {
1914                                 prterr("strdup");
1915                                 exit(101);
1916                         }
1917                         break;
1918                 case 'j':
1919                         logid = strdup(optarg);
1920                         if (!logid) {
1921                                 prterr("strdup");
1922                                 exit(101);
1923                         }
1924                         break;
1925                 case 'k':
1926                         o_flags &= ~O_TRUNC;
1927                         break;
1928                 case 'l':
1929                         maxfilelen = getnum(optarg, &endp);
1930                         if (maxfilelen <= 0)
1931                                 usage();
1932                         break;
1933                 case 'm':
1934                         monitorstart = getnum(optarg, &endp);
1935                         if (monitorstart < 0)
1936                                 usage();
1937                         if (!endp || *endp++ != ':')
1938                                 usage();
1939                         monitorend = getnum(endp, &endp);
1940                         if (monitorend < 0)
1941                                 usage();
1942                         if (monitorend == 0)
1943                                 monitorend = -1; /* aka infinity */
1944                         debug = 1;
1945                 case 'n':
1946                         sizechecks = 0;
1947                         break;
1948                 case 'o':
1949                         maxoplen = getnum(optarg, &endp);
1950                         if (maxoplen <= 0)
1951                                 usage();
1952                         break;
1953                 case 'p':
1954                         progressinterval = getnum(optarg, &endp);
1955                         if (progressinterval == 0)
1956                                 usage();
1957                         break;
1958                 case 'q':
1959                         quiet = 1;
1960                         break;
1961                 case 'r':
1962                         readbdy = getnum(optarg, &endp);
1963                         if (readbdy <= 0)
1964                                 usage();
1965                         break;
1966                 case 's':
1967                         style = getnum(optarg, &endp);
1968                         if (style < 0 || style > 1)
1969                                 usage();
1970                         break;
1971                 case 't':
1972                         truncbdy = getnum(optarg, &endp);
1973                         if (truncbdy <= 0)
1974                                 usage();
1975                         break;
1976                 case 'w':
1977                         writebdy = getnum(optarg, &endp);
1978                         if (writebdy <= 0)
1979                                 usage();
1980                         break;
1981                 case 'x':
1982                         prealloc = 1;
1983                         break;
1984                 case 'y':
1985                         do_fsync = 1;
1986                         break;
1987                 case 'A':
1988                         aio = 1;
1989                         break;
1990                 case 'D':
1991                         debugstart = getnum(optarg, &endp);
1992                         if (debugstart < 1)
1993                                 usage();
1994                         break;
1995                 case 'F':
1996                         fallocate_calls = 0;
1997                         break;
1998                 case 'K':
1999                         keep_size_calls = 0;
2000                         break;
2001                 case 'H':
2002                         punch_hole_calls = 0;
2003                         break;
2004                 case 'z':
2005                         zero_range_calls = 0;
2006                         break;
2007                 case 'C':
2008                         collapse_range_calls = 0;
2009                         break;
2010                 case 'I':
2011                         insert_range_calls = 0;
2012                         break;
2013                 case 'L':
2014                         lite = 1;
2015                         o_flags &= ~(O_CREAT|O_TRUNC);
2016                         break;
2017                 case 'N':
2018                         numops = getnum(optarg, &endp);
2019                         if (numops < 0)
2020                                 usage();
2021                         break;
2022                 case 'O':
2023                         randomoplen = 0;
2024                         break;
2025                 case 'P':
2026                         strncpy(dname, optarg, sizeof(dname));
2027                         strcat(dname, "/");
2028                         dirpath = strlen(dname);
2029                         break;
2030                 case 'R':
2031                         mapped_reads = 0;
2032                         break;
2033                 case 'S':
2034                         seed = getnum(optarg, &endp);
2035                         if (seed == 0) {
2036                                 seed = time(0) % 10000;
2037                                 seed += (int)getpid();
2038                         }
2039                         if (seed < 0)
2040                                 usage();
2041                         break;
2042                 case 'W':
2043                         mapped_writes = 0;
2044                         if (!quiet)
2045                                 prt("mapped writes DISABLED\n");
2046                         break;
2047                 case 'Z':
2048                         o_direct = O_DIRECT;
2049                         o_flags |= O_DIRECT;
2050                         break;
2051                 case 255:  /* --record-ops */
2052                         if (optarg)
2053                                 strncpy(opsfile, optarg, sizeof(opsfile));
2054                         recordops = opsfile;
2055                         break;
2056                 case 256:  /* --replay-ops */
2057                         replayops = optarg;
2058                         break;
2059                 default:
2060                         usage();
2061                         /* NOTREACHED */
2062                 }
2063         argc -= optind;
2064         argv += optind;
2065         if (argc != 1)
2066                 usage();
2067
2068         if (integrity && !dirpath) {
2069                 fprintf(stderr, "option -i <logdev> requires -P <dirpath>\n");
2070                 usage();
2071         }
2072
2073         fname = argv[0];
2074         tmp = strdup(fname);
2075         if (!tmp) {
2076                 prterr("strdup");
2077                 exit(101);
2078         }
2079         bname = basename(tmp);
2080
2081         signal(SIGHUP,  cleanup);
2082         signal(SIGINT,  cleanup);
2083         signal(SIGPIPE, cleanup);
2084         signal(SIGALRM, cleanup);
2085         signal(SIGTERM, cleanup);
2086         signal(SIGXCPU, cleanup);
2087         signal(SIGXFSZ, cleanup);
2088         signal(SIGVTALRM,       cleanup);
2089         signal(SIGUSR1, cleanup);
2090         signal(SIGUSR2, cleanup);
2091
2092         if (!quiet && seed)
2093                 prt("Seed set to %d\n", seed);
2094         srandom(seed);
2095         fd = open(fname, o_flags, 0666);
2096         if (fd < 0) {
2097                 prterr(fname);
2098                 exit(91);
2099         }
2100         if (fstat(fd, &statbuf)) {
2101                 prterr("check_size: fstat");
2102                 exit(91);
2103         }
2104         block_size = statbuf.st_blksize;
2105 #ifdef XFS
2106         if (prealloc) {
2107                 xfs_flock64_t   resv = { 0 };
2108 #ifdef HAVE_XFS_PLATFORM_DEFS_H
2109                 if (!platform_test_xfs_fd(fd)) {
2110                         prterr(fname);
2111                         fprintf(stderr, "main: cannot prealloc, non XFS\n");
2112                         exit(96);
2113                 }
2114 #endif
2115                 resv.l_len = maxfilelen;
2116                 if ((xfsctl(fname, fd, XFS_IOC_RESVSP, &resv)) < 0) {
2117                         prterr(fname);
2118                         exit(97);
2119                 }
2120         }
2121 #endif
2122
2123         if (dirpath) {
2124                 snprintf(goodfile, sizeof(goodfile), "%s%s.fsxgood", dname, bname);
2125                 snprintf(logfile, sizeof(logfile), "%s%s.fsxlog", dname, bname);
2126                 if (!*opsfile)
2127                         snprintf(opsfile, sizeof(opsfile), "%s%s.fsxops", dname, bname);
2128         } else {
2129                 snprintf(goodfile, sizeof(goodfile), "%s.fsxgood", fname);
2130                 snprintf(logfile, sizeof(logfile), "%s.fsxlog", fname);
2131                 if (!*opsfile)
2132                         snprintf(opsfile, sizeof(opsfile), "%s.fsxops", fname);
2133         }
2134         fsxgoodfd = open(goodfile, O_RDWR|O_CREAT|O_TRUNC, 0666);
2135         if (fsxgoodfd < 0) {
2136                 prterr(goodfile);
2137                 exit(92);
2138         }
2139         fsxlogf = fopen(logfile, "w");
2140         if (fsxlogf == NULL) {
2141                 prterr(logfile);
2142                 exit(93);
2143         }
2144         unlink(opsfile);
2145
2146         if (replayops) {
2147                 replayopsf = fopen(replayops, "r");
2148                 if (!replayopsf) {
2149                         prterr(replayops);
2150                         exit(93);
2151                 }
2152         }
2153
2154 #ifdef AIO
2155         if (aio) 
2156                 aio_setup();
2157 #endif
2158
2159         if (!(o_flags & O_TRUNC)) {
2160                 off_t ret;
2161                 file_size = maxfilelen = biggest = lseek(fd, (off_t)0, SEEK_END);
2162                 if (file_size == (off_t)-1) {
2163                         prterr(fname);
2164                         warn("main: lseek eof");
2165                         exit(94);
2166                 }
2167                 ret = lseek(fd, (off_t)0, SEEK_SET);
2168                 if (ret == (off_t)-1) {
2169                         prterr(fname);
2170                         warn("main: lseek 0");
2171                         exit(95);
2172                 }
2173         }
2174         original_buf = (char *) malloc(maxfilelen);
2175         for (i = 0; i < maxfilelen; i++)
2176                 original_buf[i] = random() % 256;
2177         good_buf = (char *) malloc(maxfilelen + writebdy);
2178         good_buf = round_ptr_up(good_buf, writebdy, 0);
2179         memset(good_buf, '\0', maxfilelen);
2180         temp_buf = (char *) malloc(maxoplen + readbdy);
2181         temp_buf = round_ptr_up(temp_buf, readbdy, 0);
2182         memset(temp_buf, '\0', maxoplen);
2183         if (lite) {     /* zero entire existing file */
2184                 ssize_t written;
2185
2186                 written = write(fd, good_buf, (size_t)maxfilelen);
2187                 if (written != maxfilelen) {
2188                         if (written == -1) {
2189                                 prterr(fname);
2190                                 warn("main: error on write");
2191                         } else
2192                                 warn("main: short write, 0x%x bytes instead "
2193                                         "of 0x%lx\n",
2194                                         (unsigned)written,
2195                                         maxfilelen);
2196                         exit(98);
2197                 }
2198         } else {
2199                 ssize_t ret, len = file_size;
2200                 off_t off = 0;
2201
2202                 while (len > 0) {
2203                         ret = read(fd, good_buf + off, len);
2204                         if (ret == -1) {
2205                                 prterr(fname);
2206                                 warn("main: error on read");
2207                                 exit(98);
2208                         }
2209                         len -= ret;
2210                         off += ret;
2211                 }
2212
2213                 check_trunc_hack();
2214         }
2215
2216         if (fallocate_calls)
2217                 fallocate_calls = test_fallocate(0);
2218         if (keep_size_calls)
2219                 keep_size_calls = test_fallocate(FALLOC_FL_KEEP_SIZE);
2220         if (punch_hole_calls)
2221                 punch_hole_calls = test_fallocate(FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE);
2222         if (zero_range_calls)
2223                 zero_range_calls = test_fallocate(FALLOC_FL_ZERO_RANGE);
2224         if (collapse_range_calls)
2225                 collapse_range_calls = test_fallocate(FALLOC_FL_COLLAPSE_RANGE);
2226         if (insert_range_calls)
2227                 insert_range_calls = test_fallocate(FALLOC_FL_INSERT_RANGE);
2228
2229         while (numops == -1 || numops--)
2230                 if (!test())
2231                         break;
2232
2233         free(tmp);
2234         if (close(fd)) {
2235                 prterr("close");
2236                 report_failure(99);
2237         }
2238         prt("All %lu operations completed A-OK!\n", testcalls);
2239         if (recordops)
2240                 logdump();
2241
2242         exit(0);
2243         return 0;
2244 }