2 * Copyright (C) 1991, NeXT Computer, Inc. All Rights Reserved.
5 * Author: Avadis Tevanian, Jr.
7 * File system exerciser.
9 * Rewritten 8/98 by Conrad Minshall.
11 * Small changes to work under Linux -- davej.
13 * Checks for mmap last-page zero fill.
40 #include <sys/syscall.h>
46 #define NUMPRINTCOLUMNS 32 /* # columns of data to print on each line */
/*
 * Flag bits stored with each logged operation. The values are distinct
 * powers of two so that several can be OR-ed into one flags word:
 *   FL_SKIPPED    - the log dump prints the entry as "SKIPPED (no operation)"
 *   FL_CLOSE_OPEN - the log dump prints "CLOSE/OPEN" for the entry
 *   FL_KEEP_SIZE  - the ops file gets a "keep_size" token for the entry
 */
50 enum opflags { FL_NONE = 0, FL_SKIPPED = 1, FL_CLOSE_OPEN = 2, FL_KEEP_SIZE = 4 };
53 * A log entry is an operation and a bunch of arguments.
/*
 * Storage for the operation log. log4() and log5() test logptr against
 * LOGSIZE, and logdump() uses logcount to tell whether fewer than LOGSIZE
 * operations have been recorded.
 */
65 struct log_entry oplog[LOGSIZE]; /* the log */
66 int logptr = 0; /* current position in log */
67 int logcount = 0; /* total ops */
70 * The operation matrix is complex due to conditional execution of different
71 * features. Hence when we come to deciding what operation to run, we need to
72 * be careful in how we select the different operations. The active operations
73 * are mapped to numbers as follows:
75 * lite !lite integrity
84 * COLLAPSE RANGE: - 8 8
87 * When mapped read/writes are disabled, they are simply converted to normal
88 * reads and writes. When fallocate/fpunch calls are disabled, they are
91 * Because of the "lite" version, we also need to have different "maximum
92 * operation" defines to allow the ops to be selected correctly based on the
97 /* common operations */
104 /* !lite operations */
105 OP_TRUNCATE = OP_MAX_LITE,
116 /* integrity operations */
117 OP_FSYNC = OP_MAX_FULL,
/*
 * PAGE_SIZE expands to a getpagesize() call at every use; it is not a
 * compile-time constant. PAGE_MASK is used to extract the within-page part
 * of an offset, which relies on the page size being a power of two.
 */
122 #define PAGE_SIZE getpagesize()
124 #define PAGE_MASK (PAGE_SIZE - 1)
/*
 * Global test state and run-time tunables. Where a variable is controlled
 * from the command line, its trailing comment names the option letter.
 */
126 char *original_buf; /* a pointer to the original data */
127 char *good_buf; /* a pointer to the correct data */
128 char *temp_buf; /* a pointer to the current data */
129 char *fname; /* name of our test file */
130 char *bname; /* basename of our test file */
131 char *logdev; /* -i flag */
132 char *logid; /* -j flag */
133 char dname[1024]; /* -P flag */
134 char goodfile[PATH_MAX];
135 int dirpath = 0; /* -P flag */
136 int fd; /* fd for our test file */
/* test_dedupe_range() uses block_size as the length of its probe request. */
138 blksize_t block_size = 0;
/* testcalls is a long long: print it with %lld. */
141 long long testcalls = 0; /* calls to function "test" */
143 long long simulatedopcount = 0; /* -b flag */
144 int closeprob = 0; /* -c flag */
145 int debug = 0; /* -d flag */
146 long long debugstart = 0; /* -D flag */
147 char filldata = 0; /* -g flag */
148 int flush = 0; /* -f flag */
149 int do_fsync = 0; /* -y flag */
150 unsigned long maxfilelen = 256 * 1024; /* -l flag */
151 int sizechecks = 1; /* -n flag disables them */
152 int maxoplen = 64 * 1024; /* -o flag */
153 int quiet = 0; /* -q flag */
154 long long progressinterval = 0; /* -p flag */
155 int readbdy = 1; /* -r flag */
156 int style = 0; /* -s flag */
157 int prealloc = 0; /* -x flag */
158 int truncbdy = 1; /* -t flag */
159 int writebdy = 1; /* -w flag */
160 long monitorstart = -1; /* -m flag */
161 long monitorend = -1; /* -m flag */
162 int lite = 0; /* -L flag */
163 long long numops = -1; /* -N flag */
164 int randomoplen = 1; /* -O flag disables it */
165 int seed = 1; /* -S flag */
166 int mapped_writes = 1; /* -W flag disables */
167 int fallocate_calls = 1; /* -F flag disables */
168 int keep_size_calls = 1; /* -K flag disables */
169 int punch_hole_calls = 1; /* -H flag disables */
170 int zero_range_calls = 1; /* -z flag disables */
171 int collapse_range_calls = 1; /* -C flag disables */
172 int insert_range_calls = 1; /* -I flag disables */
173 int mapped_reads = 1; /* -R flag disables it */
174 int check_file = 0; /* -X flag enables */
175 int clone_range_calls = 1; /* -J flag disables */
176 int dedupe_range_calls = 1; /* -B flag disables */
177 int copy_range_calls = 1; /* -E flag disables */
178 int integrity = 0; /* -i flag */
/* doflush() compares o_direct against O_DIRECT. */
180 int o_direct; /* -Z */
/*
 * fsxread() and fsxwrite() forward their four arguments (fd, buffer,
 * length, offset) to fsx_rw() with READ or WRITE as the first argument.
 */
188 int fsx_rw(int rw, int fd, char *buf, unsigned len, unsigned offset);
191 #define fsxread(a,b,c,d) fsx_rw(READ, a,b,c,d)
192 #define fsxwrite(a,b,c,d) fsx_rw(WRITE, a,b,c,d)
/*
 * Operation record/replay state. logdump() opens the file named by opsfile
 * for writing, and prt() formats its message into fsxlogf.
 * NOTE(review): where replayops, recordops and replayopsf are set and
 * consumed is not visible in this excerpt.
 */
194 const char *replayops = NULL;
195 const char *recordops = NULL;
196 FILE * fsxlogf = NULL;
197 FILE * replayopsf = NULL;
198 char opsfile[PATH_MAX];
/*
 * round_ptr_up: round the address in ptr up to the next multiple of align.
 * The mask form used below only yields a true multiple when align is a
 * power of two.
 * NOTE(review): how the offset parameter is applied, and the return
 * statement, are not visible in this excerpt.
 */
202 static void *round_ptr_up(void *ptr, unsigned long align, unsigned long offset)
204 unsigned long ret = (unsigned long)ptr;
206 ret = ((ret + align - 1) & ~(align - 1));
/*
 * vwarnc: write a warning to stderr. The visible output pieces are, in
 * order: the logid prefix, the literal "fsx: ", the caller's formatted
 * message, a ": " separator, and strerror(code) followed by a newline.
 * NOTE(review): the conditions guarding the individual pieces are not
 * visible in this excerpt.
 */
212 vwarnc(int code, const char *fmt, va_list ap)
215 fprintf(stderr, "%s: ", logid);
216 fprintf(stderr, "fsx: ");
218 vfprintf(stderr, fmt, ap);
219 fprintf(stderr, ": ");
221 fprintf(stderr, "%s\n", strerror(code));
/*
 * warn: printf-style warning that hands the current errno to vwarnc(), so
 * the message is followed by the text for that errno.
 */
225 warn(const char * fmt, ...) {
228 vwarnc(errno, fmt, ap);
/*
 * prt: printf-style reporting helper. The message is formatted to stdout,
 * where a "<logid>: " prefix can precede it, and is also formatted into
 * the fsxlogf stream.
 * NOTE(review): the guards around the prefix and around the fsxlogf copy
 * are not visible in this excerpt.
 */
233 prt(const char *fmt, ...)
238 fprintf(stdout, "%s: ", logid);
240 vfprintf(stdout, fmt, args);
244 vfprintf(fsxlogf, fmt, args);
/*
 * prterr: report the current errno through prt() as "<prefix>: <error text>".
 * prefix may be NULL, in which case only the error text is printed.
 */
250 prterr(const char *prefix)
/*
 * The separator was already conditional on prefix being non-NULL, but the
 * prefix itself was passed straight to %s; a NULL there is undefined
 * behaviour, so substitute an empty string.
 */
252 prt("%s%s%s\n", prefix ? prefix : "", prefix ? ": " : "", strerror(errno));
/*
 * Lower-case name of each operation, indexed by its OP_* enumerator through
 * designated initializers. op_name() and op_code() translate between the
 * two representations; the ops file written by logdump() uses these names.
 */
256 static const char *op_names[] = {
258 [OP_WRITE] = "write",
259 [OP_MAPREAD] = "mapread",
260 [OP_MAPWRITE] = "mapwrite",
261 [OP_TRUNCATE] = "truncate",
262 [OP_FALLOCATE] = "fallocate",
263 [OP_PUNCH_HOLE] = "punch_hole",
264 [OP_ZERO_RANGE] = "zero_range",
265 [OP_COLLAPSE_RANGE] = "collapse_range",
266 [OP_INSERT_RANGE] = "insert_range",
267 [OP_CLONE_RANGE] = "clone_range",
268 [OP_DEDUPE_RANGE] = "dedupe_range",
269 [OP_COPY_RANGE] = "copy_range",
270 [OP_FSYNC] = "fsync",
/*
 * op_name: return the op_names[] entry for an operation code that lies
 * inside the table. The explicit ">= 0" test comes first because the
 * sizeof-based bound is unsigned.
 * NOTE(review): the result for an out-of-range code is not visible in this
 * excerpt.
 */
273 static const char *op_name(int operation)
275 if (operation >= 0 &&
276 operation < sizeof(op_names) / sizeof(op_names[0]))
277 return op_names[operation];
/*
 * op_code: inverse of op_name(). Scans op_names[] for an entry equal to
 * name, skipping NULL slots left by the designated initializers.
 * NOTE(review): the values returned on a match and on no match are not
 * visible in this excerpt.
 */
281 static int op_code(const char *name)
285 for (i = 0; i < sizeof(op_names) / sizeof(op_names[0]); i++)
286 if (op_names[i] && strcmp(name, op_names[i]) == 0)
/*
 * log5: record an operation that takes three arguments (arg0..arg2) in the
 * operation log. The current file_size is stored as the fourth argument,
 * FL_CLOSE_OPEN can be added to the caller's flags, and logptr is tested
 * against LOGSIZE.
 * NOTE(review): the condition for FL_CLOSE_OPEN and the remaining field
 * assignments are not visible in this excerpt.
 */
292 log5(int operation, int arg0, int arg1, int arg2, enum opflags flags)
294 struct log_entry *le;
297 le->operation = operation;
299 flags |= FL_CLOSE_OPEN;
303 le->args[3] = file_size;
308 if (logptr >= LOGSIZE)
/*
 * log4: record an operation that takes two arguments (arg0, arg1) in the
 * operation log. The current file_size is stored as the third argument,
 * FL_CLOSE_OPEN can be added to the caller's flags, and logptr is tested
 * against LOGSIZE.
 * NOTE(review): the condition for FL_CLOSE_OPEN and the remaining field
 * assignments are not visible in this excerpt.
 */
313 log4(int operation, int arg0, int arg1, enum opflags flags)
315 struct log_entry *le;
318 le->operation = operation;
320 flags |= FL_CLOSE_OPEN;
323 le->args[2] = file_size;
328 if (logptr >= LOGSIZE)
/*
 * logdump body: print the recorded operations in human-readable form via
 * prt() and write a replayable copy of each entry to the file named by
 * opsfile.
 *
 * For each entry, `overlap` records whether badoff (declared outside this
 * excerpt) lies inside the byte range the operation touched. For the
 * two-range operations (clone, dedupe, copy), `overlap2` does the same for
 * the destination range.
 * NOTE(review): the code that consumes overlap/overlap2 is mostly not
 * visible in this excerpt.
 */
337 struct log_entry *lp;
339 prt("LOG DUMP (%d total operations):\n", logcount);
341 logopsf = fopen(opsfile, "w");
/* Fewer than LOGSIZE entries have been logged in total. */
345 if (logcount < LOGSIZE) {
352 for ( ; count > 0; count--) {
353 bool overlap, overlap2;
/* Rebuild the operation number from the slot index and logcount. */
356 opnum = i+1 + (logcount/LOGSIZE)*LOGSIZE;
357 prt("%d(%3d mod 256): ", opnum, opnum%256);
/* Default overlap test: args[0] is the offset, args[1] the length. */
360 overlap = badoff >= lp->args[0] &&
361 badoff < lp->args[0] + lp->args[1];
363 if (lp->flags & FL_SKIPPED) {
364 prt("SKIPPED (no operation)");
368 switch (lp->operation) {
370 prt("MAPREAD 0x%x thru 0x%x\t(0x%x bytes)",
371 lp->args[0], lp->args[0] + lp->args[1] - 1,
377 prt("MAPWRITE 0x%x thru 0x%x\t(0x%x bytes)",
378 lp->args[0], lp->args[0] + lp->args[1] - 1,
384 prt("READ 0x%x thru 0x%x\t(0x%x bytes)",
385 lp->args[0], lp->args[0] + lp->args[1] - 1,
391 prt("WRITE 0x%x thru 0x%x\t(0x%x bytes)",
392 lp->args[0], lp->args[0] + lp->args[1] - 1,
/* args[2] is the file size that log4() captured with the entry. */
394 if (lp->args[0] > lp->args[2])
396 else if (lp->args[0] + lp->args[1] > lp->args[2])
398 overlap = (badoff >= lp->args[0] ||
399 badoff >=lp->args[2]) &&
400 badoff < lp->args[0] + lp->args[1];
/* Truncate entries: args[1] is the new size, args[2] the old size. */
405 down = lp->args[1] < lp->args[2];
406 prt("TRUNCATE %s\tfrom 0x%x to 0x%x",
407 down ? "DOWN" : "UP", lp->args[2], lp->args[1]);
/* The affected range runs from the smaller to the larger of the two sizes. */
408 overlap = badoff >= lp->args[1 + !down] &&
409 badoff < lp->args[1 + !!down];
414 /* 0: offset 1: length 2: where alloced */
415 prt("FALLOC 0x%x thru 0x%x\t(0x%x bytes) ",
416 lp->args[0], lp->args[0] + lp->args[1],
418 if (lp->args[0] + lp->args[1] <= lp->args[2])
420 else if (lp->flags & FL_KEEP_SIZE)
428 prt("PUNCH 0x%x thru 0x%x\t(0x%x bytes)",
429 lp->args[0], lp->args[0] + lp->args[1] - 1,
435 prt("ZERO 0x%x thru 0x%x\t(0x%x bytes)",
436 lp->args[0], lp->args[0] + lp->args[1] - 1,
441 case OP_COLLAPSE_RANGE:
442 prt("COLLAPSE 0x%x thru 0x%x\t(0x%x bytes)",
443 lp->args[0], lp->args[0] + lp->args[1] - 1,
448 case OP_INSERT_RANGE:
449 prt("INSERT 0x%x thru 0x%x\t(0x%x bytes)",
450 lp->args[0], lp->args[0] + lp->args[1] - 1,
/* Two-range operations: args[2] is the destination offset. */
456 prt("CLONE 0x%x thru 0x%x\t(0x%x bytes) to 0x%x thru 0x%x",
457 lp->args[0], lp->args[0] + lp->args[1] - 1,
459 lp->args[2], lp->args[2] + lp->args[1] - 1);
460 overlap2 = badoff >= lp->args[2] &&
461 badoff < lp->args[2] + lp->args[1];
462 if (overlap && overlap2)
469 case OP_DEDUPE_RANGE:
470 prt("DEDUPE 0x%x thru 0x%x\t(0x%x bytes) to 0x%x thru 0x%x",
471 lp->args[0], lp->args[0] + lp->args[1] - 1,
473 lp->args[2], lp->args[2] + lp->args[1] - 1);
474 overlap2 = badoff >= lp->args[2] &&
475 badoff < lp->args[2] + lp->args[1];
476 if (overlap && overlap2)
484 prt("COPY 0x%x thru 0x%x\t(0x%x bytes) to 0x%x thru 0x%x",
485 lp->args[0], lp->args[0] + lp->args[1] - 1,
487 lp->args[2], lp->args[2] + lp->args[1] - 1);
488 overlap2 = badoff >= lp->args[2] &&
489 badoff < lp->args[2] + lp->args[1];
490 if (overlap && overlap2)
501 prt("BOGUS LOG ENTRY (operation code = %d)!",
507 if (lp->flags & FL_CLOSE_OPEN)
508 prt("\n\t\tCLOSE/OPEN");
/*
 * Ops-file line: optional "skip", the operation name, each argument in
 * hex, then optional "keep_size" / "close_open" / " *" tokens.
 */
517 if (lp->flags & FL_SKIPPED)
518 fprintf(logopsf, "skip ");
519 fprintf(logopsf, "%s", op_name(lp->operation));
520 for (j = 0; j < lp->nr_args; j++)
521 fprintf(logopsf, " 0x%x", lp->args[j]);
522 if (lp->flags & FL_KEEP_SIZE)
523 fprintf(logopsf, " keep_size");
524 if (lp->flags & FL_CLOSE_OPEN)
525 fprintf(logopsf, " close_open");
527 fprintf(logopsf, " *");
528 fprintf(logopsf, "\n");
/* fclose() is checked because it flushes the buffered ops file. */
533 if (fclose(logopsf) != 0)
536 prt("Log of operations saved to \"%s\"; "
537 "replay with --replay-ops\n",
/*
 * save_buffer: write bufferlength bytes of buffer to the start of the file
 * open on fd.
 *
 * The visible steps are: reject a non-positive fd or an empty buffer;
 * reject lengths above SSIZE_MAX; measure the file with lseek(SEEK_END) and
 * clamp bufferlength to that size when the file is shorter; seek back to
 * offset 0; write, reporting both failed and short writes.
 * NOTE(review): the statements taken after each rejection, and any guard
 * around the size-by-seek clamp, are not visible in this excerpt.
 */
544 save_buffer(char *buffer, off_t bufferlength, int fd)
547 ssize_t byteswritten;
549 if (fd <= 0 || bufferlength == 0)
552 if (bufferlength > SSIZE_MAX) {
553 prt("fsx flaw: overflow in save_buffer\n");
557 off_t size_by_seek = lseek(fd, (off_t)0, SEEK_END);
558 if (size_by_seek == (off_t)-1)
559 prterr("save_buffer: lseek eof");
560 else if (bufferlength > size_by_seek) {
561 warn("save_buffer: .fsxgood file too short... will save 0x%llx bytes instead of 0x%llx\n", (unsigned long long)size_by_seek,
562 (unsigned long long)bufferlength);
563 bufferlength = size_by_seek;
567 ret = lseek(fd, (off_t)0, SEEK_SET);
568 if (ret == (off_t)-1)
569 prterr("save_buffer: lseek 0");
571 byteswritten = write(fd, buffer, (size_t)bufferlength);
572 if (byteswritten != bufferlength) {
/* write() returned -1: report errno; any other mismatch is a short write. */
573 if (byteswritten == -1)
574 prterr("save_buffer write");
576 warn("save_buffer: short write, 0x%x bytes instead of 0x%llx\n",
577 (unsigned)byteswritten,
578 (unsigned long long)bufferlength);
/*
 * report_failure: failure path used by the operation functions. The
 * visible part saves the first file_size bytes of good_buf through
 * fsxgoodfd and tells the user which two files to compare.
 * NOTE(review): what is done with status, and the remaining steps, are not
 * visible in this excerpt.
 */
584 report_failure(int status)
590 save_buffer(good_buf, file_size, fsxgoodfd);
591 prt("Correct content saved for comparison\n");
592 prt("(maybe hexdump \"%s\" vs \"%s\")\n",
/*
 * short_at(cp): combine the two bytes at cp into an unsigned short, with
 * the first byte as the high-order eight bits. The bytes are read as
 * unsigned char so no sign extension occurs.
 */
601 #define short_at(cp) ((unsigned short)((*((unsigned char *)(cp)) << 8) | \
602 *(((unsigned char *)(cp)) + 1)))
610 snprintf(command, 256, "dmsetup message %s 0 mark %s.mark%d", logdev,
612 ret = system(command);
614 prterr("dmsetup mark failed");
/*
 * dump_fsync_buffer: save the first file_size bytes of good_buf to a
 * "<dname>...mark<N>" file, which is created or truncated with mode 0666.
 * The open failure is reported using the file name as the prefix.
 * NOTE(review): the remaining arguments that build the file name are not
 * visible in this excerpt.
 */
620 dump_fsync_buffer(void)
622 char fname_buffer[PATH_MAX];
628 snprintf(fname_buffer, sizeof(fname_buffer), "%s%s.mark%d", dname,
630 good_fd = open(fname_buffer, O_WRONLY|O_CREAT|O_TRUNC, 0666);
632 prterr(fname_buffer);
636 save_buffer(good_buf, file_size, good_fd);
/* Skip the leading dirpath characters of the name when printing it. */
638 prt("Dumped fsync buffer to %s\n", fname_buffer + dirpath);
/*
 * check_buffers: compare size bytes of buf against good_buf starting at
 * offset. On a mismatch it prints a "READ BAD DATA" report with the
 * offset, the good and bad 16-bit values (via short_at) and the length of
 * the bad range, followed by a hint about which operation number (mod 256)
 * may have written the bad data.
 * NOTE(review): the loop that locates the mismatching bytes and the
 * condition choosing between the two hints are not visible in this excerpt.
 */
642 check_buffers(char *buf, unsigned offset, unsigned size)
650 if (memcmp(good_buf + offset, buf, size) != 0) {
651 prt("READ BAD DATA: offset = 0x%x, size = 0x%x, fname = %s\n",
652 offset, size, fname);
653 prt("OFFSET\tGOOD\tBAD\tRANGE\n");
655 c = good_buf[offset];
659 bad = short_at(&buf[i]);
660 prt("0x%05x\t0x%04x\t0x%04x", offset,
661 short_at(&good_buf[offset]), bad);
/* Take the operation byte from buf at i or i+1 depending on offset parity. */
662 op = buf[offset & 1 ? i+1 : i];
663 prt("\t0x%05x\n", n);
665 prt("operation# (mod 256) for "
666 "the bad data may be %u\n",
667 ((unsigned)op & 0xff));
669 prt("operation# (mod 256) for "
670 "the bad data unknown, check"
671 " HOLE and EXTEND ops\n");
/*
 * check_size body: verify that the expected file_size matches both
 * fstat()'s st_size and the offset returned by lseek(SEEK_END). If fstat()
 * fails, st_size is set to -1 so the comparison below reports a size error.
 */
691 if (fstat(fd, &statbuf)) {
692 prterr("check_size: fstat");
693 statbuf.st_size = -1;
695 size_by_seek = lseek(fd, (off_t)0, SEEK_END);
696 if (file_size != statbuf.st_size || file_size != size_by_seek) {
697 prt("Size error: expected 0x%llx stat 0x%llx seek 0x%llx\n",
698 (unsigned long long)file_size,
699 (unsigned long long)statbuf.st_size,
700 (unsigned long long)size_by_seek);
/*
 * check_trunc_hack: probe whether ftruncate() can extend the file. The
 * file is truncated to file_size, then to file_size + 100000, and the
 * resulting st_size is compared with the extended length; a mismatch is
 * reported as "no extend on truncate! not posix!". The file is then
 * truncated back to file_size.
 * NOTE(review): the stat call that fills statbuf and the handling of the
 * first two ftruncate() failures are not visible in this excerpt.
 */
707 check_trunc_hack(void)
710 off_t offset = file_size + (off_t)100000;
712 if (ftruncate(fd, file_size))
714 if (ftruncate(fd, offset))
717 if (statbuf.st_size != offset) {
718 prt("no extend on truncate! not posix!\n");
721 if (ftruncate(fd, file_size)) {
723 prterr("check_trunc_hack: ftruncate");
/*
 * doflush: map the byte range [offset, offset + size) of the test file as
 * a shared read/write mapping, call msync(MS_INVALIDATE) on it, and unmap
 * it. The mapping starts at offset rounded down by mmap_mask, so map_size
 * grows by the rounding distance.
 * NOTE(review): the action taken when o_direct == O_DIRECT and after each
 * reported failure is not visible in this excerpt.
 */
729 doflush(unsigned offset, unsigned size)
735 if (o_direct == O_DIRECT)
738 pg_offset = offset & mmap_mask;
739 map_size = pg_offset + size;
741 if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
742 MAP_FILE | MAP_SHARED, fd,
743 (off_t)(offset - pg_offset))) == (char *)-1) {
744 prterr("doflush: mmap");
747 if (msync(p, map_size, MS_INVALIDATE) != 0) {
748 prterr("doflush: msync");
751 if (munmap(p, map_size) != 0) {
752 prterr("doflush: munmap");
/*
 * doread: read size bytes at offset from the test file into temp_buf and
 * verify them against good_buf.
 *
 * offset and size are first rounded down to multiples of readbdy. Requests
 * that end up empty or that extend past file_size are logged with
 * FL_SKIPPED; everything else is logged with FL_NONE before any I/O.
 * NOTE(review): the early exits (after a skip, and while testcalls is
 * still <= simulatedopcount) are not visible in this excerpt.
 */
758 doread(unsigned offset, unsigned size)
763 offset -= offset % readbdy;
765 size -= size % readbdy;
767 if (!quiet && testcalls > simulatedopcount && !o_direct)
768 prt("skipping zero size read\n");
769 log4(OP_READ, offset, size, FL_SKIPPED);
772 if (size + offset > file_size) {
773 if (!quiet && testcalls > simulatedopcount)
774 prt("skipping seek/read past end of file\n");
775 log4(OP_READ, offset, size, FL_SKIPPED);
779 log4(OP_READ, offset, size, FL_NONE);
781 if (testcalls <= simulatedopcount)
/* Progress/debug trace, limited to the monitored byte range when one is set. */
785 ((progressinterval && testcalls % progressinterval == 0) ||
787 (monitorstart == -1 ||
788 (offset + size > monitorstart &&
789 (monitorend == -1 || offset <= monitorend))))))
790 prt("%lld read\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
791 offset, offset + size - 1, size);
792 ret = lseek(fd, (off_t)offset, SEEK_SET);
793 if (ret == (off_t)-1) {
794 prterr("doread: lseek");
797 iret = fsxread(fd, temp_buf, size, offset);
800 prterr("doread: read");
802 prt("short read: 0x%x bytes instead of 0x%x\n",
806 check_buffers(temp_buf, offset, size);
/*
 * check_eofpage: for a mapping p that covers file bytes starting at offset
 * for size bytes, verify that the bytes of the last page lying beyond
 * file_size read back as zero. s names the caller's operation for the
 * report.
 *
 * Nothing is checked when the mapped range ends at or before the start of
 * the file's final page.
 * NOTE(review): the loop increment and the statements following the
 * report are not visible in this excerpt.
 */
810 check_eofpage(char *s, unsigned offset, char *p, int size)
812 unsigned long last_page, should_be_zero;
814 if (offset + size <= (file_size & ~page_mask))
817 * we landed in the last page of the file
818 * test to make sure the VM system provided 0's
819 * beyond the true end of the file mapping
820 * (as required by mmap def in 1996 posix 1003.1)
/* Address of the page, inside the mapping, that holds the end of the range. */
822 last_page = ((unsigned long)p + (offset & page_mask) + size) & ~page_mask;
824 for (should_be_zero = last_page + (file_size & page_mask);
825 should_be_zero < last_page + page_size;
827 if (*(char *)should_be_zero) {
/*
 * should_be_zero is an unsigned long, so the page offset is printed with
 * %lx (it was %x, a type mismatch), and file_size - 1 is cast to match
 * %llx explicitly.
 */
828 prt("Mapped %s: non-zero data past EOF (0x%llx) page offset 0x%lx is 0x%04x\n",
829 s, (unsigned long long)(file_size - 1), (unsigned long)(should_be_zero & page_mask),
830 short_at(should_be_zero));
/*
 * check_contents body: re-read the file through fsxread() into a lazily
 * allocated, writebdy-aligned scratch buffer, compare it with good_buf,
 * then map the page containing EOF and run check_eofpage() on it.
 * NOTE(review): the guard around the one-time allocation and the early
 * exits after reported failures are not visible in this excerpt.
 */
838 static char *check_buf;
840 unsigned size = file_size;
/* Over-allocate by writebdy so the pointer can be rounded up to that alignment. */
848 check_buf = (char *) malloc(maxfilelen + writebdy);
849 assert(check_buf != NULL);
850 check_buf = round_ptr_up(check_buf, writebdy, 0);
851 memset(check_buf, '\0', maxfilelen);
855 size -= size % readbdy;
859 ret = lseek(fd, (off_t)offset, SEEK_SET);
860 if (ret == (off_t)-1) {
/* Was "doread: lseek", which attributed this failure to the wrong function. */
861 prterr("check_contents: lseek");
865 iret = fsxread(fd, check_buf, size, offset);
868 prterr("check_contents: read");
870 prt("short check read: 0x%x bytes instead of 0x%x\n",
874 check_buffers(check_buf, offset, size);
876 /* Map eof page, check it */
877 map_offset = size - (size & PAGE_MASK);
/* size is page aligned: step back one page so the mapping is not empty. */
878 if (map_offset == size)
879 map_offset -= PAGE_SIZE;
880 map_size = size - map_offset;
882 p = mmap(0, map_size, PROT_READ, MAP_SHARED, fd, map_offset);
883 if (p == MAP_FAILED) {
884 prterr("check_contents: mmap");
887 check_eofpage("check_contents", map_offset, p, map_size);
889 if (munmap(p, map_size) != 0) {
890 prterr("check_contents: munmap");
/*
 * domapread: read size bytes at offset through a shared read-only mapping,
 * copy them into temp_buf, check the EOF page, and verify the data against
 * good_buf.
 *
 * offset is rounded down to a multiple of readbdy. Empty requests and
 * requests past file_size are logged with FL_SKIPPED.
 * NOTE(review): the early exits (after a skip, and while testcalls is
 * still <= simulatedopcount) are not visible in this excerpt.
 */
896 domapread(unsigned offset, unsigned size)
902 offset -= offset % readbdy;
904 if (!quiet && testcalls > simulatedopcount)
905 prt("skipping zero size read\n");
906 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
909 if (size + offset > file_size) {
910 if (!quiet && testcalls > simulatedopcount)
911 prt("skipping seek/read past end of file\n");
912 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
916 log4(OP_MAPREAD, offset, size, FL_NONE);
918 if (testcalls <= simulatedopcount)
922 ((progressinterval && testcalls % progressinterval == 0) ||
924 (monitorstart == -1 ||
925 (offset + size > monitorstart &&
926 (monitorend == -1 || offset <= monitorend))))))
927 prt("%lld mapread\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
928 offset, offset + size - 1, size);
/* mmap needs a page-aligned file offset: map from the page start. */
930 pg_offset = offset & PAGE_MASK;
931 map_size = pg_offset + size;
933 if ((p = (char *)mmap(0, map_size, PROT_READ, MAP_SHARED, fd,
934 (off_t)(offset - pg_offset))) == (char *)-1) {
935 prterr("domapread: mmap");
938 memcpy(temp_buf, p + pg_offset, size);
940 check_eofpage("Read", offset, p, size);
942 if (munmap(p, map_size) != 0) {
943 prterr("domapread: munmap");
947 check_buffers(temp_buf, offset, size);
/*
 * gendata: fill good_buf for the range starting at offset with the data an
 * upcoming write is expected to produce. A byte is set either to filldata
 * or to testcalls % 256, and the corresponding original_buf byte can be
 * added on top.
 * NOTE(review): the loop and the conditions selecting between these
 * assignments are not visible in this excerpt.
 */
952 gendata(char *original_buf, char *good_buf, unsigned offset, unsigned size)
956 good_buf[offset] = filldata;
958 good_buf[offset] = testcalls % 256;
960 good_buf[offset] += original_buf[offset];
/*
 * dowrite: write size bytes at offset to the test file from good_buf.
 *
 * offset and size are rounded down to multiples of writebdy, and an empty
 * request is logged with FL_SKIPPED. The expected data is generated into
 * good_buf first. If the write extends the file, any gap between the old
 * end of file and offset is zeroed in good_buf and file_size grows to the
 * end of the write. The data is then written with lseek() + fsxwrite(),
 * and doflush() is called on the same range.
 * NOTE(review): the conditions around the "Lite file size bug" warning,
 * the fsync and the doflush call, and the early exits, are not visible in
 * this excerpt.
 */
968 dowrite(unsigned offset, unsigned size)
973 offset -= offset % writebdy;
975 size -= size % writebdy;
977 if (!quiet && testcalls > simulatedopcount && !o_direct)
978 prt("skipping zero size write\n");
979 log4(OP_WRITE, offset, size, FL_SKIPPED);
983 log4(OP_WRITE, offset, size, FL_NONE);
985 gendata(original_buf, good_buf, offset, size);
986 if (file_size < offset + size) {
/* Writing beyond EOF leaves a hole: it must read back as zeroes. */
987 if (file_size < offset)
988 memset(good_buf + file_size, '\0', offset - file_size);
989 file_size = offset + size;
991 warn("Lite file size bug in fsx!");
996 if (testcalls <= simulatedopcount)
1000 ((progressinterval && testcalls % progressinterval == 0) ||
1002 (monitorstart == -1 ||
1003 (offset + size > monitorstart &&
1004 (monitorend == -1 || offset <= monitorend))))))
1005 prt("%lld write\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
1006 offset, offset + size - 1, size);
1007 ret = lseek(fd, (off_t)offset, SEEK_SET);
1008 if (ret == (off_t)-1) {
1009 prterr("dowrite: lseek");
1010 report_failure(150);
1012 iret = fsxwrite(fd, good_buf + offset, size, offset);
1015 prterr("dowrite: write");
1017 prt("short write: 0x%x bytes instead of 0x%x\n",
1019 report_failure(151);
1023 prt("fsync() failed: %s\n", strerror(errno));
1024 report_failure(152);
1028 doflush(offset, size);
/*
 * domapwrite: write size bytes at offset to the test file through a shared
 * read/write mapping.
 *
 * offset is rounded down to a multiple of writebdy, and an empty request
 * is logged with FL_SKIPPED. Expected data is generated into good_buf, and
 * file_size is grown (zeroing any gap) when the write extends the file.
 * Because a mapping cannot extend a file, the file is first grown with
 * ftruncate() when file_size increased. The data is then copied into the
 * mapping and flushed with msync(MS_SYNC), and the EOF page is checked
 * before unmapping.
 * NOTE(review): the condition around the "Lite file size bug" warning and
 * the early exits are not visible in this excerpt.
 */
1034 domapwrite(unsigned offset, unsigned size)
1041 offset -= offset % writebdy;
1043 if (!quiet && testcalls > simulatedopcount)
1044 prt("skipping zero size write\n");
1045 log4(OP_MAPWRITE, offset, size, FL_SKIPPED);
/* Remember the size before this operation to detect an extension below. */
1048 cur_filesize = file_size;
1050 log4(OP_MAPWRITE, offset, size, FL_NONE);
1052 gendata(original_buf, good_buf, offset, size);
1053 if (file_size < offset + size) {
1054 if (file_size < offset)
1055 memset(good_buf + file_size, '\0', offset - file_size);
1056 file_size = offset + size;
1058 warn("Lite file size bug in fsx!");
1059 report_failure(200);
1063 if (testcalls <= simulatedopcount)
1067 ((progressinterval && testcalls % progressinterval == 0) ||
1069 (monitorstart == -1 ||
1070 (offset + size > monitorstart &&
1071 (monitorend == -1 || offset <= monitorend))))))
1072 prt("%lld mapwrite\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
1073 offset, offset + size - 1, size);
1075 if (file_size > cur_filesize) {
1076 if (ftruncate(fd, file_size) == -1) {
1077 prterr("domapwrite: ftruncate");
1081 pg_offset = offset & PAGE_MASK;
1082 map_size = pg_offset + size;
1084 if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
1085 MAP_FILE | MAP_SHARED, fd,
1086 (off_t)(offset - pg_offset))) == (char *)-1) {
1087 prterr("domapwrite: mmap");
1088 report_failure(202);
1090 memcpy(p + pg_offset, good_buf + offset, size);
1091 if (msync(p, map_size, MS_SYNC) != 0) {
1092 prterr("domapwrite: msync");
1093 report_failure(203);
1096 check_eofpage("Write", offset, p, size);
1098 if (munmap(p, map_size) != 0) {
1099 prterr("domapwrite: munmap");
1100 report_failure(204);
/*
 * dotruncate: truncate the test file to size, rounded down to a multiple
 * of truncbdy. The operation is logged with 0 as the first argument and
 * the new size as the second. When the file grows, the newly exposed range
 * of good_buf is zeroed before ftruncate() is called.
 * NOTE(review): the update of `biggest` and of file_size, and the early
 * exit while testcalls <= simulatedopcount, are not visible in this
 * excerpt.
 */
1106 dotruncate(unsigned size)
1108 int oldsize = file_size;
1110 size -= size % truncbdy;
1111 if (size > biggest) {
1113 if (!quiet && testcalls > simulatedopcount)
1114 prt("truncating to largest ever: 0x%x\n", size);
1117 log4(OP_TRUNCATE, 0, size, FL_NONE);
1119 if (size > file_size)
1120 memset(good_buf + file_size, '\0', size - file_size);
1123 if (testcalls <= simulatedopcount)
1126 if ((progressinterval && testcalls % progressinterval == 0) ||
1127 (debug && (monitorstart == -1 || monitorend == -1 ||
1128 size <= monitorend)))
1129 prt("%lld trunc\tfrom 0x%x to 0x%x\n", testcalls, oldsize,
1131 if (ftruncate(fd, (off_t)size) == -1) {
1132 prt("ftruncate1: %x\n", size);
1133 prterr("dotruncate: ftruncate");
1134 report_failure(160);
1138 #ifdef FALLOC_FL_PUNCH_HOLE
/*
 * do_punch_hole: punch a hole of length bytes at offset with
 * fallocate(FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE), then zero the
 * matching part of good_buf, clamped so that nothing beyond file_size is
 * touched. Zero-length requests and requests starting at or beyond
 * file_size are logged with FL_SKIPPED.
 * NOTE(review): the early exits are not visible in this excerpt.
 */
1140 do_punch_hole(unsigned offset, unsigned length)
1142 unsigned end_offset;
1145 int mode = FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE;
1148 if (!quiet && testcalls > simulatedopcount)
1149 prt("skipping zero length punch hole\n");
1150 log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
1154 if (file_size <= (loff_t)offset) {
1155 if (!quiet && testcalls > simulatedopcount)
1156 prt("skipping hole punch off the end of the file\n");
1157 log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
1161 end_offset = offset + length;
1163 log4(OP_PUNCH_HOLE, offset, length, FL_NONE);
1165 if (testcalls <= simulatedopcount)
1168 if ((progressinterval && testcalls % progressinterval == 0) ||
1169 (debug && (monitorstart == -1 || monitorend == -1 ||
1170 end_offset <= monitorend))) {
1171 prt("%lld punch\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1172 offset, offset+length, length);
1174 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1175 prt("punch hole: 0x%x to 0x%x\n", offset, offset + length);
1176 prterr("do_punch_hole: fallocate");
1177 report_failure(161);
/* Clamp the zeroed range to the current file size. */
1181 max_offset = offset < file_size ? offset : file_size;
1182 max_len = max_offset + length <= file_size ? length :
1183 file_size - max_offset;
1184 memset(good_buf + max_offset, '\0', max_len);
/* Second definition with the same signature; NOTE(review): presumably the fallback when FALLOC_FL_PUNCH_HOLE is undefined - its body is not visible here. */
1189 do_punch_hole(unsigned offset, unsigned length)
1195 #ifdef FALLOC_FL_ZERO_RANGE
/*
 * do_zero_range: zero length bytes at offset with
 * fallocate(FALLOC_FL_ZERO_RANGE), optionally combined with
 * FALLOC_FL_KEEP_SIZE, and mirror the result in good_buf.
 *
 * With keep_size set, end_offset is forced to 0, so neither `biggest` nor
 * file_size can grow. Otherwise a range ending past file_size extends the
 * file, and any gap between the old end of file and offset is zeroed in
 * good_buf as well.
 * NOTE(review): the condition that adds FALLOC_FL_KEEP_SIZE to mode and
 * the early exits are not visible in this excerpt.
 */
1197 do_zero_range(unsigned offset, unsigned length, int keep_size)
1199 unsigned end_offset;
1200 int mode = FALLOC_FL_ZERO_RANGE;
1203 mode |= FALLOC_FL_KEEP_SIZE;
1206 if (!quiet && testcalls > simulatedopcount)
1207 prt("skipping zero length zero range\n");
1208 log4(OP_ZERO_RANGE, offset, length, FL_SKIPPED |
1209 (keep_size ? FL_KEEP_SIZE : FL_NONE));
1213 end_offset = keep_size ? 0 : offset + length;
1215 if (end_offset > biggest) {
1216 biggest = end_offset;
1217 if (!quiet && testcalls > simulatedopcount)
1218 prt("zero_range to largest ever: 0x%x\n", end_offset);
1222 * last arg matches fallocate string array index in logdump:
1223 * 0: allocate past EOF
1224 * 1: extending prealloc
1225 * 2: interior prealloc
1227 log4(OP_ZERO_RANGE, offset, length,
1228 keep_size ? FL_KEEP_SIZE : FL_NONE);
1230 if (testcalls <= simulatedopcount)
1233 if ((progressinterval && testcalls % progressinterval == 0) ||
1234 (debug && (monitorstart == -1 || monitorend == -1 ||
1235 end_offset <= monitorend))) {
1236 prt("%lld zero\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1237 offset, offset+length, length);
1239 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1240 prt("zero range: 0x%x to 0x%x\n", offset, offset + length);
1241 prterr("do_zero_range: fallocate");
1242 report_failure(161);
1245 memset(good_buf + offset, '\0', length);
1247 if (!keep_size && end_offset > file_size) {
1249 * If there's a gap between the old file size and the offset of
1250 * the zero range operation, fill the gap with zeroes.
1252 if (offset > file_size)
1253 memset(good_buf + file_size, '\0', offset - file_size);
1255 file_size = end_offset;
/* Second definition with the same signature; NOTE(review): presumably the fallback when FALLOC_FL_ZERO_RANGE is undefined - its body is not visible here. */
1261 do_zero_range(unsigned offset, unsigned length, int keep_size)
1267 #ifdef FALLOC_FL_COLLAPSE_RANGE
/*
 * do_collapse_range: remove length bytes at offset from the file with
 * fallocate(FALLOC_FL_COLLAPSE_RANGE). good_buf is updated to match by
 * sliding the data after the range down over it, and file_size shrinks by
 * length. Zero-length requests and ranges that reach or pass file_size are
 * logged with FL_SKIPPED.
 * NOTE(review): the early exits are not visible in this excerpt.
 */
1269 do_collapse_range(unsigned offset, unsigned length)
1271 unsigned end_offset;
1272 int mode = FALLOC_FL_COLLAPSE_RANGE;
1275 if (!quiet && testcalls > simulatedopcount)
1276 prt("skipping zero length collapse range\n");
1277 log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
1281 end_offset = offset + length;
1282 if ((loff_t)end_offset >= file_size) {
1283 if (!quiet && testcalls > simulatedopcount)
1284 prt("skipping collapse range behind EOF\n");
1285 log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
1289 log4(OP_COLLAPSE_RANGE, offset, length, FL_NONE);
1291 if (testcalls <= simulatedopcount)
1294 if ((progressinterval && testcalls % progressinterval == 0) ||
1295 (debug && (monitorstart == -1 || monitorend == -1 ||
1296 end_offset <= monitorend))) {
1297 prt("%lld collapse\tfrom 0x%x to 0x%x, (0x%x bytes)\n",
1298 testcalls, offset, offset+length, length);
1300 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1301 prt("collapse range: 0x%x to 0x%x\n", offset, offset + length);
1302 prterr("do_collapse_range: fallocate");
1303 report_failure(161);
/* Source and destination overlap, hence memmove rather than memcpy. */
1306 memmove(good_buf + offset, good_buf + end_offset,
1307 file_size - end_offset);
1308 file_size -= length;
/* Second definition with the same signature; NOTE(review): presumably the fallback when FALLOC_FL_COLLAPSE_RANGE is undefined - its body is not visible here. */
1313 do_collapse_range(unsigned offset, unsigned length)
1319 #ifdef FALLOC_FL_INSERT_RANGE
/*
 * do_insert_range: insert a length-byte hole at offset with
 * fallocate(FALLOC_FL_INSERT_RANGE). good_buf is updated to match by
 * sliding the data from offset onwards up by length and zeroing the
 * inserted range, and file_size grows by length. Zero-length requests and
 * offsets at or beyond file_size are logged with FL_SKIPPED.
 * NOTE(review): the early exits are not visible in this excerpt.
 */
1321 do_insert_range(unsigned offset, unsigned length)
1323 unsigned end_offset;
1324 int mode = FALLOC_FL_INSERT_RANGE;
1327 if (!quiet && testcalls > simulatedopcount)
1328 prt("skipping zero length insert range\n");
1329 log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
1333 if ((loff_t)offset >= file_size) {
1334 if (!quiet && testcalls > simulatedopcount)
1335 prt("skipping insert range behind EOF\n");
1336 log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
1340 log4(OP_INSERT_RANGE, offset, length, FL_NONE);
1342 if (testcalls <= simulatedopcount)
1345 end_offset = offset + length;
1346 if ((progressinterval && testcalls % progressinterval == 0) ||
1347 (debug && (monitorstart == -1 || monitorend == -1 ||
1348 end_offset <= monitorend))) {
1349 prt("%lld insert\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1350 offset, offset+length, length);
1352 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1353 prt("insert range: 0x%x to 0x%x\n", offset, offset + length);
1354 prterr("do_insert_range: fallocate");
1355 report_failure(161);
/* Source and destination overlap, hence memmove rather than memcpy. */
1358 memmove(good_buf + end_offset, good_buf + offset,
1359 file_size - offset);
1360 memset(good_buf + offset, '\0', length);
1361 file_size += length;
/* Second definition with the same signature; NOTE(review): presumably the fallback when FALLOC_FL_INSERT_RANGE is undefined - its body is not visible here. */
1366 do_insert_range(unsigned offset, unsigned length)
/*
 * test_clone_range: probe FICLONERANGE support by issuing the ioctl on the
 * test file. A failure with EOPNOTSUPP or ENOTTY is treated as "not
 * supported" and leads to the "disabling" message.
 * NOTE(review): the contents of the probe request, the !quiet guard (if
 * any) and the return values are not visible in this excerpt.
 */
1374 test_clone_range(void)
1376 struct file_clone_range fcr = {
1380 if (ioctl(fd, FICLONERANGE, &fcr) &&
1381 (errno == EOPNOTSUPP || errno == ENOTTY)) {
1384 "main: filesystem does not support "
1385 "clone range, disabling!\n");
/*
 * do_clone_range: clone length bytes at offset onto dest within the test
 * file using the FICLONERANGE ioctl, then apply the same copy to good_buf.
 *
 * Zero-length requests and sources starting at or beyond file_size are
 * logged with FL_SKIPPED. When dest lies past the old end of file, the gap
 * is zeroed in good_buf, and file_size grows to cover the destination
 * range.
 * NOTE(review): the early exits are not visible in this excerpt.
 */
1393 do_clone_range(unsigned offset, unsigned length, unsigned dest)
1395 struct file_clone_range fcr = {
1397 .src_offset = offset,
1398 .src_length = length,
1399 .dest_offset = dest,
1403 if (!quiet && testcalls > simulatedopcount)
1404 prt("skipping zero length clone range\n");
1405 log5(OP_CLONE_RANGE, offset, length, dest, FL_SKIPPED);
1409 if ((loff_t)offset >= file_size) {
1410 if (!quiet && testcalls > simulatedopcount)
1411 prt("skipping clone range behind EOF\n");
1412 log5(OP_CLONE_RANGE, offset, length, dest, FL_SKIPPED);
1416 if (dest + length > biggest) {
1417 biggest = dest + length;
1418 if (!quiet && testcalls > simulatedopcount)
1419 prt("cloning to largest ever: 0x%x\n", dest + length);
1422 log5(OP_CLONE_RANGE, offset, length, dest, FL_NONE);
1424 if (testcalls <= simulatedopcount)
1427 if ((progressinterval && testcalls % progressinterval == 0) ||
1428 (debug && (monitorstart == -1 || monitorend == -1 ||
1429 dest <= monitorstart || dest + length <= monitorend))) {
/* testcalls is a long long: print it with %lld (this was %lu). */
1430 prt("%lld clone\tfrom 0x%x to 0x%x, (0x%x bytes) at 0x%x\n",
1431 testcalls, offset, offset+length, length, dest);
1434 if (ioctl(fd, FICLONERANGE, &fcr) == -1) {
1435 prt("clone range: 0x%x to 0x%x at 0x%x\n", offset,
1436 offset + length, dest);
1437 prterr("do_clone_range: FICLONERANGE");
1438 report_failure(161);
1441 memcpy(good_buf + dest, good_buf + offset, length);
/* A destination past the old EOF leaves a hole that reads as zeroes. */
1442 if (dest > file_size)
1443 memset(good_buf + file_size, '\0', dest - file_size);
1444 if (dest + length > file_size)
1445 file_size = dest + length;
/* Second definitions with the same signatures; NOTE(review): presumably the fallbacks when FICLONERANGE is unavailable - their bodies are not visible here. */
1450 test_clone_range(void)
1456 do_clone_range(unsigned offset, unsigned length, unsigned dest)
1462 #ifdef FIDEDUPERANGE
/*
 * test_dedupe_range: probe FIDEDUPERANGE support. The file is temporarily
 * grown to two blocks if it is smaller, and a one-block dedupe of the file
 * against its own second block is attempted. EOPNOTSUPP, ENOTTY or EINVAL,
 * whether from the ioctl or from the per-destination status, is treated as
 * "not supported". The file is truncated back afterwards.
 * NOTE(review): the allocation-failure test, the errno capture after a
 * failed ioctl and the return values are not visible in this excerpt.
 * NOTE(review): the allocation-failure message names do_dedupe_range and
 * malloc although this is test_dedupe_range using calloc.
 */
1464 test_dedupe_range(void)
1466 struct file_dedupe_range *fdr;
/* One header plus one trailing info element, zero-filled. */
1472 fdr = calloc(sizeof(struct file_dedupe_range_info) +
1473 sizeof(struct file_dedupe_range), 1);
1475 prterr("do_dedupe_range: malloc");
1476 report_failure(161);
1479 /* Make sure we have at least two blocks */
1480 new_len = block_size * 2;
1481 if (file_size < new_len && ftruncate(fd, new_len)) {
1482 warn("main: ftruncate");
1486 /* Try to dedupe them */
1487 fdr->src_length = block_size;
1488 fdr->dest_count = 1;
1489 fdr->info[0].dest_fd = fd;
1490 fdr->info[0].dest_offset = block_size;
1492 if (ioctl(fd, FIDEDUPERANGE, fdr))
/* A negative status carries a negated errno value. */
1494 else if (fdr->info[0].status < 0)
1495 error = -fdr->info[0].status;
1499 /* Older kernels may return EINVAL... */
1500 if (error == EOPNOTSUPP || error == ENOTTY || error == EINVAL) {
1503 "main: filesystem does not support "
1504 "dedupe range, disabling!\n");
1508 /* Put the file back the way it was. */
1509 if (file_size < new_len && ftruncate(fd, file_size)) {
1510 warn("main: ftruncate");
/*
 * do_dedupe_range: ask the kernel, via the FIDEDUPERANGE ioctl, to dedupe
 * length bytes at offset against the range at dest in the same file.
 *
 * Zero-length requests and sources starting at or beyond file_size are
 * logged with FL_SKIPPED. Both a failing ioctl and a negative
 * per-destination status are reported as failures; in the latter case
 * errno is set from the negated status so prterr() prints the right text.
 * NOTE(review): the allocation-failure test, the early exits and the
 * release of fdr are not visible in this excerpt.
 */
1519 do_dedupe_range(unsigned offset, unsigned length, unsigned dest)
1521 struct file_dedupe_range *fdr;
1524 if (!quiet && testcalls > simulatedopcount)
1525 prt("skipping zero length dedupe range\n");
1526 log5(OP_DEDUPE_RANGE, offset, length, dest, FL_SKIPPED);
1530 if ((loff_t)offset >= file_size) {
1531 if (!quiet && testcalls > simulatedopcount)
1532 prt("skipping dedupe range behind EOF\n");
1533 log5(OP_DEDUPE_RANGE, offset, length, dest, FL_SKIPPED);
1537 log5(OP_DEDUPE_RANGE, offset, length, dest, FL_NONE);
1539 if (testcalls <= simulatedopcount)
1542 if ((progressinterval && testcalls % progressinterval == 0) ||
1543 (debug && (monitorstart == -1 || monitorend == -1 ||
1544 dest <= monitorstart || dest + length <= monitorend))) {
/* testcalls is a long long: print it with %lld (this was %lu). */
1545 prt("%lld dedupe\tfrom 0x%x to 0x%x, (0x%x bytes) at 0x%x\n",
1546 testcalls, offset, offset+length, length, dest);
/* One header plus one trailing info element, zero-filled. */
1550 fdr = calloc(sizeof(struct file_dedupe_range_info) +
1551 sizeof(struct file_dedupe_range), 1);
1553 prterr("do_dedupe_range: malloc");
1554 report_failure(161);
1557 /* Dedupe data blocks */
1558 fdr->src_offset = offset;
1559 fdr->src_length = length;
1560 fdr->dest_count = 1;
1561 fdr->info[0].dest_fd = fd;
1562 fdr->info[0].dest_offset = dest;
1564 if (ioctl(fd, FIDEDUPERANGE, fdr) == -1) {
1565 prt("dedupe range: 0x%x to 0x%x at 0x%x\n", offset,
1566 offset + length, dest);
1567 prterr("do_dedupe_range(0): FIDEDUPERANGE");
1568 report_failure(161);
1569 } else if (fdr->info[0].status < 0) {
1570 errno = -fdr->info[0].status;
1571 prt("dedupe range: 0x%x to 0x%x at 0x%x\n", offset,
1572 offset + length, dest);
1573 prterr("do_dedupe_range(1): FIDEDUPERANGE");
1574 report_failure(161);
/* Second definitions with the same signatures; NOTE(review): presumably the fallbacks when FIDEDUPERANGE is undefined - their bodies are not visible here. */
1582 test_dedupe_range(void)
1588 do_dedupe_range(unsigned offset, unsigned length, unsigned dest)
1594 #ifdef HAVE_COPY_FILE_RANGE
/*
 * test_copy_range: probe copy_file_range support by copying one byte from
 * file offset 0 to file offset 1 within the test file through the raw
 * syscall. A failure with ENOSYS, EOPNOTSUPP or ENOTTY is treated as "not
 * supported" and leads to the "disabling" message.
 * NOTE(review): the !quiet guard (if any) and the return values are not
 * visible in this excerpt.
 */
1596 test_copy_range(void)
1598 loff_t o1 = 0, o2 = 1;
1600 if (syscall(__NR_copy_file_range, fd, &o1, fd, &o2, 1, 0) == -1 &&
1601 (errno == ENOSYS || errno == EOPNOTSUPP || errno == ENOTTY)) {
1604 "main: filesystem does not support "
1605 "copy range, disabling!\n");
/*
 * do_copy_range: copy length bytes at offset onto dest within the test
 * file using the copy_file_range syscall, then apply the same copy to
 * good_buf.
 *
 * Zero-length requests and sources starting at or beyond file_size are
 * logged with FL_SKIPPED. A syscall result larger than the amount asked
 * for is reported as a failure. When dest lies past the old end of file,
 * the gap is zeroed in good_buf, and file_size grows to cover the
 * destination range.
 * NOTE(review): the copy loop structure, the handling of the EAGAIN retry
 * test (limit 300) and the early exits are not visible in this excerpt.
 */
1613 do_copy_range(unsigned offset, unsigned length, unsigned dest)
1621 if (!quiet && testcalls > simulatedopcount)
1622 prt("skipping zero length copy range\n");
1623 log5(OP_COPY_RANGE, offset, length, dest, FL_SKIPPED);
1627 if ((loff_t)offset >= file_size) {
1628 if (!quiet && testcalls > simulatedopcount)
1629 prt("skipping copy range behind EOF\n");
1630 log5(OP_COPY_RANGE, offset, length, dest, FL_SKIPPED);
1634 if (dest + length > biggest) {
1635 biggest = dest + length;
1636 if (!quiet && testcalls > simulatedopcount)
1637 prt("copying to largest ever: 0x%x\n", dest + length);
1640 log5(OP_COPY_RANGE, offset, length, dest, FL_NONE);
1642 if (testcalls <= simulatedopcount)
1645 if ((progressinterval && testcalls % progressinterval == 0) ||
1646 (debug && (monitorstart == -1 || monitorend == -1 ||
1647 dest <= monitorstart || dest + length <= monitorend))) {
/* testcalls is a long long: print it with %lld (this was %lu). */
1648 prt("%lld copy\tfrom 0x%x to 0x%x, (0x%x bytes) at 0x%x\n",
1649 testcalls, offset, offset+length, length, dest);
1657 nr = syscall(__NR_copy_file_range, fd, &o1, fd, &o2, olen, 0);
1659 if (errno != EAGAIN || tries++ >= 300)
1661 } else if (nr > olen) {
1662 prt("copy range: 0x%x to 0x%x at 0x%x\n", offset,
1663 offset + length, dest);
1664 prt("do_copy_range: asked %u, copied %u??\n",
1666 report_failure(161);
1671 prt("copy range: 0x%x to 0x%x at 0x%x\n", offset,
1672 offset + length, dest);
1673 prterr("do_copy_range:");
1674 report_failure(161);
1677 memcpy(good_buf + dest, good_buf + offset, length);
/* A destination past the old EOF leaves a hole that reads as zeroes. */
1678 if (dest > file_size)
1679 memset(good_buf + file_size, '\0', dest - file_size);
1680 if (dest + length > file_size)
1681 file_size = dest + length;
/* Second definitions with the same signatures; NOTE(review): presumably the fallbacks when HAVE_COPY_FILE_RANGE is undefined - their bodies are not visible here. */
1686 test_copy_range(void)
1692 do_copy_range(unsigned offset, unsigned length, unsigned dest)
1698 #ifdef HAVE_LINUX_FALLOC_H
1699 /* fallocate is basically a no-op unless extending, then a lot like a truncate */
1701 do_preallocate(unsigned offset, unsigned length, int keep_size)
1703 unsigned end_offset;
1706 if (!quiet && testcalls > simulatedopcount)
1707 prt("skipping zero length fallocate\n");
1708 log4(OP_FALLOCATE, offset, length, FL_SKIPPED |
1709 (keep_size ? FL_KEEP_SIZE : FL_NONE));
1713 end_offset = keep_size ? 0 : offset + length;
1715 if (end_offset > biggest) {
1716 biggest = end_offset;
1717 if (!quiet && testcalls > simulatedopcount)
1718 prt("fallocating to largest ever: 0x%x\n", end_offset);
1722 * last arg matches fallocate string array index in logdump:
1723 * 0: allocate past EOF
1724 * 1: extending prealloc
1725 * 2: interior prealloc
1727 log4(OP_FALLOCATE, offset, length,
1728 keep_size ? FL_KEEP_SIZE : FL_NONE);
1730 if (end_offset > file_size) {
1731 memset(good_buf + file_size, '\0', end_offset - file_size);
1732 file_size = end_offset;
1735 if (testcalls <= simulatedopcount)
1738 if ((progressinterval && testcalls % progressinterval == 0) ||
1739 (debug && (monitorstart == -1 || monitorend == -1 ||
1740 end_offset <= monitorend)))
1741 prt("%lld falloc\tfrom 0x%x to 0x%x (0x%x bytes)\n", testcalls,
1742 offset, offset + length, length);
1743 if (fallocate(fd, keep_size ? FALLOC_FL_KEEP_SIZE : 0, (loff_t)offset, (loff_t)length) == -1) {
1744 prt("fallocate: 0x%x to 0x%x\n", offset, offset + length);
1745 prterr("do_preallocate: fallocate");
1746 report_failure(161);
1751 do_preallocate(unsigned offset, unsigned length, int keep_size)
1762 if (lseek(fd, (off_t)0, SEEK_SET) == (off_t)-1) {
1763 prterr("writefileimage: lseek");
1764 report_failure(171);
1766 iret = write(fd, good_buf, file_size);
1767 if ((off_t)iret != file_size) {
1769 prterr("writefileimage: write");
1771 prt("short write: 0x%x bytes instead of 0x%llx\n",
1772 iret, (unsigned long long)file_size);
1773 report_failure(172);
1775 if (lite ? 0 : ftruncate(fd, file_size) == -1) {
1776 prt("ftruncate2: %llx\n", (unsigned long long)file_size);
1777 prterr("writefileimage: ftruncate");
1778 report_failure(173);
1786 if (testcalls <= simulatedopcount)
1790 prt("%lld close/open\n", testcalls);
1792 prterr("docloseopen: close");
1793 report_failure(180);
1795 if (system("echo 3 > /proc/sys/vm/drop_caches")) {
1796 prterr("docloseopen: drop_caches");
1797 report_failure(181);
1799 fd = open(fname, O_RDWR|o_direct, 0);
1801 prterr("docloseopen: open");
1802 report_failure(182);
1811 if (testcalls <= simulatedopcount)
1814 prt("%lld fsync\n", testcalls);
1815 log4(OP_FSYNC, 0, 0, 0);
1819 report_failure(210);
1822 dump_fsync_buffer();
1826 #define TRIM_OFF(off, size) \
1834 #define TRIM_LEN(off, len, size) \
1836 if ((off) + (len) > (size)) \
1837 (len) = (size) - (off); \
1840 #define TRIM_OFF_LEN(off, len, size) \
1842 TRIM_OFF(off, size); \
1843 TRIM_LEN(off, len, size); \
1850 prt("signal %d\n", sig);
1851 prt("testcalls = %lld\n", testcalls);
1856 op_args_count(int operation)
1858 switch (operation) {
1859 case OP_CLONE_RANGE:
1860 case OP_DEDUPE_RANGE:
1869 read_op(struct log_entry *log_entry)
1873 memset(log_entry, 0, sizeof(*log_entry));
1874 log_entry->operation = -1;
1876 while (log_entry->operation == -1) {
1881 if (!fgets(line, sizeof(line), replayopsf)) {
1882 if (feof(replayopsf)) {
1888 str = strtok(line, " \t\n");
1889 } while (!str || str[0] == '#');
1891 if (strcmp(str, "skip") == 0) {
1892 log_entry->flags |= FL_SKIPPED;
1893 str = strtok(NULL, " \t\n");
1897 log_entry->operation = op_code(str);
1898 if (log_entry->operation == -1)
1900 log_entry->nr_args = op_args_count(log_entry->operation);
1901 for (i = 0; i < log_entry->nr_args; i++) {
1904 str = strtok(NULL, " \t\n");
1907 log_entry->args[i] = strtoul(str, &end, 0);
1911 while ((str = strtok(NULL, " \t\n"))) {
1912 if (strcmp(str, "keep_size") == 0)
1913 log_entry->flags |= FL_KEEP_SIZE;
1914 else if (strcmp(str, "close_open") == 0)
1915 log_entry->flags |= FL_CLOSE_OPEN;
1916 else if (strcmp(str, "*") == 0)
1917 ; /* overlap marker; ignore */
1925 fprintf(stderr, "%s: parse error\n", replayops);
1928 cleanup(100); /* doesn't return */
1938 return llabs((unsigned long long)off1 - off0) < size;
1941 static void generate_dest_range(bool bdy_align,
1942 unsigned long max_range_end,
1943 unsigned long *src_offset,
1944 unsigned long *size,
1945 unsigned long *dst_offset)
1949 TRIM_OFF_LEN(*src_offset, *size, file_size);
1951 *src_offset -= *src_offset % readbdy;
1953 *size -= *size % readbdy;
1955 *src_offset = *src_offset & ~(block_size - 1);
1956 *size = *size & ~(block_size - 1);
1960 if (tries++ >= 30) {
1964 *dst_offset = random();
1965 TRIM_OFF(*dst_offset, max_range_end);
1967 *dst_offset -= *dst_offset % writebdy;
1969 *dst_offset = *dst_offset & ~(block_size - 1);
1970 } while (range_overlaps(*src_offset, *dst_offset, *size) ||
1971 *dst_offset + *size > max_range_end);
1977 unsigned long offset, offset2;
1983 if (simulatedopcount > 0 && testcalls == simulatedopcount)
1988 if (debugstart > 0 && testcalls >= debugstart)
1991 if (!quiet && testcalls < simulatedopcount && testcalls % 100000 == 0)
1992 prt("%lld...\n", testcalls);
1995 struct log_entry log_entry;
1997 while (read_op(&log_entry)) {
1998 if (log_entry.flags & FL_SKIPPED) {
1999 log4(log_entry.operation,
2000 log_entry.args[0], log_entry.args[1],
2005 op = log_entry.operation;
2006 offset = log_entry.args[0];
2007 size = log_entry.args[1];
2008 offset2 = log_entry.args[2];
2009 closeopen = !!(log_entry.flags & FL_CLOSE_OPEN);
2010 keep_size = !!(log_entry.flags & FL_KEEP_SIZE);
2018 closeopen = (rv >> 3) < (1 << 28) / closeprob;
2024 size = random() % (maxoplen + 1);
2026 /* calculate appropriate op to run */
2028 op = rv % OP_MAX_LITE;
2029 else if (!integrity)
2030 op = rv % OP_MAX_FULL;
2032 op = rv % OP_MAX_INTEGRITY;
2037 size = random() % maxfilelen;
2040 if (fallocate_calls && size && keep_size_calls)
2041 keep_size = random() % 2;
2044 if (zero_range_calls && size && keep_size_calls)
2045 keep_size = random() % 2;
2047 case OP_CLONE_RANGE:
2048 generate_dest_range(false, maxfilelen, &offset, &size, &offset2);
2050 case OP_DEDUPE_RANGE:
2051 generate_dest_range(false, file_size, &offset, &size, &offset2);
2054 generate_dest_range(true, maxfilelen, &offset, &size, &offset2);
2070 if (!fallocate_calls) {
2071 log4(OP_FALLOCATE, offset, size, FL_SKIPPED);
2076 if (!punch_hole_calls) {
2077 log4(OP_PUNCH_HOLE, offset, size, FL_SKIPPED);
2082 if (!zero_range_calls) {
2083 log4(OP_ZERO_RANGE, offset, size, FL_SKIPPED);
2087 case OP_COLLAPSE_RANGE:
2088 if (!collapse_range_calls) {
2089 log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
2093 case OP_INSERT_RANGE:
2094 if (!insert_range_calls) {
2095 log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
2099 case OP_CLONE_RANGE:
2100 if (!clone_range_calls) {
2101 log5(op, offset, size, offset2, FL_SKIPPED);
2105 case OP_DEDUPE_RANGE:
2106 if (!dedupe_range_calls) {
2107 log5(op, offset, size, offset2, FL_SKIPPED);
2112 if (!copy_range_calls) {
2113 log5(op, offset, size, offset2, FL_SKIPPED);
2121 TRIM_OFF_LEN(offset, size, file_size);
2122 doread(offset, size);
2126 TRIM_OFF_LEN(offset, size, maxfilelen);
2127 dowrite(offset, size);
2131 TRIM_OFF_LEN(offset, size, file_size);
2132 domapread(offset, size);
2136 TRIM_OFF_LEN(offset, size, maxfilelen);
2137 domapwrite(offset, size);
2145 TRIM_OFF_LEN(offset, size, maxfilelen);
2146 do_preallocate(offset, size, keep_size);
2150 TRIM_OFF_LEN(offset, size, file_size);
2151 do_punch_hole(offset, size);
2154 TRIM_OFF_LEN(offset, size, maxfilelen);
2155 do_zero_range(offset, size, keep_size);
2157 case OP_COLLAPSE_RANGE:
2158 TRIM_OFF_LEN(offset, size, file_size - 1);
2159 offset = offset & ~(block_size - 1);
2160 size = size & ~(block_size - 1);
2162 log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
2165 do_collapse_range(offset, size);
2167 case OP_INSERT_RANGE:
2168 TRIM_OFF(offset, file_size);
2169 TRIM_LEN(file_size, size, maxfilelen);
2170 offset = offset & ~(block_size - 1);
2171 size = size & ~(block_size - 1);
2173 log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
2176 if (file_size + size > maxfilelen) {
2177 log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
2181 do_insert_range(offset, size);
2183 case OP_CLONE_RANGE:
2185 log5(OP_CLONE_RANGE, offset, size, offset2, FL_SKIPPED);
2188 if (offset2 + size > maxfilelen) {
2189 log5(OP_CLONE_RANGE, offset, size, offset2, FL_SKIPPED);
2193 do_clone_range(offset, size, offset2);
2195 case OP_DEDUPE_RANGE:
2197 log5(OP_DEDUPE_RANGE, offset, size, offset2, FL_SKIPPED);
2200 if (offset2 + size > maxfilelen) {
2201 log5(OP_DEDUPE_RANGE, offset, size, offset2, FL_SKIPPED);
2205 do_dedupe_range(offset, size, offset2);
2209 log5(OP_COPY_RANGE, offset, size, offset2, FL_SKIPPED);
2212 if (offset2 + size > maxfilelen) {
2213 log5(OP_COPY_RANGE, offset, size, offset2, FL_SKIPPED);
2217 do_copy_range(offset, size, offset2);
2223 prterr("test: unknown operation");
2228 if (check_file && testcalls > simulatedopcount)
2234 if (sizechecks && testcalls > simulatedopcount)
2243 fprintf(stdout, "usage: %s",
2244 "fsx [-dknqxBEFJLOWZ][-A|-U] [-b opnum] [-c Prob] [-g filldata] [-i logdev] [-j logid] [-l flen] [-m start:end] [-o oplen] [-p progressinterval] [-r readbdy] [-s style] [-t truncbdy] [-w writebdy] [-D startingop] [-N numops] [-P dirpath] [-S seed] fname\n\
2245 -b opnum: beginning operation number (default 1)\n\
2246 -c P: 1 in P chance of file close+open at each op (default infinity)\n\
2247 -d: debug output for all operations\n\
2248 -f flush and invalidate cache after I/O\n\
2249 -g X: write character X instead of random generated data\n\
2250 -i logdev: do integrity testing, logdev is the dm log writes device\n\
2251 -j logid: prefix debug log messsages with this id\n\
2252 -k: do not truncate existing file and use its size as upper bound on file size\n\
2253 -l flen: the upper bound on file size (default 262144)\n\
2254 -m startop:endop: monitor (print debug output) specified byte range (default 0:infinity)\n\
2255 -n: no verifications of file size\n\
2256 -o oplen: the upper bound on operation size (default 65536)\n\
2257 -p progressinterval: debug output at specified operation interval\n\
2258 -q: quieter operation\n\
2259 -r readbdy: 4096 would make reads page aligned (default 1)\n\
2260 -s style: 1 gives smaller truncates (default 0)\n\
2261 -t truncbdy: 4096 would make truncates page aligned (default 1)\n\
2262 -w writebdy: 4096 would make writes page aligned (default 1)\n\
2263 -x: preallocate file space before starting, XFS only (default 0)\n\
2264 -y synchronize changes to a file\n"
2267 " -A: Use the AIO system calls, -A excludes -U\n"
2270 " -U: Use the IO_URING system calls, -U excludes -A\n"
2272 " -D startingop: debug output starting at specified operation\n"
2273 #ifdef HAVE_LINUX_FALLOC_H
2274 " -F: Do not use fallocate (preallocation) calls\n"
2276 #ifdef FALLOC_FL_PUNCH_HOLE
2277 " -H: Do not use punch hole calls\n"
2279 #ifdef FALLOC_FL_ZERO_RANGE
2280 " -z: Do not use zero range calls\n"
2282 #ifdef FALLOC_FL_COLLAPSE_RANGE
2283 " -C: Do not use collapse range calls\n"
2285 #ifdef FALLOC_FL_INSERT_RANGE
2286 " -I: Do not use insert range calls\n"
2289 " -J: Do not use clone range calls\n"
2291 #ifdef FIDEDUPERANGE
2292 " -B: Do not use dedupe range calls\n"
2294 #ifdef HAVE_COPY_FILE_RANGE
2295 " -E: Do not use copy range calls\n"
2297 " -L: fsxLite - no file creations & no file size changes\n\
2298 -N numops: total # operations to do (default infinity)\n\
2299 -O: use oplen (see -o flag) for every op (default random)\n\
2300 -P: save .fsxlog .fsxops and .fsxgood files in dirpath (default ./)\n\
2301 -S seed: for random # generator (default 1) 0 gets timestamp\n\
2302 -W: mapped write operations DISabled\n\
2303 -X: Read file and compare to good buffer after every operation.\n\
2304 -R: read() system calls only (mapped reads disabled)\n\
2305 -Z: O_DIRECT (use -R, -W, -r and -w too)\n\
2306 --replay-ops opsfile: replay ops from recorded .fsxops file\n\
2307 --record-ops[=opsfile]: dump ops file also on success. optionally specify ops file name\n\
2308 fname: this filename is REQUIRED (no default)\n");
2314 getnum(char *s, char **e)
2319 ret = strtoll(s, e, 0);
2349 io_context_t io_ctx;
2356 ret = io_queue_init(QSZ, &io_ctx);
2358 fprintf(stderr, "aio_setup: io_queue_init failed: %s\n",
2366 aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2368 struct io_event event;
2369 static struct timespec ts;
2370 struct iocb *iocbs[] = { &iocb };
2375 io_prep_pread(&iocb, fd, buf, len, offset);
2377 io_prep_pwrite(&iocb, fd, buf, len, offset);
2382 ret = io_submit(io_ctx, 1, iocbs);
2384 fprintf(stderr, "errcode=%d\n", ret);
2385 fprintf(stderr, "aio_rw: io_submit failed: %s\n",
2390 ret = io_getevents(io_ctx, 1, 1, &event, &ts);
2393 fprintf(stderr, "aio_rw: no events available\n");
2395 fprintf(stderr, "errcode=%d\n", -ret);
2396 fprintf(stderr, "aio_rw: io_getevents failed: %s\n",
2401 if (len != event.res) {
2403 * The b0rked libaio defines event.res as unsigned.
2404 * However, the kernel structure has it signed,
2405 * and it is used to pass a negated error value.
2406 * Until the library is fixed, use the temp var.
2408 res = (long)event.res;
2410 fprintf(stderr, "bad io length: %lu instead of %u\n",
2413 fprintf(stderr, "errcode=%ld\n", -res);
2414 fprintf(stderr, "aio_rw: async io failed: %s\n",
2425 * The caller expects errors to follow the traditional libc
2426 * convention, i.e. a return of -1 with errno set to the error.
2432 aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2434 fprintf(stderr, "io_rw: need AIO support!\n");
2441 struct io_uring ring;
2442 #define URING_ENTRIES 1024
2449 ret = io_uring_queue_init(URING_ENTRIES, &ring, 0);
2451 fprintf(stderr, "uring_setup: io_uring_queue_init failed: %s\n",
2459 uring_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2461 struct io_uring_sqe *sqe;
2462 struct io_uring_cqe *cqe;
2468 unsigned o = offset;
2471 * Because io_uring tries non-blocking I/O (especially for reads),
2472 * 'normal' short reads always occur. To avoid failing on such a
2473 * short read, try to loop over the read/write (especially read) data.
2476 sqe = io_uring_get_sqe(&ring);
2478 fprintf(stderr, "uring_rw: io_uring_get_sqe failed: %s\n",
2486 io_uring_prep_readv(sqe, fd, &iovec, 1, o);
2488 io_uring_prep_writev(sqe, fd, &iovec, 1, o);
2491 ret = io_uring_submit_and_wait(&ring, 1);
2493 fprintf(stderr, "errcode=%d\n", -ret);
2494 fprintf(stderr, "uring %s: io_uring_submit failed: %s\n",
2495 rw == READ ? "read":"write", strerror(-ret));
2499 ret = io_uring_wait_cqe(&ring, &cqe);
2501 fprintf(stderr, "errcode=%d\n", -ret);
2502 fprintf(stderr, "uring %s: io_uring_wait_cqe failed: %s\n",
2503 rw == READ ? "read":"write", strerror(-ret));
2508 io_uring_cqe_seen(&ring, cqe);
2515 } else if (ret < 0) {
2516 fprintf(stderr, "errcode=%d\n", -ret);
2517 fprintf(stderr, "uring %s: io_uring failed: %s\n",
2518 rw == READ ? "read":"write", strerror(-ret));
2521 fprintf(stderr, "uring %s bad io length: %d instead of %u\n",
2522 rw == READ ? "read":"write", res, len);
2530 * The caller expects errors to follow the traditional libc
2531 * convention, i.e. a return of -1 with errno set to the error.
2538 uring_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2540 fprintf(stderr, "io_rw: need IO_URING support!\n");
2546 fsx_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2551 ret = aio_rw(rw, fd, buf, len, offset);
2553 ret = uring_rw(rw, fd, buf, len, offset);
2556 ret = read(fd, buf, len);
2558 ret = write(fd, buf, len);
2563 #define test_fallocate(mode) __test_fallocate(mode, #mode)
2566 __test_fallocate(int mode, const char *mode_str)
2568 #ifdef HAVE_LINUX_FALLOC_H
2571 if (fallocate(fd, mode, file_size, 1) &&
2572 (errno == ENOSYS || errno == EOPNOTSUPP)) {
2575 "main: filesystem does not support "
2576 "fallocate mode %s, disabling!\n",
2580 if (ftruncate(fd, file_size)) {
2581 warn("main: ftruncate");
2590 static struct option longopts[] = {
2591 {"replay-ops", required_argument, 0, 256},
2592 {"record-ops", optional_argument, 0, 255},
2597 main(int argc, char **argv)
2601 char logfile[PATH_MAX];
2602 struct stat statbuf;
2603 int o_flags = O_RDWR|O_CREAT|O_TRUNC;
2608 page_size = getpagesize();
2609 page_mask = page_size - 1;
2610 mmap_mask = page_mask;
2613 setvbuf(stdout, (char *)0, _IOLBF, 0); /* line buffered stdout */
2615 while ((ch = getopt_long(argc, argv,
2616 "b:c:dfg:i:j:kl:m:no:p:qr:s:t:w:xyABD:EFJKHzCILN:OP:RS:UWXZ",
2617 longopts, NULL)) != EOF)
2620 simulatedopcount = getnum(optarg, &endp);
2622 prt("Will begin at operation %lld\n",
2624 if (simulatedopcount == 0)
2626 simulatedopcount -= 1;
2629 closeprob = getnum(optarg, &endp);
2631 prt("Chance of close/open is 1 in %d\n", closeprob);
2646 logdev = strdup(optarg);
2653 logid = strdup(optarg);
2660 o_flags &= ~O_TRUNC;
2663 maxfilelen = getnum(optarg, &endp);
2664 if (maxfilelen <= 0)
2668 monitorstart = getnum(optarg, &endp);
2669 if (monitorstart < 0)
2671 if (!endp || *endp++ != ':')
2673 monitorend = getnum(endp, &endp);
2676 if (monitorend == 0)
2677 monitorend = -1; /* aka infinity */
2683 maxoplen = getnum(optarg, &endp);
2688 progressinterval = getnum(optarg, &endp);
2689 if (progressinterval == 0)
2696 readbdy = getnum(optarg, &endp);
2701 style = getnum(optarg, &endp);
2702 if (style < 0 || style > 1)
2706 truncbdy = getnum(optarg, &endp);
2711 writebdy = getnum(optarg, &endp);
2728 debugstart = getnum(optarg, &endp);
2733 fallocate_calls = 0;
2736 keep_size_calls = 0;
2739 punch_hole_calls = 0;
2742 zero_range_calls = 0;
2745 collapse_range_calls = 0;
2748 insert_range_calls = 0;
2751 clone_range_calls = 0;
2754 dedupe_range_calls = 0;
2757 copy_range_calls = 0;
2761 o_flags &= ~(O_CREAT|O_TRUNC);
2764 numops = getnum(optarg, &endp);
2772 snprintf(dname, sizeof(dname), "%s/", optarg);
2773 dirpath = strlen(dname);
2779 seed = getnum(optarg, &endp);
2781 seed = time(0) % 10000;
2782 seed += (int)getpid();
2790 prt("mapped writes DISABLED\n");
2796 o_direct = O_DIRECT;
2797 o_flags |= O_DIRECT;
2799 case 255: /* --record-ops */
2801 snprintf(opsfile, sizeof(opsfile), "%s", optarg);
2802 recordops = opsfile;
2804 case 256: /* --replay-ops */
2817 fprintf(stderr, "-A and -U shouldn't be used together\n");
2821 if (integrity && !dirpath) {
2822 fprintf(stderr, "option -i <logdev> requires -P <dirpath>\n");
2827 tmp = strdup(fname);
2832 bname = basename(tmp);
2834 signal(SIGHUP, cleanup);
2835 signal(SIGINT, cleanup);
2836 signal(SIGPIPE, cleanup);
2837 signal(SIGALRM, cleanup);
2838 signal(SIGTERM, cleanup);
2839 signal(SIGXCPU, cleanup);
2840 signal(SIGXFSZ, cleanup);
2841 signal(SIGVTALRM, cleanup);
2842 signal(SIGUSR1, cleanup);
2843 signal(SIGUSR2, cleanup);
2846 prt("Seed set to %d\n", seed);
2848 fd = open(fname, o_flags, 0666);
2853 if (fstat(fd, &statbuf)) {
2854 prterr("check_size: fstat");
2857 block_size = statbuf.st_blksize;
2860 xfs_flock64_t resv = { 0 };
2861 #ifdef HAVE_XFS_PLATFORM_DEFS_H
2862 if (!platform_test_xfs_fd(fd)) {
2864 fprintf(stderr, "main: cannot prealloc, non XFS\n");
2868 resv.l_len = maxfilelen;
2869 if ((xfsctl(fname, fd, XFS_IOC_RESVSP, &resv)) < 0) {
2877 snprintf(goodfile, sizeof(goodfile), "%s%s.fsxgood", dname, bname);
2878 snprintf(logfile, sizeof(logfile), "%s%s.fsxlog", dname, bname);
2880 snprintf(opsfile, sizeof(opsfile), "%s%s.fsxops", dname, bname);
2882 snprintf(goodfile, sizeof(goodfile), "%s.fsxgood", fname);
2883 snprintf(logfile, sizeof(logfile), "%s.fsxlog", fname);
2885 snprintf(opsfile, sizeof(opsfile), "%s.fsxops", fname);
2887 fsxgoodfd = open(goodfile, O_RDWR|O_CREAT|O_TRUNC, 0666);
2888 if (fsxgoodfd < 0) {
2892 fsxlogf = fopen(logfile, "w");
2893 if (fsxlogf == NULL) {
2900 replayopsf = fopen(replayops, "r");
2916 if (!(o_flags & O_TRUNC)) {
2918 file_size = maxfilelen = biggest = lseek(fd, (off_t)0, SEEK_END);
2919 if (file_size == (off_t)-1) {
2921 warn("main: lseek eof");
2924 ret = lseek(fd, (off_t)0, SEEK_SET);
2925 if (ret == (off_t)-1) {
2927 warn("main: lseek 0");
2931 original_buf = (char *) malloc(maxfilelen);
2932 for (i = 0; i < maxfilelen; i++)
2933 original_buf[i] = random() % 256;
2934 good_buf = (char *) malloc(maxfilelen + writebdy);
2935 good_buf = round_ptr_up(good_buf, writebdy, 0);
2936 memset(good_buf, '\0', maxfilelen);
2937 temp_buf = (char *) malloc(maxoplen + readbdy);
2938 temp_buf = round_ptr_up(temp_buf, readbdy, 0);
2939 memset(temp_buf, '\0', maxoplen);
2940 if (lite) { /* zero entire existing file */
2943 written = write(fd, good_buf, (size_t)maxfilelen);
2944 if (written != maxfilelen) {
2945 if (written == -1) {
2947 warn("main: error on write");
2949 warn("main: short write, 0x%x bytes instead "
2956 ssize_t ret, len = file_size;
2960 ret = read(fd, good_buf + off, len);
2963 warn("main: error on read");
2973 if (fallocate_calls)
2974 fallocate_calls = test_fallocate(0);
2975 if (keep_size_calls)
2976 keep_size_calls = test_fallocate(FALLOC_FL_KEEP_SIZE);
2977 if (punch_hole_calls)
2978 punch_hole_calls = test_fallocate(FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE);
2979 if (zero_range_calls)
2980 zero_range_calls = test_fallocate(FALLOC_FL_ZERO_RANGE);
2981 if (collapse_range_calls)
2982 collapse_range_calls = test_fallocate(FALLOC_FL_COLLAPSE_RANGE);
2983 if (insert_range_calls)
2984 insert_range_calls = test_fallocate(FALLOC_FL_INSERT_RANGE);
2985 if (clone_range_calls)
2986 clone_range_calls = test_clone_range();
2987 if (dedupe_range_calls)
2988 dedupe_range_calls = test_dedupe_range();
2989 if (copy_range_calls)
2990 copy_range_calls = test_copy_range();
2992 while (numops == -1 || numops--)
3001 prt("All %lld operations completed A-OK!\n", testcalls);