2 * Copyright (C) 1991, NeXT Computer, Inc. All Rights Reserved.
5 * Author: Avadis Tevanian, Jr.
7 * File system exerciser.
9 * Rewritten 8/98 by Conrad Minshall.
11 * Small changes to work under Linux -- davej.
13 * Checks for mmap last-page zero fill.
37 #include <sys/syscall.h>
43 #define NUMPRINTCOLUMNS 32 /* # columns of data to print on each line */
/*
 * Per-operation flags recorded with a log entry.  Each non-zero value is a
 * distinct bit, so flags are combined with |= and tested with & elsewhere in
 * this file.  FL_SKIPPED entries are dumped as "SKIPPED (no operation)";
 * FL_CLOSE_OPEN and FL_KEEP_SIZE are written to the ops log as the
 * "close_open" and "keep_size" keywords.
 */
47 enum opflags { FL_NONE = 0, FL_SKIPPED = 1, FL_CLOSE_OPEN = 2, FL_KEEP_SIZE = 4 };
50 * A log entry is an operation and a bunch of arguments.
62 struct log_entry oplog[LOGSIZE]; /* the log */
63 int logptr = 0; /* current position in log */
64 int logcount = 0; /* total ops */
67 * The operation matrix is complex due to conditional execution of different
68 * features. Hence when we come to deciding what operation to run, we need to
69 * be careful in how we select the different operations. The active operations
70 * are mapped to numbers as follows:
72 * lite !lite integrity
81 * COLLAPSE RANGE: - 8 8
84 * When mapped read/writes are disabled, they are simply converted to normal
85 * reads and writes. When fallocate/fpunch calls are disabled, they are
88 * Because of the "lite" version, we also need to have different "maximum
89 * operation" defines to allow the ops to be selected correctly based on the
94 /* common operations */
101 /* !lite operations */
102 OP_TRUNCATE = OP_MAX_LITE,
113 /* integrity operations */
114 OP_FSYNC = OP_MAX_FULL,
/*
 * PAGE_SIZE is not a constant here: every use expands to a getpagesize()
 * call.  PAGE_MASK is PAGE_SIZE - 1 and is ANDed with a file offset to get
 * the offset within its page (see the mmap paths); that only works if the
 * page size is a power of two -- NOTE(review): assumed, not checked here.
 */
119 #define PAGE_SIZE getpagesize()
121 #define PAGE_MASK (PAGE_SIZE - 1)
123 char *original_buf; /* a pointer to the original data */
124 char *good_buf; /* a pointer to the correct data */
125 char *temp_buf; /* a pointer to the current data */
126 char *fname; /* name of our test file */
127 char *bname; /* basename of our test file */
128 char *logdev; /* -i flag */
129 char *logid; /* -j flag */
130 char dname[1024]; /* -P flag */
131 char goodfile[PATH_MAX];
132 int dirpath = 0; /* -P flag */
133 int fd; /* fd for our test file */
135 blksize_t block_size = 0;
138 long long testcalls = 0; /* calls to function "test" */
140 long long simulatedopcount = 0; /* -b flag */
141 int closeprob = 0; /* -c flag */
142 int debug = 0; /* -d flag */
143 long long debugstart = 0; /* -D flag */
144 char filldata = 0; /* -g flag */
145 int flush = 0; /* -f flag */
146 int do_fsync = 0; /* -y flag */
147 unsigned long maxfilelen = 256 * 1024; /* -l flag */
148 int sizechecks = 1; /* -n flag disables them */
149 int maxoplen = 64 * 1024; /* -o flag */
150 int quiet = 0; /* -q flag */
151 long long progressinterval = 0; /* -p flag */
152 int readbdy = 1; /* -r flag */
153 int style = 0; /* -s flag */
154 int prealloc = 0; /* -x flag */
155 int truncbdy = 1; /* -t flag */
156 int writebdy = 1; /* -w flag */
157 long monitorstart = -1; /* -m flag */
158 long monitorend = -1; /* -m flag */
159 int lite = 0; /* -L flag */
160 long long numops = -1; /* -N flag */
161 int randomoplen = 1; /* -O flag disables it */
162 int seed = 1; /* -S flag */
163 int mapped_writes = 1; /* -W flag disables */
164 int fallocate_calls = 1; /* -F flag disables */
165 int keep_size_calls = 1; /* -K flag disables */
166 int punch_hole_calls = 1; /* -H flag disables */
167 int zero_range_calls = 1; /* -z flag disables */
168 int collapse_range_calls = 1; /* -C flag disables */
169 int insert_range_calls = 1; /* -I flag disables */
170 int mapped_reads = 1; /* -R flag disables it */
171 int check_file = 0; /* -X flag enables */
172 int clone_range_calls = 1; /* -J flag disables */
173 int dedupe_range_calls = 1; /* -B flag disables */
174 int copy_range_calls = 1; /* -E flag disables */
175 int integrity = 0; /* -i flag */
177 int o_direct; /* -Z */
185 int aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset);
188 #define fsxread(a,b,c,d) aio_rw(READ, a,b,c,d)
189 #define fsxwrite(a,b,c,d) aio_rw(WRITE, a,b,c,d)
191 #define fsxread(a,b,c,d) read(a,b,c)
192 #define fsxwrite(a,b,c,d) write(a,b,c)
195 const char *replayops = NULL;
196 const char *recordops = NULL;
197 FILE * fsxlogf = NULL;
198 FILE * replayopsf = NULL;
199 char opsfile[PATH_MAX];
203 static void *round_ptr_up(void *ptr, unsigned long align, unsigned long offset)
205 unsigned long ret = (unsigned long)ptr;
207 ret = ((ret + align - 1) & ~(align - 1));
213 vwarnc(int code, const char *fmt, va_list ap)
216 fprintf(stderr, "%s: ", logid);
217 fprintf(stderr, "fsx: ");
219 vfprintf(stderr, fmt, ap);
220 fprintf(stderr, ": ");
222 fprintf(stderr, "%s\n", strerror(code));
226 warn(const char * fmt, ...) {
229 vwarnc(errno, fmt, ap);
234 prt(const char *fmt, ...)
239 fprintf(stdout, "%s: ", logid);
241 vfprintf(stdout, fmt, args);
245 vfprintf(fsxlogf, fmt, args);
251 prterr(const char *prefix)
253 prt("%s%s%s\n", prefix, prefix ? ": " : "", strerror(errno));
257 static const char *op_names[] = {
259 [OP_WRITE] = "write",
260 [OP_MAPREAD] = "mapread",
261 [OP_MAPWRITE] = "mapwrite",
262 [OP_TRUNCATE] = "truncate",
263 [OP_FALLOCATE] = "fallocate",
264 [OP_PUNCH_HOLE] = "punch_hole",
265 [OP_ZERO_RANGE] = "zero_range",
266 [OP_COLLAPSE_RANGE] = "collapse_range",
267 [OP_INSERT_RANGE] = "insert_range",
268 [OP_CLONE_RANGE] = "clone_range",
269 [OP_DEDUPE_RANGE] = "dedupe_range",
270 [OP_COPY_RANGE] = "copy_range",
271 [OP_FSYNC] = "fsync",
274 static const char *op_name(int operation)
276 if (operation >= 0 &&
277 operation < sizeof(op_names) / sizeof(op_names[0]))
278 return op_names[operation];
282 static int op_code(const char *name)
286 for (i = 0; i < sizeof(op_names) / sizeof(op_names[0]); i++)
287 if (op_names[i] && strcmp(name, op_names[i]) == 0)
293 log5(int operation, int arg0, int arg1, int arg2, enum opflags flags)
295 struct log_entry *le;
298 le->operation = operation;
300 flags |= FL_CLOSE_OPEN;
304 le->args[3] = file_size;
309 if (logptr >= LOGSIZE)
314 log4(int operation, int arg0, int arg1, enum opflags flags)
316 struct log_entry *le;
319 le->operation = operation;
321 flags |= FL_CLOSE_OPEN;
324 le->args[2] = file_size;
329 if (logptr >= LOGSIZE)
338 struct log_entry *lp;
340 prt("LOG DUMP (%d total operations):\n", logcount);
342 logopsf = fopen(opsfile, "w");
346 if (logcount < LOGSIZE) {
353 for ( ; count > 0; count--) {
354 bool overlap, overlap2;
357 opnum = i+1 + (logcount/LOGSIZE)*LOGSIZE;
358 prt("%d(%3d mod 256): ", opnum, opnum%256);
361 overlap = badoff >= lp->args[0] &&
362 badoff < lp->args[0] + lp->args[1];
364 if (lp->flags & FL_SKIPPED) {
365 prt("SKIPPED (no operation)");
369 switch (lp->operation) {
371 prt("MAPREAD 0x%x thru 0x%x\t(0x%x bytes)",
372 lp->args[0], lp->args[0] + lp->args[1] - 1,
378 prt("MAPWRITE 0x%x thru 0x%x\t(0x%x bytes)",
379 lp->args[0], lp->args[0] + lp->args[1] - 1,
385 prt("READ 0x%x thru 0x%x\t(0x%x bytes)",
386 lp->args[0], lp->args[0] + lp->args[1] - 1,
392 prt("WRITE 0x%x thru 0x%x\t(0x%x bytes)",
393 lp->args[0], lp->args[0] + lp->args[1] - 1,
395 if (lp->args[0] > lp->args[2])
397 else if (lp->args[0] + lp->args[1] > lp->args[2])
399 overlap = (badoff >= lp->args[0] ||
400 badoff >=lp->args[2]) &&
401 badoff < lp->args[0] + lp->args[1];
406 down = lp->args[1] < lp->args[2];
407 prt("TRUNCATE %s\tfrom 0x%x to 0x%x",
408 down ? "DOWN" : "UP", lp->args[2], lp->args[1]);
409 overlap = badoff >= lp->args[1 + !down] &&
410 badoff < lp->args[1 + !!down];
415 /* 0: offset 1: length 2: where alloced */
416 prt("FALLOC 0x%x thru 0x%x\t(0x%x bytes) ",
417 lp->args[0], lp->args[0] + lp->args[1],
419 if (lp->args[0] + lp->args[1] <= lp->args[2])
421 else if (lp->flags & FL_KEEP_SIZE)
429 prt("PUNCH 0x%x thru 0x%x\t(0x%x bytes)",
430 lp->args[0], lp->args[0] + lp->args[1] - 1,
436 prt("ZERO 0x%x thru 0x%x\t(0x%x bytes)",
437 lp->args[0], lp->args[0] + lp->args[1] - 1,
442 case OP_COLLAPSE_RANGE:
443 prt("COLLAPSE 0x%x thru 0x%x\t(0x%x bytes)",
444 lp->args[0], lp->args[0] + lp->args[1] - 1,
449 case OP_INSERT_RANGE:
450 prt("INSERT 0x%x thru 0x%x\t(0x%x bytes)",
451 lp->args[0], lp->args[0] + lp->args[1] - 1,
457 prt("CLONE 0x%x thru 0x%x\t(0x%x bytes) to 0x%x thru 0x%x",
458 lp->args[0], lp->args[0] + lp->args[1] - 1,
460 lp->args[2], lp->args[2] + lp->args[1] - 1);
461 overlap2 = badoff >= lp->args[2] &&
462 badoff < lp->args[2] + lp->args[1];
463 if (overlap && overlap2)
470 case OP_DEDUPE_RANGE:
471 prt("DEDUPE 0x%x thru 0x%x\t(0x%x bytes) to 0x%x thru 0x%x",
472 lp->args[0], lp->args[0] + lp->args[1] - 1,
474 lp->args[2], lp->args[2] + lp->args[1] - 1);
475 overlap2 = badoff >= lp->args[2] &&
476 badoff < lp->args[2] + lp->args[1];
477 if (overlap && overlap2)
485 prt("COPY 0x%x thru 0x%x\t(0x%x bytes) to 0x%x thru 0x%x",
486 lp->args[0], lp->args[0] + lp->args[1] - 1,
488 lp->args[2], lp->args[2] + lp->args[1] - 1);
489 overlap2 = badoff >= lp->args[2] &&
490 badoff < lp->args[2] + lp->args[1];
491 if (overlap && overlap2)
502 prt("BOGUS LOG ENTRY (operation code = %d)!",
508 if (lp->flags & FL_CLOSE_OPEN)
509 prt("\n\t\tCLOSE/OPEN");
518 if (lp->flags & FL_SKIPPED)
519 fprintf(logopsf, "skip ");
520 fprintf(logopsf, "%s", op_name(lp->operation));
521 for (j = 0; j < lp->nr_args; j++)
522 fprintf(logopsf, " 0x%x", lp->args[j]);
523 if (lp->flags & FL_KEEP_SIZE)
524 fprintf(logopsf, " keep_size");
525 if (lp->flags & FL_CLOSE_OPEN)
526 fprintf(logopsf, " close_open");
528 fprintf(logopsf, " *");
529 fprintf(logopsf, "\n");
534 if (fclose(logopsf) != 0)
537 prt("Log of operations saved to \"%s\"; "
538 "replay with --replay-ops\n",
545 save_buffer(char *buffer, off_t bufferlength, int fd)
548 ssize_t byteswritten;
550 if (fd <= 0 || bufferlength == 0)
553 if (bufferlength > SSIZE_MAX) {
554 prt("fsx flaw: overflow in save_buffer\n");
558 off_t size_by_seek = lseek(fd, (off_t)0, SEEK_END);
559 if (size_by_seek == (off_t)-1)
560 prterr("save_buffer: lseek eof");
561 else if (bufferlength > size_by_seek) {
562 warn("save_buffer: .fsxgood file too short... will save 0x%llx bytes instead of 0x%llx\n", (unsigned long long)size_by_seek,
563 (unsigned long long)bufferlength);
564 bufferlength = size_by_seek;
568 ret = lseek(fd, (off_t)0, SEEK_SET);
569 if (ret == (off_t)-1)
570 prterr("save_buffer: lseek 0");
572 byteswritten = write(fd, buffer, (size_t)bufferlength);
573 if (byteswritten != bufferlength) {
574 if (byteswritten == -1)
575 prterr("save_buffer write");
577 warn("save_buffer: short write, 0x%x bytes instead of 0x%llx\n",
578 (unsigned)byteswritten,
579 (unsigned long long)bufferlength);
585 report_failure(int status)
591 save_buffer(good_buf, file_size, fsxgoodfd);
592 prt("Correct content saved for comparison\n");
593 prt("(maybe hexdump \"%s\" vs \"%s\")\n",
/*
 * Read the two bytes at cp as an unsigned 16-bit value, first byte in the
 * high 8 bits and second byte in the low 8 bits.  Bytes are accessed as
 * unsigned char, so no alignment is required and char signedness does not
 * matter.  The argument is expanded twice; do not pass an expression with
 * side effects.
 */
602 #define short_at(cp) ((unsigned short)((*((unsigned char *)(cp)) << 8) | \
603 *(((unsigned char *)(cp)) + 1)))
611 snprintf(command, 256, "dmsetup message %s 0 mark %s.mark%d", logdev,
613 ret = system(command);
615 prterr("dmsetup mark failed");
621 dump_fsync_buffer(void)
623 char fname_buffer[PATH_MAX];
629 snprintf(fname_buffer, sizeof(fname_buffer), "%s%s.mark%d", dname,
631 good_fd = open(fname_buffer, O_WRONLY|O_CREAT|O_TRUNC, 0666);
633 prterr(fname_buffer);
637 save_buffer(good_buf, file_size, good_fd);
639 prt("Dumped fsync buffer to %s\n", fname_buffer + dirpath);
643 check_buffers(char *buf, unsigned offset, unsigned size)
651 if (memcmp(good_buf + offset, buf, size) != 0) {
652 prt("READ BAD DATA: offset = 0x%x, size = 0x%x, fname = %s\n",
653 offset, size, fname);
654 prt("OFFSET\tGOOD\tBAD\tRANGE\n");
656 c = good_buf[offset];
660 bad = short_at(&buf[i]);
661 prt("0x%05x\t0x%04x\t0x%04x", offset,
662 short_at(&good_buf[offset]), bad);
663 op = buf[offset & 1 ? i+1 : i];
664 prt("\t0x%05x\n", n);
666 prt("operation# (mod 256) for "
667 "the bad data may be %u\n",
668 ((unsigned)op & 0xff));
670 prt("operation# (mod 256) for "
671 "the bad data unknown, check"
672 " HOLE and EXTEND ops\n");
692 if (fstat(fd, &statbuf)) {
693 prterr("check_size: fstat");
694 statbuf.st_size = -1;
696 size_by_seek = lseek(fd, (off_t)0, SEEK_END);
697 if (file_size != statbuf.st_size || file_size != size_by_seek) {
698 prt("Size error: expected 0x%llx stat 0x%llx seek 0x%llx\n",
699 (unsigned long long)file_size,
700 (unsigned long long)statbuf.st_size,
701 (unsigned long long)size_by_seek);
708 check_trunc_hack(void)
711 off_t offset = file_size + (off_t)100000;
713 if (ftruncate(fd, file_size))
715 if (ftruncate(fd, offset))
718 if (statbuf.st_size != offset) {
719 prt("no extend on truncate! not posix!\n");
722 if (ftruncate(fd, file_size)) {
724 prterr("check_trunc_hack: ftruncate");
730 doflush(unsigned offset, unsigned size)
736 if (o_direct == O_DIRECT)
739 pg_offset = offset & mmap_mask;
740 map_size = pg_offset + size;
742 if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
743 MAP_FILE | MAP_SHARED, fd,
744 (off_t)(offset - pg_offset))) == (char *)-1) {
745 prterr("doflush: mmap");
748 if (msync(p, map_size, MS_INVALIDATE) != 0) {
749 prterr("doflush: msync");
752 if (munmap(p, map_size) != 0) {
753 prterr("doflush: munmap");
759 doread(unsigned offset, unsigned size)
764 offset -= offset % readbdy;
766 size -= size % readbdy;
768 if (!quiet && testcalls > simulatedopcount && !o_direct)
769 prt("skipping zero size read\n");
770 log4(OP_READ, offset, size, FL_SKIPPED);
773 if (size + offset > file_size) {
774 if (!quiet && testcalls > simulatedopcount)
775 prt("skipping seek/read past end of file\n");
776 log4(OP_READ, offset, size, FL_SKIPPED);
780 log4(OP_READ, offset, size, FL_NONE);
782 if (testcalls <= simulatedopcount)
786 ((progressinterval && testcalls % progressinterval == 0) ||
788 (monitorstart == -1 ||
789 (offset + size > monitorstart &&
790 (monitorend == -1 || offset <= monitorend))))))
791 prt("%lld read\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
792 offset, offset + size - 1, size);
793 ret = lseek(fd, (off_t)offset, SEEK_SET);
794 if (ret == (off_t)-1) {
795 prterr("doread: lseek");
798 iret = fsxread(fd, temp_buf, size, offset);
801 prterr("doread: read");
803 prt("short read: 0x%x bytes instead of 0x%x\n",
807 check_buffers(temp_buf, offset, size);
811 check_eofpage(char *s, unsigned offset, char *p, int size)
813 unsigned long last_page, should_be_zero;
815 if (offset + size <= (file_size & ~page_mask))
818 * we landed in the last page of the file
819 * test to make sure the VM system provided 0's
820 * beyond the true end of the file mapping
821 * (as required by mmap def in 1996 posix 1003.1)
823 last_page = ((unsigned long)p + (offset & page_mask) + size) & ~page_mask;
825 for (should_be_zero = last_page + (file_size & page_mask);
826 should_be_zero < last_page + page_size;
828 if (*(char *)should_be_zero) {
829 prt("Mapped %s: non-zero data past EOF (0x%llx) page offset 0x%x is 0x%04x\n",
830 s, file_size - 1, should_be_zero & page_mask,
831 short_at(should_be_zero));
839 static char *check_buf;
841 unsigned size = file_size;
849 check_buf = (char *) malloc(maxfilelen + writebdy);
850 assert(check_buf != NULL);
851 check_buf = round_ptr_up(check_buf, writebdy, 0);
852 memset(check_buf, '\0', maxfilelen);
856 size -= size % readbdy;
860 ret = lseek(fd, (off_t)offset, SEEK_SET);
861 if (ret == (off_t)-1) {
862 prterr("doread: lseek");
866 iret = fsxread(fd, check_buf, size, offset);
869 prterr("check_contents: read");
871 prt("short check read: 0x%x bytes instead of 0x%x\n",
875 check_buffers(check_buf, offset, size);
877 /* Map eof page, check it */
878 map_offset = size - (size & PAGE_MASK);
879 if (map_offset == size)
880 map_offset -= PAGE_SIZE;
881 map_size = size - map_offset;
883 p = mmap(0, map_size, PROT_READ, MAP_SHARED, fd, map_offset);
884 if (p == MAP_FAILED) {
885 prterr("check_contents: mmap");
888 check_eofpage("check_contents", map_offset, p, map_size);
890 if (munmap(p, map_size) != 0) {
891 prterr("check_contents: munmap");
897 domapread(unsigned offset, unsigned size)
903 offset -= offset % readbdy;
905 if (!quiet && testcalls > simulatedopcount)
906 prt("skipping zero size read\n");
907 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
910 if (size + offset > file_size) {
911 if (!quiet && testcalls > simulatedopcount)
912 prt("skipping seek/read past end of file\n");
913 log4(OP_MAPREAD, offset, size, FL_SKIPPED);
917 log4(OP_MAPREAD, offset, size, FL_NONE);
919 if (testcalls <= simulatedopcount)
923 ((progressinterval && testcalls % progressinterval == 0) ||
925 (monitorstart == -1 ||
926 (offset + size > monitorstart &&
927 (monitorend == -1 || offset <= monitorend))))))
928 prt("%lld mapread\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
929 offset, offset + size - 1, size);
931 pg_offset = offset & PAGE_MASK;
932 map_size = pg_offset + size;
934 if ((p = (char *)mmap(0, map_size, PROT_READ, MAP_SHARED, fd,
935 (off_t)(offset - pg_offset))) == (char *)-1) {
936 prterr("domapread: mmap");
939 memcpy(temp_buf, p + pg_offset, size);
941 check_eofpage("Read", offset, p, size);
943 if (munmap(p, map_size) != 0) {
944 prterr("domapread: munmap");
948 check_buffers(temp_buf, offset, size);
953 gendata(char *original_buf, char *good_buf, unsigned offset, unsigned size)
957 good_buf[offset] = filldata;
959 good_buf[offset] = testcalls % 256;
961 good_buf[offset] += original_buf[offset];
969 dowrite(unsigned offset, unsigned size)
974 offset -= offset % writebdy;
976 size -= size % writebdy;
978 if (!quiet && testcalls > simulatedopcount && !o_direct)
979 prt("skipping zero size write\n");
980 log4(OP_WRITE, offset, size, FL_SKIPPED);
984 log4(OP_WRITE, offset, size, FL_NONE);
986 gendata(original_buf, good_buf, offset, size);
987 if (file_size < offset + size) {
988 if (file_size < offset)
989 memset(good_buf + file_size, '\0', offset - file_size);
990 file_size = offset + size;
992 warn("Lite file size bug in fsx!");
997 if (testcalls <= simulatedopcount)
1001 ((progressinterval && testcalls % progressinterval == 0) ||
1003 (monitorstart == -1 ||
1004 (offset + size > monitorstart &&
1005 (monitorend == -1 || offset <= monitorend))))))
1006 prt("%lld write\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
1007 offset, offset + size - 1, size);
1008 ret = lseek(fd, (off_t)offset, SEEK_SET);
1009 if (ret == (off_t)-1) {
1010 prterr("dowrite: lseek");
1011 report_failure(150);
1013 iret = fsxwrite(fd, good_buf + offset, size, offset);
1016 prterr("dowrite: write");
1018 prt("short write: 0x%x bytes instead of 0x%x\n",
1020 report_failure(151);
1024 prt("fsync() failed: %s\n", strerror(errno));
1025 report_failure(152);
1029 doflush(offset, size);
1035 domapwrite(unsigned offset, unsigned size)
1042 offset -= offset % writebdy;
1044 if (!quiet && testcalls > simulatedopcount)
1045 prt("skipping zero size write\n");
1046 log4(OP_MAPWRITE, offset, size, FL_SKIPPED);
1049 cur_filesize = file_size;
1051 log4(OP_MAPWRITE, offset, size, FL_NONE);
1053 gendata(original_buf, good_buf, offset, size);
1054 if (file_size < offset + size) {
1055 if (file_size < offset)
1056 memset(good_buf + file_size, '\0', offset - file_size);
1057 file_size = offset + size;
1059 warn("Lite file size bug in fsx!");
1060 report_failure(200);
1064 if (testcalls <= simulatedopcount)
1068 ((progressinterval && testcalls % progressinterval == 0) ||
1070 (monitorstart == -1 ||
1071 (offset + size > monitorstart &&
1072 (monitorend == -1 || offset <= monitorend))))))
1073 prt("%lld mapwrite\t0x%x thru\t0x%x\t(0x%x bytes)\n", testcalls,
1074 offset, offset + size - 1, size);
1076 if (file_size > cur_filesize) {
1077 if (ftruncate(fd, file_size) == -1) {
1078 prterr("domapwrite: ftruncate");
1082 pg_offset = offset & PAGE_MASK;
1083 map_size = pg_offset + size;
1085 if ((p = (char *)mmap(0, map_size, PROT_READ | PROT_WRITE,
1086 MAP_FILE | MAP_SHARED, fd,
1087 (off_t)(offset - pg_offset))) == (char *)-1) {
1088 prterr("domapwrite: mmap");
1089 report_failure(202);
1091 memcpy(p + pg_offset, good_buf + offset, size);
1092 if (msync(p, map_size, MS_SYNC) != 0) {
1093 prterr("domapwrite: msync");
1094 report_failure(203);
1097 check_eofpage("Write", offset, p, size);
1099 if (munmap(p, map_size) != 0) {
1100 prterr("domapwrite: munmap");
1101 report_failure(204);
1107 dotruncate(unsigned size)
1109 int oldsize = file_size;
1111 size -= size % truncbdy;
1112 if (size > biggest) {
1114 if (!quiet && testcalls > simulatedopcount)
1115 prt("truncating to largest ever: 0x%x\n", size);
1118 log4(OP_TRUNCATE, 0, size, FL_NONE);
1120 if (size > file_size)
1121 memset(good_buf + file_size, '\0', size - file_size);
1124 if (testcalls <= simulatedopcount)
1127 if ((progressinterval && testcalls % progressinterval == 0) ||
1128 (debug && (monitorstart == -1 || monitorend == -1 ||
1129 size <= monitorend)))
1130 prt("%lld trunc\tfrom 0x%x to 0x%x\n", testcalls, oldsize,
1132 if (ftruncate(fd, (off_t)size) == -1) {
1133 prt("ftruncate1: %x\n", size);
1134 prterr("dotruncate: ftruncate");
1135 report_failure(160);
1139 #ifdef FALLOC_FL_PUNCH_HOLE
1141 do_punch_hole(unsigned offset, unsigned length)
1143 unsigned end_offset;
1146 int mode = FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE;
1149 if (!quiet && testcalls > simulatedopcount)
1150 prt("skipping zero length punch hole\n");
1151 log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
1155 if (file_size <= (loff_t)offset) {
1156 if (!quiet && testcalls > simulatedopcount)
1157 prt("skipping hole punch off the end of the file\n");
1158 log4(OP_PUNCH_HOLE, offset, length, FL_SKIPPED);
1162 end_offset = offset + length;
1164 log4(OP_PUNCH_HOLE, offset, length, FL_NONE);
1166 if (testcalls <= simulatedopcount)
1169 if ((progressinterval && testcalls % progressinterval == 0) ||
1170 (debug && (monitorstart == -1 || monitorend == -1 ||
1171 end_offset <= monitorend))) {
1172 prt("%lld punch\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1173 offset, offset+length, length);
1175 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1176 prt("punch hole: 0x%x to 0x%x\n", offset, offset + length);
1177 prterr("do_punch_hole: fallocate");
1178 report_failure(161);
1182 max_offset = offset < file_size ? offset : file_size;
1183 max_len = max_offset + length <= file_size ? length :
1184 file_size - max_offset;
1185 memset(good_buf + max_offset, '\0', max_len);
1190 do_punch_hole(unsigned offset, unsigned length)
1196 #ifdef FALLOC_FL_ZERO_RANGE
1198 do_zero_range(unsigned offset, unsigned length, int keep_size)
1200 unsigned end_offset;
1201 int mode = FALLOC_FL_ZERO_RANGE;
1204 mode |= FALLOC_FL_KEEP_SIZE;
1207 if (!quiet && testcalls > simulatedopcount)
1208 prt("skipping zero length zero range\n");
1209 log4(OP_ZERO_RANGE, offset, length, FL_SKIPPED |
1210 (keep_size ? FL_KEEP_SIZE : FL_NONE));
1214 end_offset = keep_size ? 0 : offset + length;
1216 if (end_offset > biggest) {
1217 biggest = end_offset;
1218 if (!quiet && testcalls > simulatedopcount)
1219 prt("zero_range to largest ever: 0x%x\n", end_offset);
1223 * last arg matches fallocate string array index in logdump:
1224 * 0: allocate past EOF
1225 * 1: extending prealloc
1226 * 2: interior prealloc
1228 log4(OP_ZERO_RANGE, offset, length,
1229 keep_size ? FL_KEEP_SIZE : FL_NONE);
1231 if (testcalls <= simulatedopcount)
1234 if ((progressinterval && testcalls % progressinterval == 0) ||
1235 (debug && (monitorstart == -1 || monitorend == -1 ||
1236 end_offset <= monitorend))) {
1237 prt("%lld zero\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1238 offset, offset+length, length);
1240 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1241 prt("zero range: 0x%x to 0x%x\n", offset, offset + length);
1242 prterr("do_zero_range: fallocate");
1243 report_failure(161);
1246 memset(good_buf + offset, '\0', length);
1248 if (!keep_size && end_offset > file_size) {
1250 * If there's a gap between the old file size and the offset of
1251 * the zero range operation, fill the gap with zeroes.
1253 if (offset > file_size)
1254 memset(good_buf + file_size, '\0', offset - file_size);
1256 file_size = end_offset;
1262 do_zero_range(unsigned offset, unsigned length, int keep_size)
1268 #ifdef FALLOC_FL_COLLAPSE_RANGE
1270 do_collapse_range(unsigned offset, unsigned length)
1272 unsigned end_offset;
1273 int mode = FALLOC_FL_COLLAPSE_RANGE;
1276 if (!quiet && testcalls > simulatedopcount)
1277 prt("skipping zero length collapse range\n");
1278 log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
1282 end_offset = offset + length;
1283 if ((loff_t)end_offset >= file_size) {
1284 if (!quiet && testcalls > simulatedopcount)
1285 prt("skipping collapse range behind EOF\n");
1286 log4(OP_COLLAPSE_RANGE, offset, length, FL_SKIPPED);
1290 log4(OP_COLLAPSE_RANGE, offset, length, FL_NONE);
1292 if (testcalls <= simulatedopcount)
1295 if ((progressinterval && testcalls % progressinterval == 0) ||
1296 (debug && (monitorstart == -1 || monitorend == -1 ||
1297 end_offset <= monitorend))) {
1298 prt("%lld collapse\tfrom 0x%x to 0x%x, (0x%x bytes)\n",
1299 testcalls, offset, offset+length, length);
1301 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1302 prt("collapse range: 0x%x to 0x%x\n", offset, offset + length);
1303 prterr("do_collapse_range: fallocate");
1304 report_failure(161);
1307 memmove(good_buf + offset, good_buf + end_offset,
1308 file_size - end_offset);
1309 file_size -= length;
1314 do_collapse_range(unsigned offset, unsigned length)
1320 #ifdef FALLOC_FL_INSERT_RANGE
1322 do_insert_range(unsigned offset, unsigned length)
1324 unsigned end_offset;
1325 int mode = FALLOC_FL_INSERT_RANGE;
1328 if (!quiet && testcalls > simulatedopcount)
1329 prt("skipping zero length insert range\n");
1330 log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
1334 if ((loff_t)offset >= file_size) {
1335 if (!quiet && testcalls > simulatedopcount)
1336 prt("skipping insert range behind EOF\n");
1337 log4(OP_INSERT_RANGE, offset, length, FL_SKIPPED);
1341 log4(OP_INSERT_RANGE, offset, length, FL_NONE);
1343 if (testcalls <= simulatedopcount)
1346 end_offset = offset + length;
1347 if ((progressinterval && testcalls % progressinterval == 0) ||
1348 (debug && (monitorstart == -1 || monitorend == -1 ||
1349 end_offset <= monitorend))) {
1350 prt("%lld insert\tfrom 0x%x to 0x%x, (0x%x bytes)\n", testcalls,
1351 offset, offset+length, length);
1353 if (fallocate(fd, mode, (loff_t)offset, (loff_t)length) == -1) {
1354 prt("insert range: 0x%x to 0x%x\n", offset, offset + length);
1355 prterr("do_insert_range: fallocate");
1356 report_failure(161);
1359 memmove(good_buf + end_offset, good_buf + offset,
1360 file_size - offset);
1361 memset(good_buf + offset, '\0', length);
1362 file_size += length;
1367 do_insert_range(unsigned offset, unsigned length)
1375 test_clone_range(void)
1377 struct file_clone_range fcr = {
1381 if (ioctl(fd, FICLONERANGE, &fcr) &&
1382 (errno == EOPNOTSUPP || errno == ENOTTY)) {
1385 "main: filesystem does not support "
1386 "clone range, disabling!\n");
1394 do_clone_range(unsigned offset, unsigned length, unsigned dest)
1396 struct file_clone_range fcr = {
1398 .src_offset = offset,
1399 .src_length = length,
1400 .dest_offset = dest,
1404 if (!quiet && testcalls > simulatedopcount)
1405 prt("skipping zero length clone range\n");
1406 log5(OP_CLONE_RANGE, offset, length, dest, FL_SKIPPED);
1410 if ((loff_t)offset >= file_size) {
1411 if (!quiet && testcalls > simulatedopcount)
1412 prt("skipping clone range behind EOF\n");
1413 log5(OP_CLONE_RANGE, offset, length, dest, FL_SKIPPED);
1417 if (dest + length > biggest) {
1418 biggest = dest + length;
1419 if (!quiet && testcalls > simulatedopcount)
1420 prt("cloning to largest ever: 0x%x\n", dest + length);
1423 log5(OP_CLONE_RANGE, offset, length, dest, FL_NONE);
1425 if (testcalls <= simulatedopcount)
1428 if ((progressinterval && testcalls % progressinterval == 0) ||
1429 (debug && (monitorstart == -1 || monitorend == -1 ||
1430 dest <= monitorstart || dest + length <= monitorend))) {
1431 prt("%lu clone\tfrom 0x%x to 0x%x, (0x%x bytes) at 0x%x\n",
1432 testcalls, offset, offset+length, length, dest);
1435 if (ioctl(fd, FICLONERANGE, &fcr) == -1) {
1436 prt("clone range: 0x%x to 0x%x at 0x%x\n", offset,
1437 offset + length, dest);
1438 prterr("do_clone_range: FICLONERANGE");
1439 report_failure(161);
1442 memcpy(good_buf + dest, good_buf + offset, length);
1443 if (dest > file_size)
1444 memset(good_buf + file_size, '\0', dest - file_size);
1445 if (dest + length > file_size)
1446 file_size = dest + length;
1451 test_clone_range(void)
1457 do_clone_range(unsigned offset, unsigned length, unsigned dest)
1463 #ifdef FIDEDUPERANGE
1465 test_dedupe_range(void)
1467 struct file_dedupe_range *fdr;
1473 fdr = calloc(sizeof(struct file_dedupe_range_info) +
1474 sizeof(struct file_dedupe_range), 1);
1476 prterr("do_dedupe_range: malloc");
1477 report_failure(161);
1480 /* Make sure we have at least two blocks */
1481 new_len = block_size * 2;
1482 if (file_size < new_len && ftruncate(fd, new_len)) {
1483 warn("main: ftruncate");
1487 /* Try to dedupe them */
1488 fdr->src_length = block_size;
1489 fdr->dest_count = 1;
1490 fdr->info[0].dest_fd = fd;
1491 fdr->info[0].dest_offset = block_size;
1493 if (ioctl(fd, FIDEDUPERANGE, fdr))
1495 else if (fdr->info[0].status < 0)
1496 error = -fdr->info[0].status;
1500 /* Older kernels may return EINVAL... */
1501 if (error == EOPNOTSUPP || error == ENOTTY || error == EINVAL) {
1504 "main: filesystem does not support "
1505 "dedupe range, disabling!\n");
1509 /* Put the file back the way it was. */
1510 if (file_size < new_len && ftruncate(fd, file_size)) {
1511 warn("main: ftruncate");
1520 do_dedupe_range(unsigned offset, unsigned length, unsigned dest)
1522 struct file_dedupe_range *fdr;
1525 if (!quiet && testcalls > simulatedopcount)
1526 prt("skipping zero length dedupe range\n");
1527 log5(OP_DEDUPE_RANGE, offset, length, dest, FL_SKIPPED);
1531 if ((loff_t)offset >= file_size) {
1532 if (!quiet && testcalls > simulatedopcount)
1533 prt("skipping dedupe range behind EOF\n");
1534 log5(OP_DEDUPE_RANGE, offset, length, dest, FL_SKIPPED);
1538 log5(OP_DEDUPE_RANGE, offset, length, dest, FL_NONE);
1540 if (testcalls <= simulatedopcount)
1543 if ((progressinterval && testcalls % progressinterval == 0) ||
1544 (debug && (monitorstart == -1 || monitorend == -1 ||
1545 dest <= monitorstart || dest + length <= monitorend))) {
1546 prt("%lu dedupe\tfrom 0x%x to 0x%x, (0x%x bytes) at 0x%x\n",
1547 testcalls, offset, offset+length, length, dest);
1551 fdr = calloc(sizeof(struct file_dedupe_range_info) +
1552 sizeof(struct file_dedupe_range), 1);
1554 prterr("do_dedupe_range: malloc");
1555 report_failure(161);
1558 /* Dedupe data blocks */
1559 fdr->src_offset = offset;
1560 fdr->src_length = length;
1561 fdr->dest_count = 1;
1562 fdr->info[0].dest_fd = fd;
1563 fdr->info[0].dest_offset = dest;
1565 if (ioctl(fd, FIDEDUPERANGE, fdr) == -1) {
1566 prt("dedupe range: 0x%x to 0x%x at 0x%x\n", offset,
1567 offset + length, dest);
1568 prterr("do_dedupe_range(0): FIDEDUPERANGE");
1569 report_failure(161);
1570 } else if (fdr->info[0].status < 0) {
1571 errno = -fdr->info[0].status;
1572 prt("dedupe range: 0x%x to 0x%x at 0x%x\n", offset,
1573 offset + length, dest);
1574 prterr("do_dedupe_range(1): FIDEDUPERANGE");
1575 report_failure(161);
1583 test_dedupe_range(void)
1589 do_dedupe_range(unsigned offset, unsigned length, unsigned dest)
1595 #ifdef HAVE_COPY_FILE_RANGE
1597 test_copy_range(void)
1599 loff_t o1 = 0, o2 = 1;
1601 if (syscall(__NR_copy_file_range, fd, &o1, fd, &o2, 1, 0) == -1 &&
1602 (errno == ENOSYS || errno == EOPNOTSUPP || errno == ENOTTY)) {
1605 "main: filesystem does not support "
1606 "copy range, disabling!\n");
/*
 * Copy `length` bytes from `offset` to `dest` inside the test file with
 * copy_file_range, then apply the same copy to good_buf so the expected
 * image stays in step with the file.
 *
 * offset: source byte offset in the file
 * length: number of bytes to copy
 * dest:   destination byte offset in the file
 *
 * Zero-length requests and sources at or beyond file_size are logged with
 * FL_SKIPPED.  Failures are reported through prt()/prterr() and
 * report_failure(161).
 */
1614 do_copy_range(unsigned offset, unsigned length, unsigned dest)
1622 if (!quiet && testcalls > simulatedopcount)
1623 prt("skipping zero length copy range\n");
1624 log5(OP_COPY_RANGE, offset, length, dest, FL_SKIPPED);
1628 if ((loff_t)offset >= file_size) {
1629 if (!quiet && testcalls > simulatedopcount)
1630 prt("skipping copy range behind EOF\n");
1631 log5(OP_COPY_RANGE, offset, length, dest, FL_SKIPPED);
/* Track the largest end offset any operation has reached so far. */
1635 if (dest + length > biggest) {
1636 biggest = dest + length;
1637 if (!quiet && testcalls > simulatedopcount)
1638 prt("copying to largest ever: 0x%x\n", dest + length);
1641 log5(OP_COPY_RANGE, offset, length, dest, FL_NONE);
/* Operations up to simulatedopcount are logged but not issued. */
1643 if (testcalls <= simulatedopcount)
1646 if ((progressinterval && testcalls % progressinterval == 0) ||
1647 (debug && (monitorstart == -1 || monitorend == -1 ||
1648 dest <= monitorstart || dest + length <= monitorend))) {
/* testcalls is a long long, so print it with %lld like the other progress messages. */
1649 prt("%lld copy\tfrom 0x%x to 0x%x, (0x%x bytes) at 0x%x\n",
1650 testcalls, offset, offset+length, length, dest);
/*
 * The syscall may copy fewer bytes than asked.  Only EAGAIN is treated as
 * retryable, bounded by 300 tries; a result larger than the request is
 * reported as a failure.
 */
1658 nr = syscall(__NR_copy_file_range, fd, &o1, fd, &o2, olen, 0);
1660 if (errno != EAGAIN || tries++ >= 300)
1662 } else if (nr > olen) {
1663 prt("copy range: 0x%x to 0x%x at 0x%x\n", offset,
1664 offset + length, dest);
1665 prt("do_copy_range: asked %u, copied %u??\n",
1667 report_failure(161);
1672 prt("copy range: 0x%x to 0x%x at 0x%x\n", offset,
1673 offset + length, dest);
1674 prterr("do_copy_range:");
1675 report_failure(161);
/*
 * Mirror the copy in the expected image.  If dest lies beyond the old EOF
 * the gap [file_size, dest) is zero-filled, and file_size grows to cover
 * the destination range.
 */
1678 memcpy(good_buf + dest, good_buf + offset, length);
1679 if (dest > file_size)
1680 memset(good_buf + file_size, '\0', dest - file_size);
1681 if (dest + length > file_size)
1682 file_size = dest + length;
/*
 * Second test_copy_range() declarator in this section.
 * NOTE(review): the body is not visible.  Presumably the fallback compiled
 * when HAVE_COPY_FILE_RANGE is not defined -- confirm.
 */
1687 test_copy_range(void)
/*
 * Second do_copy_range() declarator in this section, with the same
 * parameter list as the copy_file_range-based implementation.
 * NOTE(review): the body is not visible.  Presumably a do-nothing stub for
 * builds without HAVE_COPY_FILE_RANGE -- confirm.
 */
1693 do_copy_range(unsigned offset, unsigned length, unsigned dest)
1699 #ifdef HAVE_LINUX_FALLOC_H
1700 /* fallocate is basically a no-op unless extending, then a lot like a truncate */
/*
 * Preallocate [offset, offset + length) in the test file with fallocate()
 * and update the expected image accordingly.
 *
 * offset:    start of the range
 * length:    size of the range; the zero-length case is logged as skipped
 * keep_size: non-zero selects FALLOC_FL_KEEP_SIZE, in which case the
 *            expected file size is left unchanged
 *
 * A fallocate() failure ends in report_failure(161).
 */
1702 do_preallocate(unsigned offset, unsigned length, int keep_size)
1704 unsigned end_offset;
1707 if (!quiet && testcalls > simulatedopcount)
1708 prt("skipping zero length fallocate\n");
1709 log4(OP_FALLOCATE, offset, length, FL_SKIPPED |
1710 (keep_size ? FL_KEEP_SIZE : FL_NONE));
/* With keep_size the call cannot grow the file, so end_offset is forced to 0. */
1714 end_offset = keep_size ? 0 : offset + length;
1716 if (end_offset > biggest) {
1717 biggest = end_offset;
1718 if (!quiet && testcalls > simulatedopcount)
1719 prt("fallocating to largest ever: 0x%x\n", end_offset);
1723 * last arg matches fallocate string array index in logdump:
1724 * 0: allocate past EOF
1725 * 1: extending prealloc
1726 * 2: interior prealloc
/*
 * NOTE(review): the call below passes an FL_* flag (FL_KEEP_SIZE or
 * FL_NONE) as its last argument, not an index 0-2 as the text above
 * describes -- that text looks stale; confirm against logdump.
 */
1728 log4(OP_FALLOCATE, offset, length,
1729 keep_size ? FL_KEEP_SIZE : FL_NONE);
/* An extending preallocation reads back as zeroes between old and new EOF. */
1731 if (end_offset > file_size) {
1732 memset(good_buf + file_size, '\0', end_offset - file_size);
1733 file_size = end_offset;
/* Operations up to simulatedopcount are logged but not issued. */
1736 if (testcalls <= simulatedopcount)
1739 if ((progressinterval && testcalls % progressinterval == 0) ||
1740 (debug && (monitorstart == -1 || monitorend == -1 ||
1741 end_offset <= monitorend)))
1742 prt("%lld falloc\tfrom 0x%x to 0x%x (0x%x bytes)\n", testcalls,
1743 offset, offset + length, length);
1744 if (fallocate(fd, keep_size ? FALLOC_FL_KEEP_SIZE : 0, (loff_t)offset, (loff_t)length) == -1) {
1745 prt("fallocate: 0x%x to 0x%x\n", offset, offset + length);
1746 prterr("do_preallocate: fallocate");
1747 report_failure(161);
/*
 * Second do_preallocate() declarator in this section, with the same
 * parameter list as the fallocate()-based implementation.
 * NOTE(review): the body is not visible.  Presumably a stub for builds
 * without HAVE_LINUX_FALLOC_H -- confirm.
 */
1752 do_preallocate(unsigned offset, unsigned length, int keep_size)
/*
 * Rewrite the test file from the expected image: seek to offset 0, write
 * file_size bytes of good_buf, and, unless running in lite mode, truncate
 * the file to file_size.  Failures are reported as 171 (lseek),
 * 172 (write) and 173 (ftruncate).
 */
1763 if (lseek(fd, (off_t)0, SEEK_SET) == (off_t)-1) {
1764 prterr("writefileimage: lseek");
1765 report_failure(171);
1767 iret = write(fd, good_buf, file_size);
/* Anything other than a complete write of file_size bytes is a failure. */
1768 if ((off_t)iret != file_size) {
1770 prterr("writefileimage: write");
/* NOTE(review): iret is printed with %x; confirm that matches its declared type. */
1772 prt("short write: 0x%x bytes instead of 0x%llx\n",
1773 iret, (unsigned long long)file_size);
1774 report_failure(172);
/* lite mode never changes the file size, so ftruncate() is bypassed there. */
1776 if (lite ? 0 : ftruncate(fd, file_size) == -1) {
1777 prt("ftruncate2: %llx\n", (unsigned long long)file_size);
1778 prterr("writefileimage: ftruncate");
1779 report_failure(173);
/*
 * Close and reopen the test file, asking the kernel to drop its caches in
 * between.  Nothing is done while testcalls <= simulatedopcount.
 * Failures are reported as 180 (close), 181 (drop_caches) and 182 (open).
 */
1787 if (testcalls <= simulatedopcount)
1791 prt("%lld close/open\n", testcalls);
1793 prterr("docloseopen: close");
1794 report_failure(180);
/* Writing 3 to drop_caches is done through a shell via system(). */
1796 if (system("echo 3 > /proc/sys/vm/drop_caches")) {
1797 prterr("docloseopen: drop_caches");
1798 report_failure(181);
/* Reopen read/write, carrying the o_direct flag bits set by -Z. */
1800 fd = open(fname, O_RDWR|o_direct, 0);
1802 prterr("docloseopen: open");
1803 report_failure(182);
/*
 * fsync step of the integrity operations: nothing is done while
 * testcalls <= simulatedopcount; otherwise the operation is logged as
 * OP_FSYNC, a failure is reported as 210, and dump_fsync_buffer() is
 * called.
 * NOTE(review): the function head and the fsync call itself are not
 * visible here -- confirm name and exact error condition.
 */
1812 if (testcalls <= simulatedopcount)
1815 prt("%lld fsync\n", testcalls);
1816 log4(OP_FSYNC, 0, 0, 0);
1820 report_failure(210);
1823 dump_fsync_buffer();
/*
 * Helpers that fit a randomly chosen (offset, length) pair into a region
 * of `size` bytes.  All three modify their arguments in place.
 *
 * TRIM_OFF(off, size):          adjusts off relative to size.
 *                               NOTE(review): body not visible here;
 *                               presumably reduces off below size -- confirm.
 * TRIM_LEN(off, len, size):     if off + len would exceed size, shortens
 *                               len to size - off.
 * TRIM_OFF_LEN(off, len, size): applies TRIM_OFF and then TRIM_LEN.
 */
1827 #define TRIM_OFF(off, size) \
1835 #define TRIM_LEN(off, len, size) \
1837 if ((off) + (len) > (size)) \
1838 (len) = (size) - (off); \
1841 #define TRIM_OFF_LEN(off, len, size) \
1843 TRIM_OFF(off, size); \
1844 TRIM_LEN(off, len, size); \
/*
 * Termination path: prints the signal number held in sig and the number
 * of test calls made so far.
 * NOTE(review): the head is not visible.  Presumably this is cleanup(),
 * which main() installs as a signal handler and read_op() calls as
 * cleanup(100) -- confirm.
 */
1851 prt("signal %d\n", sig);
1852 prt("testcalls = %lld\n", testcalls);
/*
 * Return how many numeric arguments the given operation takes in an ops
 * file; read_op() stores the result in log_entry->nr_args and parses that
 * many values.  OP_CLONE_RANGE and OP_DEDUPE_RANGE share one case.
 * NOTE(review): the returned counts are not visible here -- confirm.
 */
1857 op_args_count(int operation)
1859 switch (operation) {
1860 case OP_CLONE_RANGE:
1861 case OP_DEDUPE_RANGE:
/*
 * Read the next operation from the replay file (replayopsf) into
 * *log_entry.
 *
 * Line format, as parsed below: an optional leading "skip" word, the
 * operation name, the operation's numeric arguments, then optional
 * trailing words "keep_size", "close_open" or "*".  Tokens are separated
 * by spaces, tabs or newlines.  Lines that are empty or whose first token
 * starts with '#' are passed over.
 *
 * A malformed line prints "<replayops>: parse error" and ends in
 * cleanup(100).  test() loops while this function returns non-zero.
 */
1870 read_op(struct log_entry *log_entry)
/* Start from a cleared entry; operation == -1 means "nothing parsed yet". */
1874 memset(log_entry, 0, sizeof(*log_entry));
1875 log_entry->operation = -1;
1877 while (log_entry->operation == -1) {
1882 if (!fgets(line, sizeof(line), replayopsf)) {
1883 if (feof(replayopsf)) {
1889 str = strtok(line, " \t\n");
1890 } while (!str || str[0] == '#');
/* A leading "skip" marks the entry FL_SKIPPED; the operation name follows. */
1892 if (strcmp(str, "skip") == 0) {
1893 log_entry->flags |= FL_SKIPPED;
1894 str = strtok(NULL, " \t\n");
1898 log_entry->operation = op_code(str);
1899 if (log_entry->operation == -1)
/* Numeric arguments are parsed with base auto-detection (strtoul base 0). */
1901 log_entry->nr_args = op_args_count(log_entry->operation);
1902 for (i = 0; i < log_entry->nr_args; i++) {
1905 str = strtok(NULL, " \t\n");
1908 log_entry->args[i] = strtoul(str, &end, 0);
/* Remaining tokens are flag words. */
1912 while ((str = strtok(NULL, " \t\n"))) {
1913 if (strcmp(str, "keep_size") == 0)
1914 log_entry->flags |= FL_KEEP_SIZE;
1915 else if (strcmp(str, "close_open") == 0)
1916 log_entry->flags |= FL_CLOSE_OPEN;
1917 else if (strcmp(str, "*") == 0)
1918 ; /* overlap marker; ignore */
1926 fprintf(stderr, "%s: parse error\n", replayops);
1929 cleanup(100); /* doesn't return */
/*
 * True when the distance between off0 and off1 is smaller than size, i.e.
 * when two size-byte ranges starting at those offsets share a byte.
 * generate_dest_range() uses this to reject a destination that overlaps
 * the source.
 */
1939 return llabs((unsigned long long)off1 - off0) < size;
/*
 * Prepare a source range and pick a random destination for an operation
 * that copies between two ranges of the file.
 *
 * bdy_align:     alignment selector.
 *                NOTE(review): the conditions using it are not visible;
 *                presumably it chooses readbdy/writebdy alignment over
 *                block_size alignment -- confirm.
 * max_range_end: upper bound for the end of the destination range
 * src_offset:    in/out, trimmed against file_size and aligned
 * size:          in/out, trimmed against file_size and aligned
 * dst_offset:    out, random offset such that the destination neither
 *                overlaps the source nor ends beyond max_range_end
 */
1942 static void generate_dest_range(bool bdy_align,
1943 unsigned long max_range_end,
1944 unsigned long *src_offset,
1945 unsigned long *size,
1946 unsigned long *dst_offset)
/* The source must lie inside the current file. */
1950 TRIM_OFF_LEN(*src_offset, *size, file_size);
1952 *src_offset -= *src_offset % readbdy;
1954 *size -= *size % readbdy;
/* Round down to a block_size multiple (the mask assumes a power of two). */
1956 *src_offset = *src_offset & ~(block_size - 1);
1957 *size = *size & ~(block_size - 1);
/* Retry random destinations; the attempt counter is bounded at 30. */
1961 if (tries++ >= 30) {
1965 *dst_offset = random();
1966 TRIM_OFF(*dst_offset, max_range_end);
1968 *dst_offset -= *dst_offset % writebdy;
1970 *dst_offset = *dst_offset & ~(block_size - 1);
1971 } while (range_overlaps(*src_offset, *dst_offset, *size) ||
1972 *dst_offset + *size > max_range_end);
/*
 * Per-operation driver body.
 * NOTE(review): the function head is not visible here; presumably this is
 * test(), whose calls the global testcalls counts -- confirm.
 *
 * One operation is chosen, either from the replay file via read_op() or
 * at random.  Its offset and size are trimmed to the file; operations
 * that are disabled or would exceed maxfilelen are logged with FL_SKIPPED;
 * everything else is dispatched to the matching do* helper.
 */
1978 unsigned long offset, offset2;
1984 if (simulatedopcount > 0 && testcalls == simulatedopcount)
1989 if (debugstart > 0 && testcalls >= debugstart)
/* Progress ticker while still below simulatedopcount: one line per 100000 calls. */
1992 if (!quiet && testcalls < simulatedopcount && testcalls % 100000 == 0)
1993 prt("%lld...\n", testcalls);
/*
 * Replay path: take the next entry from the ops file.  Entries flagged
 * FL_SKIPPED are only re-logged; otherwise op, offset, size, offset2 and
 * the closeopen/keep_size flags come from the entry.
 */
1996 struct log_entry log_entry;
1998 while (read_op(&log_entry)) {
1999 if (log_entry.flags & FL_SKIPPED) {
2000 log4(log_entry.operation,
2001 log_entry.args[0], log_entry.args[1],
2006 op = log_entry.operation;
2007 offset = log_entry.args[0];
2008 size = log_entry.args[1];
2009 offset2 = log_entry.args[2];
2010 closeopen = !!(log_entry.flags & FL_CLOSE_OPEN);
2011 keep_size = !!(log_entry.flags & FL_KEEP_SIZE);
/* Random path: closeopen is derived from the random value rv and closeprob. */
2019 closeopen = (rv >> 3) < (1 << 28) / closeprob;
2025 size = random() % (maxoplen + 1);
2027 /* calculate appropriate op to run */
2029 op = rv % OP_MAX_LITE;
2030 else if (!integrity)
2031 op = rv % OP_MAX_FULL;
2033 op = rv % OP_MAX_INTEGRITY;
2038 size = random() % maxfilelen;
/* keep_size is randomised only when the op and keep-size mode are both enabled. */
2041 if (fallocate_calls && size && keep_size_calls)
2042 keep_size = random() % 2;
2045 if (zero_range_calls && size && keep_size_calls)
2046 keep_size = random() % 2;
/*
 * Operations with a destination range get their offsets from
 * generate_dest_range(): clone is bounded by maxfilelen, dedupe by
 * file_size, and the third call (case label not visible) requests
 * boundary alignment.
 */
2048 case OP_CLONE_RANGE:
2049 generate_dest_range(false, maxfilelen, &offset, &size, &offset2);
2051 case OP_DEDUPE_RANGE:
2052 generate_dest_range(false, file_size, &offset, &size, &offset2);
2055 generate_dest_range(true, maxfilelen, &offset, &size, &offset2);
/* Operations whose *_calls switch is off are logged as skipped. */
2071 if (!fallocate_calls) {
2072 log4(OP_FALLOCATE, offset, size, FL_SKIPPED);
2077 if (!punch_hole_calls) {
2078 log4(OP_PUNCH_HOLE, offset, size, FL_SKIPPED);
2083 if (!zero_range_calls) {
2084 log4(OP_ZERO_RANGE, offset, size, FL_SKIPPED);
2088 case OP_COLLAPSE_RANGE:
2089 if (!collapse_range_calls) {
2090 log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
2094 case OP_INSERT_RANGE:
2095 if (!insert_range_calls) {
2096 log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
2100 case OP_CLONE_RANGE:
2101 if (!clone_range_calls) {
2102 log5(op, offset, size, offset2, FL_SKIPPED);
2106 case OP_DEDUPE_RANGE:
2107 if (!dedupe_range_calls) {
2108 log5(op, offset, size, offset2, FL_SKIPPED);
2113 if (!copy_range_calls) {
2114 log5(op, offset, size, offset2, FL_SKIPPED);
/*
 * Dispatch.  Reads and hole punching are trimmed to the current
 * file_size; writes, fallocate and zero-range are trimmed to maxfilelen
 * and may therefore extend the file.
 */
2122 TRIM_OFF_LEN(offset, size, file_size);
2123 doread(offset, size);
2127 TRIM_OFF_LEN(offset, size, maxfilelen);
2128 dowrite(offset, size);
2132 TRIM_OFF_LEN(offset, size, file_size);
2133 domapread(offset, size);
2137 TRIM_OFF_LEN(offset, size, maxfilelen);
2138 domapwrite(offset, size);
2146 TRIM_OFF_LEN(offset, size, maxfilelen);
2147 do_preallocate(offset, size, keep_size);
2151 TRIM_OFF_LEN(offset, size, file_size);
2152 do_punch_hole(offset, size);
2155 TRIM_OFF_LEN(offset, size, maxfilelen);
2156 do_zero_range(offset, size, keep_size);
/* Collapse: trimmed against file_size - 1, then rounded down to block_size multiples. */
2158 case OP_COLLAPSE_RANGE:
2159 TRIM_OFF_LEN(offset, size, file_size - 1);
2160 offset = offset & ~(block_size - 1);
2161 size = size & ~(block_size - 1);
2163 log4(OP_COLLAPSE_RANGE, offset, size, FL_SKIPPED);
2166 do_collapse_range(offset, size);
/* Insert: block-aligned, and skipped if the grown file would exceed maxfilelen. */
2168 case OP_INSERT_RANGE:
2169 TRIM_OFF(offset, file_size);
2170 TRIM_LEN(file_size, size, maxfilelen);
2171 offset = offset & ~(block_size - 1);
2172 size = size & ~(block_size - 1);
2174 log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
2177 if (file_size + size > maxfilelen) {
2178 log4(OP_INSERT_RANGE, offset, size, FL_SKIPPED);
2182 do_insert_range(offset, size);
/* Clone/dedupe/copy: a destination ending beyond maxfilelen is logged as skipped. */
2184 case OP_CLONE_RANGE:
2186 log5(OP_CLONE_RANGE, offset, size, offset2, FL_SKIPPED);
2189 if (offset2 + size > maxfilelen) {
2190 log5(OP_CLONE_RANGE, offset, size, offset2, FL_SKIPPED);
2194 do_clone_range(offset, size, offset2);
2196 case OP_DEDUPE_RANGE:
2198 log5(OP_DEDUPE_RANGE, offset, size, offset2, FL_SKIPPED);
2201 if (offset2 + size > maxfilelen) {
2202 log5(OP_DEDUPE_RANGE, offset, size, offset2, FL_SKIPPED);
2206 do_dedupe_range(offset, size, offset2);
2210 log5(OP_COPY_RANGE, offset, size, offset2, FL_SKIPPED);
2213 if (offset2 + size > maxfilelen) {
2214 log5(OP_COPY_RANGE, offset, size, offset2, FL_SKIPPED);
2218 do_copy_range(offset, size, offset2);
2224 prterr("test: unknown operation");
/* Post-operation checks apply only once testcalls has passed simulatedopcount. */
2229 if (check_file && testcalls > simulatedopcount)
2235 if (sizechecks && testcalls > simulatedopcount)
/*
 * Print the command-line synopsis and per-option help to stdout.  The help
 * text is a single string built from adjacent literals; entries for the
 * optional operations (-F, -H, -z, -C, -I, -B, -E) are included only when
 * the corresponding feature macro is defined at build time.
 */
2244 fprintf(stdout, "usage: %s",
2245 "fsx [-dknqxABEFJLOWZ] [-b opnum] [-c Prob] [-g filldata] [-i logdev] [-j logid] [-l flen] [-m start:end] [-o oplen] [-p progressinterval] [-r readbdy] [-s style] [-t truncbdy] [-w writebdy] [-D startingop] [-N numops] [-P dirpath] [-S seed] fname\n\
2246 -b opnum: beginning operation number (default 1)\n\
2247 -c P: 1 in P chance of file close+open at each op (default infinity)\n\
2248 -d: debug output for all operations\n\
2249 -f flush and invalidate cache after I/O\n\
2250 -g X: write character X instead of random generated data\n\
2251 -i logdev: do integrity testing, logdev is the dm log writes device\n\
2252 -j logid: prefix debug log messsages with this id\n\
2253 -k: do not truncate existing file and use its size as upper bound on file size\n\
2254 -l flen: the upper bound on file size (default 262144)\n\
2255 -m startop:endop: monitor (print debug output) specified byte range (default 0:infinity)\n\
2256 -n: no verifications of file size\n\
2257 -o oplen: the upper bound on operation size (default 65536)\n\
2258 -p progressinterval: debug output at specified operation interval\n\
2259 -q: quieter operation\n\
2260 -r readbdy: 4096 would make reads page aligned (default 1)\n\
2261 -s style: 1 gives smaller truncates (default 0)\n\
2262 -t truncbdy: 4096 would make truncates page aligned (default 1)\n\
2263 -w writebdy: 4096 would make writes page aligned (default 1)\n\
2264 -x: preallocate file space before starting, XFS only (default 0)\n\
2265 -y synchronize changes to a file\n"
2268 " -A: Use the AIO system calls\n"
2270 " -D startingop: debug output starting at specified operation\n"
2271 #ifdef HAVE_LINUX_FALLOC_H
2272 " -F: Do not use fallocate (preallocation) calls\n"
2274 #ifdef FALLOC_FL_PUNCH_HOLE
2275 " -H: Do not use punch hole calls\n"
2277 #ifdef FALLOC_FL_ZERO_RANGE
2278 " -z: Do not use zero range calls\n"
2280 #ifdef FALLOC_FL_COLLAPSE_RANGE
2281 " -C: Do not use collapse range calls\n"
2283 #ifdef FALLOC_FL_INSERT_RANGE
2284 " -I: Do not use insert range calls\n"
2287 " -J: Do not use clone range calls\n"
2289 #ifdef FIDEDUPERANGE
2290 " -B: Do not use dedupe range calls\n"
2292 #ifdef HAVE_COPY_FILE_RANGE
2293 " -E: Do not use copy range calls\n"
2295 " -L: fsxLite - no file creations & no file size changes\n\
2296 -N numops: total # operations to do (default infinity)\n\
2297 -O: use oplen (see -o flag) for every op (default random)\n\
2298 -P: save .fsxlog .fsxops and .fsxgood files in dirpath (default ./)\n\
2299 -S seed: for random # generator (default 1) 0 gets timestamp\n\
2300 -W: mapped write operations DISabled\n\
2301 -X: Read file and compare to good buffer after every operation.\n\
2302 -R: read() system calls only (mapped reads disabled)\n\
2303 -Z: O_DIRECT (use -R, -W, -r and -w too)\n\
2304 --replay-ops opsfile: replay ops from recorded .fsxops file\n\
2305 --record-ops[=opsfile]: dump ops file also on success. optionally specify ops file name\n\
2306 fname: this filename is REQUIRED (no default)\n");
/*
 * Parse a numeric option argument.
 *
 * s: text to parse; strtoll base 0 accepts decimal, octal (leading 0) and
 *    hex (leading 0x)
 * e: receives the pointer to the first unparsed character
 *
 * NOTE(review): lines not visible here may post-process the value (for
 * example size suffixes) -- confirm before relying on plain strtoll
 * semantics.
 */
2312 getnum(char *s, char **e)
2317 ret = strtoll(s, e, 0);
/*
 * AIO context shared by the AIO helpers: initialised by io_queue_init()
 * and used by io_submit()/io_getevents() in __aio_rw().
 */
2347 io_context_t io_ctx;
/*
 * Initialise io_ctx with a queue of QSZ entries through io_queue_init().
 * A failure is reported on stderr with the "aio_setup:" prefix.
 */
2353 ret = io_queue_init(QSZ, &io_ctx);
2355 fprintf(stderr, "aio_setup: io_queue_init failed: %s\n",
/*
 * Perform one read or write of len bytes at offset on fd through libaio:
 * the request is prepared with io_prep_pread() or io_prep_pwrite(),
 * submitted with io_submit(), and its single completion event is
 * collected with io_getevents().
 *
 * rw:     selects read or write (the test itself is not visible here)
 * fd:     file descriptor to operate on
 * buf:    data buffer
 * len:    number of bytes requested
 * offset: file offset of the transfer
 *
 * Submission errors, a missing event, and a completed length different
 * from len are reported on stderr.  Per the comment text at the end of
 * the body, errors reach the caller in libc style: -1 with errno set.
 */
2363 __aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2365 struct io_event event;
2366 static struct timespec ts;
2367 struct iocb *iocbs[] = { &iocb };
2372 io_prep_pread(&iocb, fd, buf, len, offset);
2374 io_prep_pwrite(&iocb, fd, buf, len, offset);
2379 ret = io_submit(io_ctx, 1, iocbs);
2381 fprintf(stderr, "errcode=%d\n", ret);
2382 fprintf(stderr, "aio_rw: io_submit failed: %s\n",
2387 ret = io_getevents(io_ctx, 1, 1, &event, &ts);
2390 fprintf(stderr, "aio_rw: no events available\n");
2392 fprintf(stderr, "errcode=%d\n", -ret);
2393 fprintf(stderr, "aio_rw: io_getevents failed: %s\n",
2398 if (len != event.res) {
2400 * The b0rked libaio defines event.res as unsigned.
2401 * However the kernel strucuture has it signed,
2402 * and it's used to pass negated error value.
2403 * Till the library is fixed use the temp var.
2405 res = (long)event.res;
2407 fprintf(stderr, "bad io length: %lu instead of %u\n",
2410 fprintf(stderr, "errcode=%ld\n", -res);
2411 fprintf(stderr, "aio_rw: async io failed: %s\n",
2422 * The caller expects error return in traditional libc
2423 * convention, i.e. -1 and the errno set to error.
/*
 * Front end for data transfers: forwards to __aio_rw() or falls back to
 * plain read()/write() on fd.  The plain calls do not take an offset
 * argument, so they act at the descriptor's current position.
 * NOTE(review): the conditions selecting between the three calls are not
 * visible here -- confirm.
 */
2429 int aio_rw(int rw, int fd, char *buf, unsigned len, unsigned offset)
2434 ret = __aio_rw(rw, fd, buf, len, offset);
2437 ret = read(fd, buf, len);
2439 ret = write(fd, buf, len);
/*
 * Wrapper that passes the mode expression both as a value and, via the #
 * stringizing operator, as its source text, so that __test_fallocate()
 * can name the mode in its diagnostic.
 */
2446 #define test_fallocate(mode) __test_fallocate(mode, #mode)
/*
 * Probe whether the filesystem supports fallocate() with the given mode
 * by trying a one-byte call at file_size.  A failure with ENOSYS or
 * EOPNOTSUPP produces the "does not support fallocate mode %s,
 * disabling!" message.  The file is then truncated to file_size.  main()
 * stores the return value in the matching *_calls switch.
 *
 * mode:     fallocate() mode flags to test
 * mode_str: textual form of the mode for the diagnostic
 */
2449 __test_fallocate(int mode, const char *mode_str)
2451 #ifdef HAVE_LINUX_FALLOC_H
2454 if (fallocate(fd, mode, file_size, 1) &&
2455 (errno == ENOSYS || errno == EOPNOTSUPP)) {
2458 "main: filesystem does not support "
2459 "fallocate mode %s, disabling!\n",
/* ftruncate() back to file_size is called after the probe. */
2463 if (ftruncate(fd, file_size)) {
2464 warn("main: ftruncate");
/*
 * Long options for getopt_long().  The last field is the value returned
 * for the option; 255 and 256 lie outside the single-character range and
 * are handled by the "case 255" / "case 256" branches in main().
 * --replay-ops requires an argument, --record-ops takes an optional one.
 */
2473 static struct option longopts[] = {
2474 {"replay-ops", required_argument, 0, 256},
2475 {"record-ops", optional_argument, 0, 255},
/*
 * Program entry point: parses the command line, opens the test file and
 * the .fsxgood / .fsxlog / .fsxops side files, allocates the data buffers,
 * probes which optional operations the filesystem supports, and then runs
 * operations until numops is exhausted.
 */
2480 main(int argc, char **argv)
2484 char logfile[PATH_MAX];
2485 struct stat statbuf;
2486 int o_flags = O_RDWR|O_CREAT|O_TRUNC;
/* Page geometry is taken from getpagesize(). */
2491 page_size = getpagesize();
2492 page_mask = page_size - 1;
2493 mmap_mask = page_mask;
2496 setvbuf(stdout, (char *)0, _IOLBF, 0); /* line buffered stdout */
/* Option parsing; --replay-ops and --record-ops arrive as 256 and 255. */
2498 while ((ch = getopt_long(argc, argv,
2499 "b:c:dfg:i:j:kl:m:no:p:qr:s:t:w:xyABD:EFJKHzCILN:OP:RS:WXZ",
2500 longopts, NULL)) != EOF)
2503 simulatedopcount = getnum(optarg, &endp);
2505 prt("Will begin at operation %lld\n",
2507 if (simulatedopcount == 0)
2509 simulatedopcount -= 1;
2512 closeprob = getnum(optarg, &endp);
2514 prt("Chance of close/open is 1 in %d\n", closeprob);
2529 logdev = strdup(optarg);
2536 logid = strdup(optarg);
2543 o_flags &= ~O_TRUNC;
2546 maxfilelen = getnum(optarg, &endp);
2547 if (maxfilelen <= 0)
/* The monitor range is given as start:end; an end of 0 is stored as -1. */
2551 monitorstart = getnum(optarg, &endp);
2552 if (monitorstart < 0)
2554 if (!endp || *endp++ != ':')
2556 monitorend = getnum(endp, &endp);
2559 if (monitorend == 0)
2560 monitorend = -1; /* aka infinity */
2566 maxoplen = getnum(optarg, &endp);
2571 progressinterval = getnum(optarg, &endp);
2572 if (progressinterval == 0)
2579 readbdy = getnum(optarg, &endp);
2584 style = getnum(optarg, &endp);
2585 if (style < 0 || style > 1)
2589 truncbdy = getnum(optarg, &endp);
2594 writebdy = getnum(optarg, &endp);
2608 debugstart = getnum(optarg, &endp);
/* Each of these switches turns one optional operation off. */
2613 fallocate_calls = 0;
2616 keep_size_calls = 0;
2619 punch_hole_calls = 0;
2622 zero_range_calls = 0;
2625 collapse_range_calls = 0;
2628 insert_range_calls = 0;
2631 clone_range_calls = 0;
2634 dedupe_range_calls = 0;
2637 copy_range_calls = 0;
2641 o_flags &= ~(O_CREAT|O_TRUNC);
2644 numops = getnum(optarg, &endp);
/*
 * NOTE(review): strncpy() does not NUL-terminate dname when optarg is
 * sizeof(dname) bytes or longer, and strlen(dname) is taken right after;
 * confirm that termination is guaranteed on this path.
 */
2652 strncpy(dname, optarg, sizeof(dname));
2654 dirpath = strlen(dname);
2660 seed = getnum(optarg, &endp);
2662 seed = time(0) % 10000;
2663 seed += (int)getpid();
2671 prt("mapped writes DISABLED\n");
2677 o_direct = O_DIRECT;
2678 o_flags |= O_DIRECT;
2680 case 255: /* --record-ops */
/* NOTE(review): same strncpy() termination concern as for dname; confirm. */
2682 strncpy(opsfile, optarg, sizeof(opsfile));
2683 recordops = opsfile;
2685 case 256: /* --replay-ops */
/* Integrity testing (-i) is only accepted together with -P. */
2697 if (integrity && !dirpath) {
2698 fprintf(stderr, "option -i <logdev> requires -P <dirpath>\n");
2703 tmp = strdup(fname);
2708 bname = basename(tmp);
/* All of these signals are routed to cleanup(). */
2710 signal(SIGHUP, cleanup);
2711 signal(SIGINT, cleanup);
2712 signal(SIGPIPE, cleanup);
2713 signal(SIGALRM, cleanup);
2714 signal(SIGTERM, cleanup);
2715 signal(SIGXCPU, cleanup);
2716 signal(SIGXFSZ, cleanup);
2717 signal(SIGVTALRM, cleanup);
2718 signal(SIGUSR1, cleanup);
2719 signal(SIGUSR2, cleanup);
2722 prt("Seed set to %d\n", seed);
/* Open the test file; block_size is the st_blksize reported by fstat(). */
2724 fd = open(fname, o_flags, 0666);
2729 if (fstat(fd, &statbuf)) {
2730 prterr("check_size: fstat");
2733 block_size = statbuf.st_blksize;
/* XFS space reservation of maxfilelen bytes via XFS_IOC_RESVSP. */
2736 xfs_flock64_t resv = { 0 };
2737 #ifdef HAVE_XFS_PLATFORM_DEFS_H
2738 if (!platform_test_xfs_fd(fd)) {
2740 fprintf(stderr, "main: cannot prealloc, non XFS\n");
2744 resv.l_len = maxfilelen;
2745 if ((xfsctl(fname, fd, XFS_IOC_RESVSP, &resv)) < 0) {
/*
 * Side-file names: either dname + basename of the test file, or the test
 * file name itself, each with a .fsxgood / .fsxlog / .fsxops suffix.
 * NOTE(review): the condition choosing between the two forms is not
 * visible; presumably it is whether -P was given -- confirm.
 */
2753 snprintf(goodfile, sizeof(goodfile), "%s%s.fsxgood", dname, bname);
2754 snprintf(logfile, sizeof(logfile), "%s%s.fsxlog", dname, bname);
2756 snprintf(opsfile, sizeof(opsfile), "%s%s.fsxops", dname, bname);
2758 snprintf(goodfile, sizeof(goodfile), "%s.fsxgood", fname);
2759 snprintf(logfile, sizeof(logfile), "%s.fsxlog", fname);
2761 snprintf(opsfile, sizeof(opsfile), "%s.fsxops", fname);
2763 fsxgoodfd = open(goodfile, O_RDWR|O_CREAT|O_TRUNC, 0666);
2764 if (fsxgoodfd < 0) {
2768 fsxlogf = fopen(logfile, "w");
2769 if (fsxlogf == NULL) {
2776 replayopsf = fopen(replayops, "r");
/*
 * When the file is not truncated on open, its current length becomes
 * file_size, maxfilelen and biggest.
 */
2788 if (!(o_flags & O_TRUNC)) {
2790 file_size = maxfilelen = biggest = lseek(fd, (off_t)0, SEEK_END);
2791 if (file_size == (off_t)-1) {
2793 warn("main: lseek eof");
2796 ret = lseek(fd, (off_t)0, SEEK_SET);
2797 if (ret == (off_t)-1) {
2799 warn("main: lseek 0");
/*
 * Buffers: original_buf is filled with random bytes; good_buf and
 * temp_buf are over-allocated by writebdy / readbdy, passed through
 * round_ptr_up() and zeroed.
 * NOTE(review): no NULL check on the malloc() results is visible before
 * they are used -- confirm.
 */
2803 original_buf = (char *) malloc(maxfilelen);
2804 for (i = 0; i < maxfilelen; i++)
2805 original_buf[i] = random() % 256;
2806 good_buf = (char *) malloc(maxfilelen + writebdy);
2807 good_buf = round_ptr_up(good_buf, writebdy, 0);
2808 memset(good_buf, '\0', maxfilelen);
2809 temp_buf = (char *) malloc(maxoplen + readbdy);
2810 temp_buf = round_ptr_up(temp_buf, readbdy, 0);
2811 memset(temp_buf, '\0', maxoplen);
2812 if (lite) { /* zero entire existing file */
2815 written = write(fd, good_buf, (size_t)maxfilelen);
2816 if (written != maxfilelen) {
2817 if (written == -1) {
2819 warn("main: error on write");
2821 warn("main: short write, 0x%x bytes instead "
/* Load file_size bytes of the existing file contents into good_buf. */
2828 ssize_t ret, len = file_size;
2832 ret = read(fd, good_buf + off, len);
2835 warn("main: error on read");
/*
 * Probe each optional operation that is still enabled; the probe result
 * replaces the switch, so a zero result disables the operation.
 */
2845 if (fallocate_calls)
2846 fallocate_calls = test_fallocate(0);
2847 if (keep_size_calls)
2848 keep_size_calls = test_fallocate(FALLOC_FL_KEEP_SIZE);
2849 if (punch_hole_calls)
2850 punch_hole_calls = test_fallocate(FALLOC_FL_PUNCH_HOLE | FALLOC_FL_KEEP_SIZE);
2851 if (zero_range_calls)
2852 zero_range_calls = test_fallocate(FALLOC_FL_ZERO_RANGE);
2853 if (collapse_range_calls)
2854 collapse_range_calls = test_fallocate(FALLOC_FL_COLLAPSE_RANGE);
2855 if (insert_range_calls)
2856 insert_range_calls = test_fallocate(FALLOC_FL_INSERT_RANGE);
2857 if (clone_range_calls)
2858 clone_range_calls = test_clone_range();
2859 if (dedupe_range_calls)
2860 dedupe_range_calls = test_dedupe_range();
2861 if (copy_range_calls)
2862 copy_range_calls = test_copy_range();
/* numops == -1 means no operation limit; otherwise it counts down to zero. */
2864 while (numops == -1 || numops--)
2873 prt("All %lld operations completed A-OK!\n", testcalls);