Re: mmap over nfs leads to excessive system load

From: Kenny Simpson
Date: Thu Nov 17 2005 - 16:15:06 EST


--- Andrew Morton <akpm@xxxxxxxx> wrote:
> Could you send the test app please? (Apologies if you've already done so
> and I missed it).
>

Here it is again... this one skips to just under 4GB before starting.
run with "writetest -m <filename>" for the mmap test.

-Kenny




__________________________________
Start your day with Yahoo! - Make it your home page!
http://www.yahoo.com/r/hs// test the write throughput of a sliding mmap window vs simple FILE*

#include <errno.h>
#include <fcntl.h>
#include <stdio.h>
#include <stdlib.h>
#include <signal.h>
#include <string.h>
#include <unistd.h>
#include <time.h>
#include <errno.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <sys/types.h>
#include <sys/time.h>

int total_bytes = 0;
int last_bytes = 0;

struct timeval last_time;

void timeout(int)
{
struct timeval now;
gettimeofday(&now, 0);

double time_diff = (now.tv_sec - last_time.tv_sec) + ((now.tv_usec - last_time.tv_usec) / 1000000.);
last_time = now;

int new_bytes = total_bytes;
int diff = new_bytes - last_bytes;
printf("wrote %dk %dM bytes in %f seconds -> %fM/sec\n", diff / 1024, diff / (1024 * 1024), time_diff, (diff / (time_diff * 1000000.)));
last_bytes = new_bytes;
}


// tests O_DIRECT + pwrite = fail
// O_DIRECT + truncate = happy
// truncate = happy

// pwrite = happy
// O_DIRECT + truncate = happy
// truncate = happy
// O_DIRECT + pwrite = fail

void do_mapwrite(int fd)
{
// lets write as fast as we can....
int const window_size = 2 * 1024 * 1024; // 2 * 1024 * 1024; // 16k
int const window_pages = window_size / 4096;

int file_page_offset = 0;
long long file_size = window_size;


// fast-forward... by 2046 windows
file_size += 2046u * (2 * 1024 * 1024);
file_page_offset += 2046;


//ftruncate64(fd, file_size);
printf("pwrite to %llx %llu\n", file_size, file_size);
pwrite64(fd, "", 1, file_size);

char* mapping_start = static_cast<char*>(mmap64(0, window_size, PROT_READ | PROT_WRITE, MAP_SHARED, fd, file_size - window_size));


// scribble into buffer and walk the window
for (;;) {
memset(mapping_start, 0, window_size);

// grow file
file_size += window_size;

//ftruncate64(fd, file_size);
pwrite64(fd, "", 1, file_size);

file_page_offset += window_pages;
//munmap(mapping_start, window_size);
//mapping_start = static_cast<char*>(mmap64(mapping_start, window_size, PROT_READ | PROT_WRITE, MAP_SHARED | MAP_FIXED, fd, file_size - window_size));
while (remap_file_pages(mapping_start, window_size, 0, file_page_offset, MAP_SHARED /*| MAP_NONBLOCK*/) <0)
perror("remap_file_pages");

total_bytes += window_size;
}
}



void do_filewrite(int fd)
{
FILE* ptr = fdopen(fd, "w+");

int line_len = 80;
char* buf = (char*)malloc(line_len);
memset(buf, 0, line_len);

for (;;) {
fwrite(buf, line_len, 1, ptr);
total_bytes += line_len;
}
}

void do_syswrite(int fd)
{
int line_len = 64 * 1024;
char* buf = (char*)malloc(line_len);
memset(buf, 0, line_len);

for (;;) {
write(fd, buf, line_len);
total_bytes += line_len;
}
}


int main(int argc, char* argv[])
{
if (argc != 3) {
printf("usage: %s -[mfw] <filename>\n", argv[0]);
return 0;
}

if ((argv[1][0] != '-') ||
((argv[1][1] != 'm') &&
(argv[1][1] != 'w') &&
(argv[1][1] != 'f'))) {
printf("usage: %s -[mfw] <filename>\n", argv[0]);
return 0;
}

int fd = open(argv[2], O_RDWR | O_CREAT | O_LARGEFILE | O_DIRECT, 0644);
if (fd < 0) {
perror("open");
return 0;
}

// start the clock...
signal(SIGALRM, timeout);
{
struct itimerval itv;
itv.it_interval.tv_sec = 1;
itv.it_interval.tv_usec = 0;
itv.it_value = itv.it_interval;

setitimer(ITIMER_REAL, &itv, 0);
}

switch (argv[1][1]) {
case 'm': do_mapwrite(fd); break;
case 'f': do_filewrite(fd); break;
case 'w': do_syswrite(fd); break;
}

return 0;
}