#include <iomanip>
#include <vector>
#include <stxxl/io>
#include <stxxl/aligned_alloc>
#include <stxxl/timer>
using stxxl::request_ptr;
using stxxl::file;
using stxxl::timer;
using stxxl::timestamp;
#define BLOCK_ALIGN 4096
#define POLL_DELAY 1000
#define RAW_ACCESS
/// Polls the first @p n requests until every one of them reports completion,
/// recording the moment each completion is first observed.
///
/// @param reqs  requests to observe; only entries [0, n) are touched
/// @param n     number of requests to observe
/// @param out   receives timestamp() for request i in out[i]; must have room
///              for at least n entries
///
/// The function keeps re-polling without any delay between rounds, so it
/// occupies the calling thread until the last request has finished.
void watch_times(request_ptr reqs[], unsigned n, double * out)
{
    // One completion flag per request. The vector frees its storage on every
    // exit path, including an exception leaving the polling loop, which the
    // former new[]/delete[] pair did not guarantee.
    std::vector<char> finished(n, 0);
    unsigned count = 0;

    while (count != n)
    {
        for (unsigned i = 0; i < n; i++)
        {
            if (finished[i] || !reqs[i]->poll())
                continue;

            finished[i] = 1;
            out[i] = timestamp();
            // Each request is counted exactly once; without this increment
            // the enclosing loop can never terminate for n > 0.
            ++count;
        }
    }
}
/// Prints one line per entry telling how far into the interval
/// [start, end] the recorded time of that entry lies, as a percentage.
///
/// @param start  beginning of the reference interval
/// @param end    end of the reference interval
/// @param times  recorded time for each entry; at least n values
/// @param n      number of entries to report
/// @param names  label printed for each entry; at least n values
void out_stat(double start, double end, double * times, unsigned n, const std::vector<std::string> & names)
{
    unsigned idx = 0;
    while (idx < n)
    {
        // Share of the whole interval that had elapsed at times[idx].
        const double percent = 100. * (times[idx] - start) / (end - start);
        std::cout << idx << " " << names[idx] << " took " << percent << " %" << std::endl;
        ++idx;
    }
}
#define MB (1024 * 1024)
#define GB (1024 * 1024 * 1024)
/// Prints the command-line synopsis and the explanation of every argument
/// to standard output.
///
/// @param argv0  program name to show in the synopsis line
void usage(const char * argv0)
{
    // Explanatory lines that follow the synopsis, in output order.
    static const char * const details[] = {
        " 'pattern' is a 32bit unsigned value like '0', '0xffffffff', ...",
        " starting 'offset' and 'length' are given in GiB,",
        " 'block_size' (default 8) in MiB (in B if it has a suffix B),",
        " increase 'batch_size' (default 1)",
        " to submit several I/Os at once and report average rate",
        " open mode: includes O_DIRECT unless the 'nd' flag is given",
        " ops: write and reread (default), (r)ead only, (w)rite only",
        " length == 0 implies till end of space (please ignore the write error)",
        " Memory consumption: block_size * batch_size * num_disks"
    };
    const unsigned num_details = sizeof(details) / sizeof(details[0]);

    std::cout << "Usage: " << argv0 << " pattern offset length [block_size [batch_size]] [nd] [r|w] [--] diskfile..." << std::endl;
    for (unsigned k = 0; k < num_details; ++k)
        std::cout << details[k] << std::endl;
}
/// Converts a byte count and a duration into a rate in MiB per second.
///
/// @param bytes    amount of data transferred, in bytes
/// @param seconds  time the transfer took, in seconds
/// @return bytes / 2^20 / seconds, or 0.0 when seconds is exactly zero
///         (so that a skipped phase reports a zero rate)
inline double throughput(double bytes, double seconds)
{
    const double mebibytes = bytes / (1024 * 1024);
    return (seconds == 0.0) ? 0.0 : mebibytes / seconds;
}
// Entry point of the disk write/read verification benchmark.
//
// Visible behavior: parses a fill pattern, a start offset and a length (both
// in GiB) plus optional block size, batch size and mode flags; fills an
// aligned buffer with the pattern; then walks the range [offset, endpos) in
// steps, optionally writing the buffer to every disk file (with a sector
// number stamped into each 512-byte sector), optionally reading it back and
// checking the contents, and printing per-step and overall throughput.
// Returns 1 if any verification mismatch was seen, 0 otherwise.
//
// NOTE(review): in this view the brace-only lines, some preprocessor lines
// and several statements do not appear, so the nesting described in the
// comments below is inferred from statement order -- confirm against the
// complete file before relying on it.
int main(int argc, char * argv[])
// At least pattern, offset, length and one further argument are required.
// NOTE(review): no body for this check is visible here; presumably it prints
// usage() and exits -- confirm.
if (argc < 5)
// Base 0 lets strtol accept decimal, 0x-prefixed hex and 0-prefixed octal.
// NOTE(review): the result is a long stored into an unsigned; where long is
// 32 bits a value such as 0xffffffff is out of strtol's range -- confirm.
unsigned pattern = strtol(argv[1], NULL, 0);
// offset and length are whole GiB counts scaled to bytes.
stxxl::int64 offset = stxxl::int64(GB) * stxxl::int64(atoi(argv[2]));
stxxl::int64 length = stxxl::int64(GB) * stxxl::int64(atoi(argv[3]));
stxxl::int64 endpos = offset + length;
stxxl::int64 block_size = 0;
stxxl::int64 batch_size = 0;
// Becomes true on the first mismatch and decides the exit status.
bool verify_failed = false;
bool do_read = true, do_write = true;
bool direct_io = true;
// Index of the next argv entry to interpret; optional arguments start here.
// NOTE(review): no statement advancing first_disk_arg is visible in this
// view, so as shown every optional-argument check below inspects the same
// argv slot -- presumably it is incremented after each consumed argument.
int first_disk_arg = 4;
// Optional block size: a positive number, taken as bytes when the argument
// ends in 'B'/'b' and scaled by MB otherwise; defaults to 8 * MB.
if (first_disk_arg < argc)
block_size = atoi(argv[first_disk_arg]);
if (block_size > 0) {
int l = strlen(argv[first_disk_arg]);
if (argv[first_disk_arg][l - 1] == 'B' || argv[first_disk_arg][l - 1] == 'b') {
} else {
block_size *= MB;
} else {
block_size = 8 * MB;
// Optional batch size (blocks per disk per step); defaults to 1.
if (first_disk_arg < argc)
batch_size = atoi(argv[first_disk_arg]);
if (batch_size > 0) {
} else {
batch_size = 1;
// "nd"/"ND" turns direct I/O off.
if (first_disk_arg < argc && (strcmp("nd", argv[first_disk_arg]) == 0 || strcmp("ND", argv[first_disk_arg]) == 0)) {
direct_io = false;
// "r"/"R" selects read-only operation, "w"/"W" write-only operation.
if (first_disk_arg < argc && (strcmp("r", argv[first_disk_arg]) == 0 || strcmp("R", argv[first_disk_arg]) == 0)) {
do_write = false;
} else if (first_disk_arg < argc && (strcmp("w", argv[first_disk_arg]) == 0 || strcmp("W", argv[first_disk_arg]) == 0)) {
do_read = false;
// Optional "--" separator before the disk file names (body not visible here).
if (first_disk_arg < argc && strcmp("--", argv[first_disk_arg]) == 0) {
// Every remaining argument names one disk file.
// NOTE(review): disks_arr is not visibly filled in this view; presumably each
// argv[ii] is appended inside the loop below -- confirm. The body of the
// "no disk given" check is likewise not visible.
std::vector<std::string> disks_arr;
if (!(first_disk_arg < argc))
for (int ii = first_disk_arg; ii < argc; ii++)
std::cout << "# Add disk: " << argv[ii] << std::endl;
const unsigned ndisks = disks_arr.size();
// Bytes transferred per disk in one step, and the same sizes counted in ints.
const stxxl::unsigned_type step_size = block_size * batch_size;
const unsigned block_size_int = block_size / sizeof(int);
const stxxl::int64 step_size_int = step_size / sizeof(int);
// One contiguous buffer holding step_size bytes for each disk.
// NOTE(review): no matching release of this buffer is visible in this view.
unsigned * buffer = (unsigned *)stxxl::aligned_alloc<BLOCK_ALIGN>(step_size * ndisks);
file ** disks = new file *[ndisks];
// One request slot per block per disk.
request_ptr * reqs = new request_ptr[ndisks * batch_size];
double * r_finish_times = new double[ndisks];
double * w_finish_times = new double[ndisks];
double totaltimeread = 0, totaltimewrite = 0;
stxxl::int64 totalsizeread = 0, totalsizewrite = 0;
// Fill the whole buffer with the requested pattern.
// NOTE(review): i is a 32-bit unsigned compared against a 64-bit product;
// confirm the buffer can never hold 2^32 or more words.
for (unsigned i = 0; i < ndisks * step_size_int; i++)
buffer[i] = pattern;
// Open (creating if needed) every disk file for reading and writing.
for (unsigned i = 0; i < ndisks; i++)
int openmode = file::CREAT | file::RDWR;
if (direct_io) {
openmode |= file::DIRECT;
// NOTE(review): two file back-ends are assigned to the same slot here and
// do_write/do_read are cleared below; presumably each of these is guarded by
// a preprocessor conditional whose #if/#else/#endif lines are not visible in
// this view -- confirm.
disks[i] = new stxxl::wincall_file(disks_arr[i], openmode, i);
disks[i] = new stxxl::syscall_file(disks_arr[i], openmode, i);
do_write = false;
#ifdef NOREAD
do_read = false;
// Banner: program name (text after the last '/' of argv[0], or all of
// argv[0] if there is none or nothing follows it) and the run parameters.
const char * myrev = "$Revision$";
const char * myself = strrchr(argv[0], '/');
if (!myself || !*(++myself))
myself = argv[0];
std::cout << "# " << myself << " " << myrev << std::endl;
std::cout << "# Step size: "
<< step_size << " bytes per disk ("
<< batch_size << " block" << (batch_size == 1 ? "" : "s") << " of "
<< block_size << " bytes) pattern=0x"
<< std::hex << pattern << std::dec << std::endl;
// Measures the whole run; used for the "Non-I/O" and "Total" lines below.
timer t_total(true);
try {
// Main loop: one step of at most step_size bytes per disk per iteration.
while (offset < endpos)
// The final step may be shorter than step_size.
const stxxl::int64 current_step_size = std::min<stxxl::int64>(step_size, endpos - offset);
const stxxl::int64 current_step_size_int = current_step_size / sizeof(int);
const unsigned current_num_blocks = stxxl::div_ceil(current_step_size, block_size);
std::cout << "Disk offset " << std::setw(8) << offset / MB << " MiB: " << std::fixed;
double begin = timestamp(), end, elapsed;
if (do_write) {
// Stamp the word at index 42 of every 512-byte sector with that sector's
// number (byte offset >> 9), in each disk's part of the buffer.
// NOTE(review): b is a 32-bit unsigned initialised from a 64-bit offset, so
// sector numbers wrap once offset >> 9 exceeds 32 bits -- confirm intended.
for (unsigned j = 42, b = offset >> 9; j < current_step_size_int; j += 512 / sizeof(unsigned), ++b)
for (unsigned i = 0; i < ndisks; i++)
buffer[current_step_size_int * i + j] = b;
// Submit one asynchronous write per block per disk.
// NOTE(review): the remaining arguments and the end of the awrite call are
// not visible in this view.
for (unsigned i = 0; i < ndisks; i++)
for (unsigned j = 0; j < current_num_blocks; j++)
reqs[i * current_num_blocks + j] =
disks[i]->awrite(buffer + current_step_size_int * i + j * block_size_int,
offset + j * block_size,
// NOTE(review): watch_times observes only reqs[0..ndisks), while requests are
// stored at i * current_num_blocks + j; with more than one block per disk
// those entries are not one per disk. Presumably this call is compiled only
// under a conditional not visible here -- confirm.
watch_times(reqs, ndisks, w_finish_times);
wait_all(reqs, ndisks * current_num_blocks);
end = timestamp();
elapsed = end - begin;
totalsizewrite += current_step_size;
totaltimewrite += elapsed;
} else {
// Write phase skipped: zero elapsed time makes throughput() report 0.
elapsed = 0.0;
#if 0
// Disabled verbose per-step write report.
std::cout << "WRITE\nDisks: " << ndisks
<< " \nElapsed time: " << end - begin
<< " \nThroughput: " << int(double(current_step_size * ndisks) / MB / (end - begin))
<< " MiB/s \nPer one disk:"
<< int(double(current_step_size) / MB / (end - begin)) << " MiB/s"
<< std::endl;
out_stat(begin, end, w_finish_times, ndisks, disks_arr);
// Per-step write rate: per disk, then multiplied by the number of disks.
std::cout << std::setw(2) << ndisks << " * "
<< std::setw(8) << std::setprecision(3) << (throughput(current_step_size, elapsed)) << " = "
<< std::setw(8) << std::setprecision(3) << (throughput(current_step_size, elapsed) * ndisks) << " MiB/s write,";
begin = timestamp();
if (do_read) {
// Submit one asynchronous read per block per disk into the same buffer.
// NOTE(review): the remaining arguments and the end of the aread call are
// not visible in this view.
for (unsigned i = 0; i < ndisks; i++)
for (unsigned j = 0; j < current_num_blocks; j++)
reqs[i * current_num_blocks + j] = disks[i]->aread(buffer + current_step_size_int * i + j * block_size_int,
offset + j * block_size,
watch_times(reqs, ndisks, r_finish_times);
wait_all(reqs, ndisks * current_num_blocks);
end = timestamp();
elapsed = end - begin;
totalsizeread += current_step_size;
totaltimeread += elapsed;
} else {
// Read phase skipped: zero elapsed time makes throughput() report 0.
elapsed = 0.0;
#if 0
// Disabled verbose per-step read report.
std::cout << "READ\nDisks: " << ndisks
<< " \nElapsed time: " << end - begin
<< " \nThroughput: " << int(double(current_step_size * ndisks) / MB / (end - begin))
<< " MiB/s \nPer one disk:"
<< int(double(current_step_size) / MB / (end - begin)) << " MiB/s"
<< std::endl;
// Per-step read rate: per disk, then multiplied by the number of disks.
std::cout << std::setw(2) << ndisks << " * "
<< std::setw(8) << std::setprecision(3) << (throughput(current_step_size, elapsed)) << " = "
<< std::setw(8) << std::setprecision(3) << (throughput(current_step_size, elapsed) * ndisks) << " MiB/s read";
out_stat(begin, end, r_finish_times, ndisks, disks_arr);
if (do_read) {
// Verification pass 1: the word at index 42 of every 512-byte sector must
// equal the sector number; the slot is then set back to the pattern so the
// uniform check below can be applied to the whole buffer.
for (unsigned d = 0; d < ndisks; ++d) {
for (unsigned s = 0; s < (current_step_size >> 9); ++s) {
unsigned i = d * current_step_size_int + s * (512 / sizeof(unsigned)) + 42;
unsigned b = (offset >> 9) + s;
if (buffer[i] != b) {
verify_failed = true;
std::cout << "Error on disk " << d << " sector " << std::hex << std::setw(8) << b
<< " got: " << std::hex << std::setw(8) << buffer[i] << " wanted: " << std::hex << std::setw(8) << b
<< std::dec << std::endl;
buffer[i] = pattern;
// Verification pass 2: every word must now equal the pattern. On a mismatch
// the disk index and byte position are reported and i is moved to the start
// of the next disk's region.
for (unsigned i = 0; i < ndisks * current_step_size_int; i++)
if (buffer[i] != pattern)
verify_failed = true;
int ibuf = i / current_step_size_int;
int pos = i % current_step_size_int;
std::cout << "Error on disk " << ibuf << " position " << std::hex << std::setw(8) << offset + pos * sizeof(int)
<< " got: " << std::hex << std::setw(8) << buffer[i] << " wanted: " << std::hex << std::setw(8) << pattern
<< std::dec << std::endl;
i = (ibuf + 1) * current_step_size_int;
std::cout << std::endl;
// Advance to the next step.
offset += current_step_size;
// NOTE(review): the handler's own statements are not distinguishable in this
// view; the usage text says a write error is expected when length == 0.
catch (const std::exception & ex)
std::cout << std::endl;
// Summary: averages over everything written and read.
std::cout << "=============================================================================================" << std::endl;
std::cout << "# Average over " << std::setw(8) << stxxl::STXXL_MAX(totalsizewrite, totalsizeread) / MB << " MiB: ";
std::cout << std::setw(2) << ndisks << " * "
<< std::setw(8) << std::setprecision(3) << (throughput(totalsizewrite, totaltimewrite)) << " = "
<< std::setw(8) << std::setprecision(3) << (throughput(totalsizewrite, totaltimewrite) * ndisks) << " MiB/s write,";
std::cout << std::setw(2) << ndisks << " * "
<< std::setw(8) << std::setprecision(3) << (throughput(totalsizeread, totaltimeread)) << " = "
<< std::setw(8) << std::setprecision(3) << (throughput(totalsizeread, totaltimeread) * ndisks) << " MiB/s read"
<< std::endl;
// Phase times are printed only for phases that actually ran.
if (totaltimewrite != 0.0)
std::cout << "# Write time " << std::setw(8) << std::setprecision(3) << totaltimewrite << " s" << std::endl;
if (totaltimeread != 0.0)
std::cout << "# Read time " << std::setw(8) << std::setprecision(3) << totaltimeread << " s" << std::endl;
// Non-I/O time is the total run time minus both measured I/O phases.
std::cout << "# Non-I/O time " << std::setw(8) << std::setprecision(3) << (t_total.seconds() - totaltimewrite - totaltimeread) << " s, average throughput "
<< std::setw(8) << std::setprecision(3) << (throughput(totalsizewrite + totalsizeread, t_total.seconds() - totaltimewrite - totaltimeread) * ndisks) << " MiB/s"
<< std::endl;
std::cout << "# Total time " << std::setw(8) << std::setprecision(3) << t_total.seconds() << " s, average throughput "
<< std::setw(8) << std::setprecision(3) << (throughput(totalsizewrite + totalsizeread, t_total.seconds()) * ndisks) << " MiB/s"
<< std::endl;
// Release the bookkeeping arrays and the file objects.
delete[] r_finish_times;
delete[] w_finish_times;
delete[] reqs;
for (unsigned i = 0; i < ndisks; i++)
delete disks[i];
delete[] disks;
// Exit status 1 signals that at least one verification check failed.
return verify_failed ? 1 : 0;