blob: eefb7767f3eab953f202236a395b096ef8f67636 [file] [log] [blame]
/*
* libpmem: IO engine that uses PMDK libpmem to read and write data
*
* Copyright (C) 2017 Nippon Telegraph and Telephone Corporation.
* Copyright 2018-2020, Intel Corporation
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public License,
* version 2 as published by the Free Software Foundation..
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
*/
/*
* libpmem engine
*
* IO engine that uses libpmem to write data (and memcpy to read)
*
* To use:
* ioengine=libpmem
*
* Other relevant settings:
* iodepth=1
* direct=1
* sync=1
* directory=/mnt/pmem0/
* bs=4k
*
* sync=1 means that pmem_drain() is executed for each write operation.
* Otherwise is not and should be called on demand.
*
* direct=1 means PMEM_F_MEM_NONTEMPORAL flag is set in pmem_memcpy().
*
* The pmem device must have a DAX-capable filesystem and be mounted
* with DAX enabled. Directory must point to a mount point of DAX FS.
*
* Example:
* mkfs.xfs /dev/pmem0
* mkdir /mnt/pmem0
* mount -o dax /dev/pmem0 /mnt/pmem0
*
* See examples/libpmem.fio for more.
*
*
* libpmem.so
* By default, the libpmem engine will let the system find the libpmem.so
* that it uses. You can use an alternative libpmem by setting the
* FIO_PMEM_LIB environment variable to the full path to the desired
* libpmem.so. This engine requires PMDK >= 1.5.
*/
#include <stdio.h>
#include <limits.h>
#include <stdlib.h>
#include <unistd.h>
#include <errno.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <sys/sysmacros.h>
#include <libgen.h>
#include <libpmem.h>
#include "../fio.h"
#include "../verify.h"
struct fio_libpmem_data {
void *libpmem_ptr;
size_t libpmem_sz;
off_t libpmem_off;
};
static int fio_libpmem_init(struct thread_data *td)
{
struct thread_options *o = &td->o;
dprint(FD_IO,"o->rw_min_bs %llu \n o->fsync_blocks %u \n o->fdatasync_blocks %u \n",
o->rw_min_bs,o->fsync_blocks,o->fdatasync_blocks);
dprint(FD_IO, "DEBUG fio_libpmem_init\n");
if ((o->rw_min_bs & page_mask) &&
(o->fsync_blocks || o->fdatasync_blocks)) {
log_err("libpmem: mmap options dictate a minimum block size of "
"%llu bytes\n", (unsigned long long) page_size);
return 1;
}
return 0;
}
/*
* This is the pmem_map_file execution function
*/
static int fio_libpmem_file(struct thread_data *td, struct fio_file *f,
size_t length, off_t off)
{
struct fio_libpmem_data *fdd = FILE_ENG_DATA(f);
mode_t mode = 0;
size_t mapped_len;
int is_pmem;
if(td_rw(td))
mode = S_IWUSR | S_IRUSR;
else if (td_write(td))
mode = S_IWUSR;
else
mode = S_IRUSR;
dprint(FD_IO, "DEBUG fio_libpmem_file\n");
dprint(FD_IO, "f->file_name = %s td->o.verify = %d \n", f->file_name,
td->o.verify);
dprint(FD_IO, "length = %ld f->fd = %d off = %ld file mode = %d \n",
length, f->fd, off, mode);
/* unmap any existing mapping */
if (fdd->libpmem_ptr) {
dprint(FD_IO,"pmem_unmap \n");
if (pmem_unmap(fdd->libpmem_ptr, fdd->libpmem_sz) < 0)
return errno;
fdd->libpmem_ptr = NULL;
}
if((fdd->libpmem_ptr = pmem_map_file(f->file_name, length, PMEM_FILE_CREATE, mode, &mapped_len, &is_pmem)) == NULL) {
td_verror(td, errno, pmem_errormsg());
goto err;
}
if (!is_pmem) {
td_verror(td, errno, "file_name does not point to persistent memory");
}
err:
if (td->error && fdd->libpmem_ptr)
pmem_unmap(fdd->libpmem_ptr, length);
return td->error;
}
static int fio_libpmem_open_file(struct thread_data *td, struct fio_file *f)
{
struct fio_libpmem_data *fdd;
dprint(FD_IO,"DEBUG fio_libpmem_open_file\n");
dprint(FD_IO,"f->io_size=%ld \n",f->io_size);
dprint(FD_IO,"td->o.size=%lld \n",td->o.size);
dprint(FD_IO,"td->o.iodepth=%d\n",td->o.iodepth);
dprint(FD_IO,"td->o.iodepth_batch=%d \n",td->o.iodepth_batch);
if (fio_file_open(f))
td_io_close_file(td, f);
fdd = calloc(1, sizeof(*fdd));
if (!fdd) {
return 1;
}
FILE_SET_ENG_DATA(f, fdd);
fdd->libpmem_sz = f->io_size;
fdd->libpmem_off = 0;
return fio_libpmem_file(td, f, fdd->libpmem_sz, fdd->libpmem_off);
}
static int fio_libpmem_prep(struct thread_data *td, struct io_u *io_u)
{
struct fio_file *f = io_u->file;
struct fio_libpmem_data *fdd = FILE_ENG_DATA(f);
dprint(FD_IO, "DEBUG fio_libpmem_prep\n" );
dprint(FD_IO," io_u->offset %llu : fdd->libpmem_off %ld : "
"io_u->buflen %llu : fdd->libpmem_sz %ld\n",
io_u->offset, fdd->libpmem_off,
io_u->buflen, fdd->libpmem_sz);
if (io_u->buflen > f->real_file_size) {
log_err("libpmem: bs bigger than the file size\n");
return EIO;
}
io_u->mmap_data = fdd->libpmem_ptr + io_u->offset - fdd->libpmem_off
- f->file_offset;
return 0;
}
static enum fio_q_status fio_libpmem_queue(struct thread_data *td,
struct io_u *io_u)
{
unsigned flags = 0;
fio_ro_check(td, io_u);
io_u->error = 0;
dprint(FD_IO, "DEBUG fio_libpmem_queue\n");
dprint(FD_IO,"td->o.odirect %d td->o.sync_io %d \n",td->o.odirect, td->o.sync_io);
/* map both O_SYNC / DSYNC to not using NODRAIN */
flags = td->o.sync_io ? 0 : PMEM_F_MEM_NODRAIN;
flags |= td->o.odirect ? PMEM_F_MEM_NONTEMPORAL : PMEM_F_MEM_TEMPORAL;
switch (io_u->ddir) {
case DDIR_READ:
memcpy(io_u->xfer_buf, io_u->mmap_data, io_u->xfer_buflen);
break;
case DDIR_WRITE:
dprint(FD_IO, "DEBUG mmap_data=%p, xfer_buf=%p\n",
io_u->mmap_data, io_u->xfer_buf );
pmem_memcpy(io_u->mmap_data,
io_u->xfer_buf,
io_u->xfer_buflen,
flags);
break;
case DDIR_SYNC:
case DDIR_DATASYNC:
case DDIR_SYNC_FILE_RANGE:
pmem_drain();
break;
default:
io_u->error = EINVAL;
break;
}
return FIO_Q_COMPLETED;
}
static int fio_libpmem_close_file(struct thread_data *td, struct fio_file *f)
{
struct fio_libpmem_data *fdd = FILE_ENG_DATA(f);
int ret = 0;
dprint(FD_IO,"DEBUG fio_libpmem_close_file\n");
dprint(FD_IO,"td->o.odirect %d \n",td->o.odirect);
if (!td->o.odirect) {
dprint(FD_IO,"pmem_drain\n");
pmem_drain();
}
if (fdd->libpmem_ptr)
ret = pmem_unmap(fdd->libpmem_ptr, fdd->libpmem_sz);
if (fio_file_open(f))
ret &= generic_close_file(td, f);
FILE_SET_ENG_DATA(f, NULL);
free(fdd);
return ret;
}
FIO_STATIC struct ioengine_ops ioengine = {
.name = "libpmem",
.version = FIO_IOOPS_VERSION,
.init = fio_libpmem_init,
.prep = fio_libpmem_prep,
.queue = fio_libpmem_queue,
.open_file = fio_libpmem_open_file,
.close_file = fio_libpmem_close_file,
.get_file_size = generic_get_file_size,
.flags = FIO_SYNCIO | FIO_RAWIO | FIO_DISKLESSIO | FIO_NOEXTEND |
FIO_NODISKUTIL | FIO_BARRIER | FIO_MEMALIGN,
};
static void fio_init fio_libpmem_register(void)
{
register_ioengine(&ioengine);
}
static void fio_exit fio_libpmem_unregister(void)
{
unregister_ioengine(&ioengine);
}