// SPDX-License-Identifier: GPL-2.0-or-later
/* Direct I/O support.
 *
 * Copyright (C) 2023 Red Hat, Inc. All Rights Reserved.
 * Written by David Howells (dhowells@redhat.com)
 */

#include <linux/export.h>
#include <linux/fs.h>
#include <linux/mm.h>
#include <linux/pagemap.h>
#include <linux/slab.h>
#include <linux/uio.h>
#include <linux/sched/mm.h>
#include <linux/task_io_accounting_ops.h>
#include <linux/netfs.h>
#include "internal.h"

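/*
 * Prepare the next slice of the destination buffer: clip the subrequest to
 * the transport's maximum I/O size and segment count, then carve that much
 * off the front of the request's iterator.
 */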
static void netfs_prepare_dio_read_iterator(struct netfs_io_subrequest *subreq)
{
        struct netfs_io_request *rreq = subreq->rreq;
        size_t rsize;

        rsize = umin(subreq->len, rreq->io_streams[0].sreq_max_len);
        subreq->len = rsize;

        if (unlikely(rreq->io_streams[0].sreq_max_segs)) {
                size_t limit = netfs_limit_iter(&rreq->iter, 0, rsize,
                                                rreq->io_streams[0].sreq_max_segs);

                if (limit < rsize) {
                        subreq->len = limit;
                        trace_netfs_sreq(subreq, netfs_sreq_trace_limited);
                }
        }

        trace_netfs_sreq(subreq, netfs_sreq_trace_prepare);

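        /* Carve the subrequest's slice off the front of the request's
         * iterator and advance the latter past it.
         */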
        subreq->io_iter = rreq->iter;
        iov_iter_truncate(&subreq->io_iter, subreq->len);
        iov_iter_advance(&rreq->iter, subreq->len);
}

/*
 * Perform a read to a buffer from the server, slicing up the region to be
 * read according to the network rsize.
 */
static int netfs_dispatch_unbuffered_reads(struct netfs_io_request *rreq)
{
        unsigned long long start = rreq->start;
        ssize_t size = rreq->len;
        int ret = 0;

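        /* Bias the outstanding count so that the request can't be deemed
         * complete until we've finished issuing all the subrequests.
         */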
        atomic_set(&rreq->nr_outstanding, 1);

        do {
                struct netfs_io_subrequest *subreq;
                ssize_t slice;

                subreq = netfs_alloc_subrequest(rreq);
                if (!subreq) {
                        ret = -ENOMEM;
                        break;
                }

                subreq->source  = NETFS_DOWNLOAD_FROM_SERVER;
                subreq->start   = start;
                subreq->len     = size;

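                /* Queue the subrequest and pick up any bytes donated forward
                 * by an already-completed predecessor.
                 */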
                atomic_inc(&rreq->nr_outstanding);
                spin_lock_bh(&rreq->lock);
                list_add_tail(&subreq->rreq_link, &rreq->subrequests);
                subreq->prev_donated = rreq->prev_donated;
                rreq->prev_donated = 0;
                trace_netfs_sreq(subreq, netfs_sreq_trace_added);
                spin_unlock_bh(&rreq->lock);

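                /* Give the filesystem a chance to adjust the subrequest,
                 * e.g. to impose its own maximum I/O size or to obtain
                 * transport credits, before the iterator is sliced up.
                 */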
                netfs_stat(&netfs_n_rh_download);
                if (rreq->netfs_ops->prepare_read) {
                        ret = rreq->netfs_ops->prepare_read(subreq);
                        if (ret < 0) {
                                atomic_dec(&rreq->nr_outstanding);
                                netfs_put_subrequest(subreq, false, netfs_sreq_trace_put_cancel);
                                break;
                        }
                }

                netfs_prepare_dio_read_iterator(subreq);
                slice = subreq->len;
                rreq->netfs_ops->issue_read(subreq);

                size -= slice;
                start += slice;
                rreq->submitted += slice;

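                /* If the transport indicated it would have had to block and
                 * the caller asked for non-blocking behaviour, stop issuing
                 * and let the request complete short.
                 */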
                if (test_bit(NETFS_RREQ_BLOCKED, &rreq->flags) &&
                    test_bit(NETFS_RREQ_NONBLOCK, &rreq->flags))
                        break;
                cond_resched();
        } while (size > 0);

        if (atomic_dec_and_test(&rreq->nr_outstanding))
                netfs_rreq_terminated(rreq, false);
        return ret;
}

/*
 * Perform a read to an application buffer, bypassing the pagecache and the
 * local disk cache.
 */
static int netfs_unbuffered_read(struct netfs_io_request *rreq, bool sync)
{
        int ret;

        _enter("R=%x %llx-%llx",
               rreq->debug_id, rreq->start, rreq->start + rreq->len - 1);

        if (rreq->len == 0) {
                pr_err("Zero-sized read [R=%x]\n", rreq->debug_id);
                return -EIO;
        }

        // TODO: Use bounce buffer if requested

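        /* Note on the inode that a DIO is in progress so that operations
         * such as truncation can wait for it to finish.
         */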
        inode_dio_begin(rreq->inode);

        ret = netfs_dispatch_unbuffered_reads(rreq);

        if (!rreq->submitted) {
                netfs_put_request(rreq, false, netfs_rreq_trace_put_no_submit);
                inode_dio_end(rreq->inode);
                ret = 0;
                goto out;
        }

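        /* A synchronous read waits here for all the subrequests to complete;
         * an asynchronous one returns -EIOCBQUEUED and completes through the
         * iocb instead.
         */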
        if (sync) {
                trace_netfs_rreq(rreq, netfs_rreq_trace_wait_ip);
                wait_on_bit(&rreq->flags, NETFS_RREQ_IN_PROGRESS,
                            TASK_UNINTERRUPTIBLE);

                ret = rreq->error;
                if (ret == 0 && rreq->submitted < rreq->len &&
                    rreq->origin != NETFS_DIO_READ) {
                        trace_netfs_failure(rreq, NULL, ret, netfs_fail_short_read);
                        ret = -EIO;
                }
        } else {
                ret = -EIOCBQUEUED;
        }

out:
        _leave(" = %d", ret);
        return ret;
}

/**
 * netfs_unbuffered_read_iter_locked - Perform an unbuffered or direct I/O read
 * @iocb: The I/O control descriptor describing the read
 * @iter: The output buffer (also specifies read length)
 *
 * Perform an unbuffered I/O or direct I/O from the file in @iocb to the
 * output buffer.  No use is made of the pagecache.
 *
 * The caller must hold any appropriate locks.
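 *
 * Return: The number of bytes read on synchronous completion, 0 if nothing
 * was submitted, -EIOCBQUEUED if the read was queued for asynchronous
 * completion or a negative error code.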
 */
ssize_t netfs_unbuffered_read_iter_locked(struct kiocb *iocb, struct iov_iter *iter)
{
        struct netfs_io_request *rreq;
        ssize_t ret;
        size_t orig_count = iov_iter_count(iter);
        bool sync = is_sync_kiocb(iocb);

        _enter("");

        if (!orig_count)
                return 0; /* Don't update atime */

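        /* Flush any dirty pagecache over the target range so that the read
         * sees up-to-date data.
         */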
        ret = kiocb_write_and_wait(iocb, orig_count);
        if (ret < 0)
                return ret;
        file_accessed(iocb->ki_filp);

        rreq = netfs_alloc_request(iocb->ki_filp->f_mapping, iocb->ki_filp,
                                   iocb->ki_pos, orig_count,
                                   NETFS_DIO_READ);
        if (IS_ERR(rreq))
                return PTR_ERR(rreq);

        netfs_stat(&netfs_n_rh_dio_read);
        trace_netfs_read(rreq, rreq->start, rreq->len, netfs_read_trace_dio_read);

        /* If this is an async op, we have to keep track of the destination
         * buffer for ourselves as the caller's iterator will be trashed when
         * we return.
         *
         * In such a case, extract an iterator to represent as much of the
         * output buffer as we can manage.  Note that the extraction might not
         * be able to allocate a sufficiently large bvec array and may shorten
         * the request.
         */
        if (user_backed_iter(iter)) {
                ret = netfs_extract_user_iter(iter, rreq->len, &rreq->iter, 0);
                if (ret < 0)
                        goto out;
                rreq->direct_bv = (struct bio_vec *)rreq->iter.bvec;
                rreq->direct_bv_count = ret;
                rreq->direct_bv_unpin = iov_iter_extract_will_pin(iter);
                rreq->len = iov_iter_count(&rreq->iter);
        } else {
                rreq->iter = *iter;
                rreq->len = orig_count;
                rreq->direct_bv_unpin = false;
                iov_iter_advance(iter, orig_count);
        }

        // TODO: Set up bounce buffer if needed

        if (!sync)
                rreq->iocb = iocb;

        ret = netfs_unbuffered_read(rreq, sync);
        if (ret < 0)
                goto out; /* May be -EIOCBQUEUED */
        if (sync) {
                // TODO: Copy from bounce buffer
                iocb->ki_pos += rreq->transferred;
                ret = rreq->transferred;
        }

out:
        netfs_put_request(rreq, false, netfs_rreq_trace_put_return);
        if (ret > 0)
                orig_count -= ret;
        return ret;
}
EXPORT_SYMBOL(netfs_unbuffered_read_iter_locked);

/**
 * netfs_unbuffered_read_iter - Perform an unbuffered or direct I/O read
 * @iocb: The I/O control descriptor describing the read
 * @iter: The output buffer (also specifies read length)
 *
 * Perform an unbuffered I/O or direct I/O from the file in @iocb to the
 * output buffer.  No use is made of the pagecache.
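 *
 * Return: The number of bytes read, -EIOCBQUEUED if the read was queued for
 * asynchronous completion or a negative error code.
 *
 * A network filesystem's ->read_iter() would typically divert to this for
 * O_DIRECT reads, along these lines (a sketch only; the surrounding
 * filesystem code is hypothetical):
 *
 *	if (iocb->ki_flags & IOCB_DIRECT)
 *		return netfs_unbuffered_read_iter(iocb, iter);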
 */
ssize_t netfs_unbuffered_read_iter(struct kiocb *iocb, struct iov_iter *iter)
{
        struct inode *inode = file_inode(iocb->ki_filp);
        ssize_t ret;

        if (!iter->count)
                return 0; /* Don't update atime */

        ret = netfs_start_io_direct(inode);
        if (ret == 0) {
                ret = netfs_unbuffered_read_iter_locked(iocb, iter);
                netfs_end_io_direct(inode);
        }
        return ret;
}
EXPORT_SYMBOL(netfs_unbuffered_read_iter);