1 // SPDX-License-Identifier: GPL-2.0-or-later 2 /* Iterator helpers. 3 * 4 * Copyright (C) 2022 Red Hat, Inc. All Rights Reserved. 5 * Written by David Howells (dhowells@redhat.com) 6 */ 7 8 #include <linux/export.h> 9 #include <linux/slab.h> 10 #include <linux/mm.h> 11 #include <linux/uio.h> 12 #include <linux/scatterlist.h> 13 #include <linux/netfs.h> 14 #include "internal.h" 15 16 /** 17 * netfs_extract_user_iter - Extract the pages from a user iterator into a bvec 18 * @orig: The original iterator 19 * @orig_len: The amount of iterator to copy 20 * @new: The iterator to be set up 21 * @extraction_flags: Flags to qualify the request 22 * 23 * Extract the page fragments from the given amount of the source iterator and 24 * build up a second iterator that refers to all of those bits. This allows 25 * the original iterator to be disposed of. 26 * 27 * @extraction_flags can have ITER_ALLOW_P2PDMA set to request peer-to-peer DMA be 28 * allowed on the pages extracted. 29 * 30 * On success, the number of elements in the bvec is returned, the original 31 * iterator will have been advanced by the amount extracted. 32 * 33 * The iov_iter_extract_mode() function should be used to query how cleanup 34 * should be performed. 35 */ 36 ssize_t netfs_extract_user_iter(struct iov_iter *orig, size_t orig_len, 37 struct iov_iter *new, 38 iov_iter_extraction_t extraction_flags) 39 { 40 struct bio_vec *bv = NULL; 41 struct page **pages; 42 unsigned int cur_npages; 43 unsigned int max_pages; 44 unsigned int npages = 0; 45 unsigned int i; 46 ssize_t ret = 0; 47 size_t count = orig_len, offset, len; 48 size_t bv_size, pg_size; 49 50 if (WARN_ON_ONCE(!iter_is_ubuf(orig) && !iter_is_iovec(orig))) 51 return -EIO; 52 53 max_pages = iov_iter_npages(orig, INT_MAX); 54 bv_size = array_size(max_pages, sizeof(*bv)); 55 bv = kvmalloc(bv_size, GFP_KERNEL); 56 if (!bv) 57 return -ENOMEM; 58 59 /* Put the page list at the end of the bvec list storage. bvec 60 * elements are larger than page pointers, so as long as we work 61 * 0->last, we should be fine. 62 */ 63 pg_size = array_size(max_pages, sizeof(*pages)); 64 pages = (void *)bv + bv_size - pg_size; 65 66 while (count && npages < max_pages) { 67 ret = iov_iter_extract_pages(orig, &pages, count, 68 max_pages - npages, extraction_flags, 69 &offset); 70 if (unlikely(ret <= 0)) { 71 ret = ret ?: -EIO; 72 break; 73 } 74 75 if (WARN(ret > count, 76 "%s: extract_pages overrun %zd > %zu bytes\n", 77 __func__, ret, count)) { 78 ret = -EIO; 79 break; 80 } 81 82 cur_npages = DIV_ROUND_UP(offset + ret, PAGE_SIZE); 83 if (WARN(cur_npages > max_pages - npages, 84 "%s: extract_pages overrun %u > %u pages\n", 85 __func__, npages + cur_npages, max_pages)) { 86 ret = -EIO; 87 break; 88 } 89 90 count -= ret; 91 ret += offset; 92 93 for (i = 0; i < cur_npages; i++) { 94 len = ret > PAGE_SIZE ? PAGE_SIZE : ret; 95 bvec_set_page(bv + npages + i, *pages++, len - offset, offset); 96 ret -= len; 97 offset = 0; 98 } 99 100 npages += cur_npages; 101 } 102 103 /* Note: Don't try to clean up after EIO. Either we got no pages, so 104 * nothing to clean up, or we got a buffer overrun, memory corruption 105 * and can't trust the stuff in the buffer (a WARN was emitted). 106 */ 107 108 if (ret < 0 && (ret == -ENOMEM || npages == 0)) { 109 for (i = 0; i < npages; i++) 110 unpin_user_page(bv[i].bv_page); 111 kvfree(bv); 112 return ret; 113 } 114 115 iov_iter_bvec(new, orig->data_source, bv, npages, orig_len - count); 116 return npages; 117 } 118 EXPORT_SYMBOL_GPL(netfs_extract_user_iter); 119 120 /* 121 * Select the span of a bvec iterator we're going to use. Limit it by both maximum 122 * size and maximum number of segments. Returns the size of the span in bytes. 123 */ 124 static size_t netfs_limit_bvec(const struct iov_iter *iter, size_t start_offset, 125 size_t max_size, size_t max_segs) 126 { 127 const struct bio_vec *bvecs = iter->bvec; 128 unsigned int nbv = iter->nr_segs, ix = 0, nsegs = 0; 129 size_t len, span = 0, n = iter->count; 130 size_t skip = iter->iov_offset + start_offset; 131 132 if (WARN_ON(!iov_iter_is_bvec(iter)) || 133 WARN_ON(start_offset > n) || 134 n == 0) 135 return 0; 136 137 while (n && ix < nbv && skip) { 138 len = bvecs[ix].bv_len; 139 if (skip < len) 140 break; 141 skip -= len; 142 n -= len; 143 ix++; 144 } 145 146 while (n && ix < nbv) { 147 len = min3(n, bvecs[ix].bv_len - skip, max_size); 148 span += len; 149 nsegs++; 150 ix++; 151 if (span >= max_size || nsegs >= max_segs) 152 break; 153 skip = 0; 154 n -= len; 155 } 156 157 return min(span, max_size); 158 } 159 160 /* 161 * Select the span of a kvec iterator we're going to use. Limit it by both 162 * maximum size and maximum number of segments. Returns the size of the span 163 * in bytes. 164 */ 165 static size_t netfs_limit_kvec(const struct iov_iter *iter, size_t start_offset, 166 size_t max_size, size_t max_segs) 167 { 168 const struct kvec *kvecs = iter->kvec; 169 unsigned int nkv = iter->nr_segs, ix = 0, nsegs = 0; 170 size_t len, span = 0, n = iter->count; 171 size_t skip = iter->iov_offset + start_offset; 172 173 if (WARN_ON(!iov_iter_is_kvec(iter)) || 174 WARN_ON(start_offset > n) || 175 n == 0) 176 return 0; 177 178 while (n && ix < nkv && skip) { 179 len = kvecs[ix].iov_len; 180 if (skip < len) 181 break; 182 skip -= len; 183 n -= len; 184 ix++; 185 } 186 187 while (n && ix < nkv) { 188 len = min3(n, kvecs[ix].iov_len - skip, max_size); 189 span += len; 190 nsegs++; 191 ix++; 192 if (span >= max_size || nsegs >= max_segs) 193 break; 194 skip = 0; 195 n -= len; 196 } 197 198 return min(span, max_size); 199 } 200 201 /* 202 * Select the span of an xarray iterator we're going to use. Limit it by both 203 * maximum size and maximum number of segments. It is assumed that segments 204 * can be larger than a page in size, provided they're physically contiguous. 205 * Returns the size of the span in bytes. 206 */ 207 static size_t netfs_limit_xarray(const struct iov_iter *iter, size_t start_offset, 208 size_t max_size, size_t max_segs) 209 { 210 struct folio *folio; 211 unsigned int nsegs = 0; 212 loff_t pos = iter->xarray_start + iter->iov_offset; 213 pgoff_t index = pos / PAGE_SIZE; 214 size_t span = 0, n = iter->count; 215 216 XA_STATE(xas, iter->xarray, index); 217 218 if (WARN_ON(!iov_iter_is_xarray(iter)) || 219 WARN_ON(start_offset > n) || 220 n == 0) 221 return 0; 222 max_size = min(max_size, n - start_offset); 223 224 rcu_read_lock(); 225 xas_for_each(&xas, folio, ULONG_MAX) { 226 size_t offset, flen, len; 227 if (xas_retry(&xas, folio)) 228 continue; 229 if (WARN_ON(xa_is_value(folio))) 230 break; 231 if (WARN_ON(folio_test_hugetlb(folio))) 232 break; 233 234 flen = folio_size(folio); 235 offset = offset_in_folio(folio, pos); 236 len = min(max_size, flen - offset); 237 span += len; 238 nsegs++; 239 if (span >= max_size || nsegs >= max_segs) 240 break; 241 } 242 243 rcu_read_unlock(); 244 return min(span, max_size); 245 } 246 247 /* 248 * Select the span of a folio queue iterator we're going to use. Limit it by 249 * both maximum size and maximum number of segments. Returns the size of the 250 * span in bytes. 251 */ 252 static size_t netfs_limit_folioq(const struct iov_iter *iter, size_t start_offset, 253 size_t max_size, size_t max_segs) 254 { 255 const struct folio_queue *folioq = iter->folioq; 256 unsigned int nsegs = 0; 257 unsigned int slot = iter->folioq_slot; 258 size_t span = 0, n = iter->count; 259 260 if (WARN_ON(!iov_iter_is_folioq(iter)) || 261 WARN_ON(start_offset > n) || 262 n == 0) 263 return 0; 264 max_size = umin(max_size, n - start_offset); 265 266 if (slot >= folioq_nr_slots(folioq)) { 267 folioq = folioq->next; 268 slot = 0; 269 } 270 271 start_offset += iter->iov_offset; 272 do { 273 size_t flen = folioq_folio_size(folioq, slot); 274 275 if (start_offset < flen) { 276 span += flen - start_offset; 277 nsegs++; 278 start_offset = 0; 279 } else { 280 start_offset -= flen; 281 } 282 if (span >= max_size || nsegs >= max_segs) 283 break; 284 285 slot++; 286 if (slot >= folioq_nr_slots(folioq)) { 287 folioq = folioq->next; 288 slot = 0; 289 } 290 } while (folioq); 291 292 return umin(span, max_size); 293 } 294 295 size_t netfs_limit_iter(const struct iov_iter *iter, size_t start_offset, 296 size_t max_size, size_t max_segs) 297 { 298 if (iov_iter_is_folioq(iter)) 299 return netfs_limit_folioq(iter, start_offset, max_size, max_segs); 300 if (iov_iter_is_bvec(iter)) 301 return netfs_limit_bvec(iter, start_offset, max_size, max_segs); 302 if (iov_iter_is_xarray(iter)) 303 return netfs_limit_xarray(iter, start_offset, max_size, max_segs); 304 if (iov_iter_is_kvec(iter)) 305 return netfs_limit_kvec(iter, start_offset, max_size, max_segs); 306 BUG(); 307 } 308 EXPORT_SYMBOL(netfs_limit_iter); 309