mm/filemap.c: lines matching "buffered", "-", "negative"

1 // SPDX-License-Identifier: GPL-2.0-only
5 * Copyright (C) 1994-1999 Linus Torvalds
28 #include <linux/error-injection.h>
31 #include <linux/backing-dev.h>
65 * finished 'unifying' the page and buffer cache and SMP-threaded the
66 * page-cache, 21.05.1999, Ingo Molnar <mingo@redhat.com>
68 * SMP-threaded pagemap-LRU 1999, Andrea Arcangeli <andrea@suse.de>
74 * ->i_mmap_rwsem (truncate_pagecache)
75 * ->private_lock (__free_pte->__set_page_dirty_buffers)
76 * ->swap_lock (exclusive_swap_page, others)
77 * ->i_pages lock
79 * ->i_rwsem
80 * ->invalidate_lock (acquired by fs in truncate path)
81 * ->i_mmap_rwsem (truncate->unmap_mapping_range)
83 * ->mmap_lock
84 * ->i_mmap_rwsem
85 * ->page_table_lock or pte_lock (various, mainly in memory.c)
86 * ->i_pages lock (arch-dependent flush_dcache_mmap_lock)
88 * ->mmap_lock
89 * ->invalidate_lock (filemap_fault)
90 * ->lock_page (filemap_fault, access_process_vm)
92 * ->i_rwsem (generic_perform_write)
93 * ->mmap_lock (fault_in_pages_readable->do_page_fault)
95 * bdi->wb.list_lock
96 * sb_lock (fs/fs-writeback.c)
97 * ->i_pages lock (__sync_single_inode)
99 * ->i_mmap_rwsem
100 * ->anon_vma.lock (vma_adjust)
102 * ->anon_vma.lock
103 * ->page_table_lock or pte_lock (anon_vma_prepare and various)
105 * ->page_table_lock or pte_lock
106 * ->swap_lock (try_to_unmap_one)
107 * ->private_lock (try_to_unmap_one)
108 * ->i_pages lock (try_to_unmap_one)
109 * ->lruvec->lru_lock (follow_page->mark_page_accessed)
110 * ->lruvec->lru_lock (check_pte_range->isolate_lru_page)
111 * ->private_lock (page_remove_rmap->set_page_dirty)
112 * ->i_pages lock (page_remove_rmap->set_page_dirty)
113 * bdi.wb->list_lock (page_remove_rmap->set_page_dirty)
114 * ->inode->i_lock (page_remove_rmap->set_page_dirty)
115 * ->memcg->move_lock (page_remove_rmap->lock_page_memcg)
116 * bdi.wb->list_lock (zap_pte_range->set_page_dirty)
117 * ->inode->i_lock (zap_pte_range->set_page_dirty)
118 * ->private_lock (zap_pte_range->__set_page_dirty_buffers)
120 * ->i_mmap_rwsem
121 * ->tasklist_lock (memory_failure, collect_procs_ao)
127 XA_STATE(xas, &mapping->i_pages, page->index); in page_cache_delete()
134 xas_set_order(&xas, page->index, compound_order(page)); in page_cache_delete()
145 page->mapping = NULL; in page_cache_delete()
146 /* Leave page->index set: truncation lookup relies upon it */ in page_cache_delete()
147 mapping->nrpages -= nr; in page_cache_delete()
171 current->comm, page_to_pfn(page)); in unaccount_page_cache_page()
196 __mod_lruvec_page_state(page, NR_FILE_PAGES, -nr); in unaccount_page_cache_page()
198 __mod_lruvec_page_state(page, NR_SHMEM, -nr); in unaccount_page_cache_page()
200 __mod_lruvec_page_state(page, NR_SHMEM_THPS, -nr); in unaccount_page_cache_page()
202 __mod_lruvec_page_state(page, NR_FILE_THPS, -nr); in unaccount_page_cache_page()
217 account_page_cleaned(page, mapping, inode_to_wb(mapping->host)); in unaccount_page_cache_page()
222 * sure the page is locked and that nobody else uses it - or that usage
227 struct address_space *mapping = page->mapping; in __delete_from_page_cache()
240 freepage = mapping->a_ops->freepage; in page_cache_free_page()
253 * delete_from_page_cache - delete page from page cache
265 xa_lock_irq(&mapping->i_pages); in delete_from_page_cache()
267 xa_unlock_irq(&mapping->i_pages); in delete_from_page_cache()
274 * page_cache_delete_batch - delete several pages from page cache
278 * The function walks over mapping->i_pages and removes pages passed in @pvec
290 XA_STATE(xas, &mapping->i_pages, pvec->pages[0]->index); in page_cache_delete_batch()
310 if (page != pvec->pages[i]) { in page_cache_delete_batch()
311 VM_BUG_ON_PAGE(page->index > pvec->pages[i]->index, in page_cache_delete_batch()
318 if (page->index == xas.xa_index) in page_cache_delete_batch()
319 page->mapping = NULL; in page_cache_delete_batch()
320 /* Leave page->index set: truncation lookup relies on it */ in page_cache_delete_batch()
324 * page or the index is of the last sub-page of this compound in page_cache_delete_batch()
327 if (page->index + compound_nr(page) - 1 == xas.xa_index) in page_cache_delete_batch()
332 mapping->nrpages -= total_pages; in page_cache_delete_batch()
343 xa_lock_irq(&mapping->i_pages); in delete_from_page_cache_batch()
345 trace_mm_filemap_delete_from_page_cache(pvec->pages[i]); in delete_from_page_cache_batch()
347 unaccount_page_cache_page(mapping, pvec->pages[i]); in delete_from_page_cache_batch()
350 xa_unlock_irq(&mapping->i_pages); in delete_from_page_cache_batch()
353 page_cache_free_page(mapping, pvec->pages[i]); in delete_from_page_cache_batch()
360 if (test_bit(AS_ENOSPC, &mapping->flags) && in filemap_check_errors()
361 test_and_clear_bit(AS_ENOSPC, &mapping->flags)) in filemap_check_errors()
362 ret = -ENOSPC; in filemap_check_errors()
363 if (test_bit(AS_EIO, &mapping->flags) && in filemap_check_errors()
364 test_and_clear_bit(AS_EIO, &mapping->flags)) in filemap_check_errors()
365 ret = -EIO; in filemap_check_errors()
373 if (test_bit(AS_EIO, &mapping->flags)) in filemap_check_and_keep_errors()
374 return -EIO; in filemap_check_and_keep_errors()
375 if (test_bit(AS_ENOSPC, &mapping->flags)) in filemap_check_and_keep_errors()
376 return -ENOSPC; in filemap_check_and_keep_errors()
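
The two helpers above differ only in whether they consume the error state:
filemap_check_errors() uses test_and_clear_bit(), so each AS_EIO/AS_ENOSPC
flag is reported exactly once, while filemap_check_and_keep_errors() only
tests the bits. Both are file-local; a sketch of the effective semantics
(illustration only, not from the listing):

	/* set_bit(AS_EIO, &mapping->flags);        writeback failed    */
	/* filemap_check_and_keep_errors(mapping);  -EIO, bit kept      */
	/* filemap_check_errors(mapping);           -EIO, bit cleared   */
	/* filemap_check_errors(mapping);           0                   */

The "keep" variant suits system-wide flushers such as sync(2) that must not
eat an error belonging to a later fsync() caller.
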
381 * filemap_fdatawrite_wbc - start writeback on mapping dirty pages in range
388 * Return: %0 on success, negative error code otherwise.
399 wbc_attach_fdatawrite_inode(wbc, mapping->host); in filemap_fdatawrite_wbc()
407 * __filemap_fdatawrite_range - start writeback on mapping dirty pages in range
421 * Return: %0 on success, negative error code otherwise.
456 * filemap_flush - mostly a non-blocking flush
459 * This is a mostly non-blocking flush. Not suitable for data-integrity
460 * purposes - I/O may not be started against all dirty pages.
462 * Return: %0 on success, negative error code otherwise.
471 * filemap_range_has_page - check if a page exists in range.
486 XA_STATE(xas, &mapping->i_pages, start_byte >> PAGE_SHIFT); in filemap_range_has_page()
545 * filemap_fdatawait_range - wait for writeback to complete
550 * Walk the list of under-writeback pages of the given address space
569 * filemap_fdatawait_range_keep_errors - wait for writeback to complete
574 * Walk the list of under-writeback pages of the given address space in the
579 * call sites are system-wide / filesystem-wide data flushers: e.g. sync(2),
591 * file_fdatawait_range - wait for writeback to complete
596 * Walk the list of under-writeback pages of the address space that file
598 * status of the address space vs. the file->f_wb_err cursor and return it.
604 * Return: error status of the address space vs. the file->f_wb_err cursor.
608 struct address_space *mapping = file->f_mapping; in file_fdatawait_range()
616 * filemap_fdatawait_keep_errors - wait for writeback without clearing errors
619 * Walk the list of under-writeback pages of the given address space
624 * call sites are system-wide / filesystem-wide data flushers: e.g. sync(2),
639 return mapping->nrpages; in mapping_needs_writeback()
643 * filemap_range_needs_writeback - check if range potentially needs writeback
659 XA_STATE(xas, &mapping->i_pages, start_byte >> PAGE_SHIFT); in filemap_range_needs_writeback()
686 * filemap_write_and_wait_range - write out & wait on a file range
691 * Write out and wait upon file offsets lstart->lend, inclusive.
694 * that this function can be used to write to the very end-of-file (end = -1).
708 * written partially (e.g. -ENOSPC), so we wait for it. in filemap_write_and_wait_range()
709 * But the -EIO is special case, it may indicate the worst in filemap_write_and_wait_range()
712 if (err != -EIO) { in filemap_write_and_wait_range()
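
A typical consumer of filemap_write_and_wait_range() is a filesystem's
->fsync() method. A minimal sketch, assuming a hypothetical example_fsync()
for a filesystem with no metadata of its own to flush:

	/* Flush and wait on the requested byte range, then report any
	 * writeback error recorded against the mapping. */
	static int example_fsync(struct file *file, loff_t start, loff_t end,
				 int datasync)
	{
		struct inode *inode = file_inode(file);

		return filemap_write_and_wait_range(inode->i_mapping,
						    start, end);
	}
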
730 errseq_t eseq = errseq_set(&mapping->wb_err, err); in __filemap_set_wb_err()
737 * file_check_and_advance_wb_err - report wb error (if any) that was previously
754 * While we handle mapping->wb_err with atomic operations, the f_wb_err
758 * Return: %0 on success, negative error code otherwise.
763 errseq_t old = READ_ONCE(file->f_wb_err); in file_check_and_advance_wb_err()
764 struct address_space *mapping = file->f_mapping; in file_check_and_advance_wb_err()
767 if (errseq_check(&mapping->wb_err, old)) { in file_check_and_advance_wb_err()
769 spin_lock(&file->f_lock); in file_check_and_advance_wb_err()
770 old = file->f_wb_err; in file_check_and_advance_wb_err()
771 err = errseq_check_and_advance(&mapping->wb_err, in file_check_and_advance_wb_err()
772 &file->f_wb_err); in file_check_and_advance_wb_err()
774 spin_unlock(&file->f_lock); in file_check_and_advance_wb_err()
782 clear_bit(AS_EIO, &mapping->flags); in file_check_and_advance_wb_err()
783 clear_bit(AS_ENOSPC, &mapping->flags); in file_check_and_advance_wb_err()
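
Seen from userspace, the sample-and-advance protocol above gives "report
once per file description" semantics. A sketch of the intended behaviour
(illustration, not a test from this file):

	/*
	 * write(fd, buf, len);   dirties the page cache
	 * ...background writeback fails with EIO...
	 * fsync(fd);             returns -1, errno == EIO; cursor advances
	 * fsync(fd);             returns 0; this fd already saw the error
	 *
	 * A second fd on the same file has its own f_wb_err cursor and
	 * still observes the error on its first fsync().
	 */
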
789 * file_write_and_wait_range - write out & wait on a file range
794 * Write out and wait upon file offsets lstart->lend, inclusive.
797 * that this function can be used to write to the very end-of-file (end = -1).
802 * Return: %0 on success, negative error code otherwise.
807 struct address_space *mapping = file->f_mapping; in file_write_and_wait_range()
813 if (err != -EIO) in file_write_and_wait_range()
824 * replace_page_cache_page - replace a pagecache page with a new one
838 struct address_space *mapping = old->mapping; in replace_page_cache_page()
839 void (*freepage)(struct page *) = mapping->a_ops->freepage; in replace_page_cache_page()
840 pgoff_t offset = old->index; in replace_page_cache_page()
841 XA_STATE(xas, &mapping->i_pages, offset); in replace_page_cache_page()
845 VM_BUG_ON_PAGE(new->mapping, new); in replace_page_cache_page()
848 new->mapping = mapping; in replace_page_cache_page()
849 new->index = offset; in replace_page_cache_page()
856 old->mapping = NULL; in replace_page_cache_page()
878 XA_STATE(xas, &mapping->i_pages, offset); in __add_to_page_cache_locked()
888 page->mapping = mapping; in __add_to_page_cache_locked()
889 page->index = offset; in __add_to_page_cache_locked()
911 xas_set_err(&xas, -EEXIST); in __add_to_page_cache_locked()
931 mapping->nrpages++; in __add_to_page_cache_locked()
950 page->mapping = NULL; in __add_to_page_cache_locked()
951 /* Leave page->index set: truncation relies upon it */ in __add_to_page_cache_locked()
958 * add_to_page_cache_locked - add a locked page to the pagecache
967 * Return: %0 on success, negative error code otherwise.
1028 * filemap_invalidate_lock_two - lock invalidate_lock for two mappings
1041 down_write(&mapping1->invalidate_lock); in filemap_invalidate_lock_two()
1043 down_write_nested(&mapping2->invalidate_lock, 1); in filemap_invalidate_lock_two()
1048 * filemap_invalidate_unlock_two - unlock invalidate_lock for two mappings
1059 up_write(&mapping1->invalidate_lock); in filemap_invalidate_unlock_two()
1061 up_write(&mapping2->invalidate_lock); in filemap_invalidate_unlock_two()
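
The helper pair above orders the two locks by comparing the mapping
pointers (the comparison sits outside the matched lines), which is why the
second acquisition uses down_write_nested(..., 1) rather than plain
down_write(). A hypothetical call site operating on two files:

	/* E.g. a dedupe/exchange path that must block page faults and
	 * reads on both mappings while it rewrites them. */
	filemap_invalidate_lock_two(inode1->i_mapping, inode2->i_mapping);
	/* ... invalidate / repopulate the page cache of both files ... */
	filemap_invalidate_unlock_two(inode1->i_mapping, inode2->i_mapping);
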
1095 * The page wait code treats the "wait->flags" somewhat unusually, because
1142 flags = wait->flags; in wake_page_function()
1144 if (test_bit(key->bit_nr, &key->page->flags)) in wake_page_function()
1145 return -1; in wake_page_function()
1147 if (test_and_set_bit(key->bit_nr, &key->page->flags)) in wake_page_function()
1148 return -1; in wake_page_function()
1154 * We are holding the wait-queue lock, but the waiter that in wake_page_function()
1159 * afterwards to avoid any races. This store-release pairs in wake_page_function()
1160 * with the load-acquire in wait_on_page_bit_common(). in wake_page_function()
1162 smp_store_release(&wait->flags, flags | WQ_FLAG_WOKEN); in wake_page_function()
1163 wake_up_state(wait->private, mode); in wake_page_function()
1171 * After this list_del_init(&wait->entry) the wait entry in wake_page_function()
1172 * might be de-allocated and the process might even have in wake_page_function()
1175 list_del_init_careful(&wait->entry); in wake_page_function()
1195 spin_lock_irqsave(&q->lock, flags); in wake_up_page_bit()
1205 spin_unlock_irqrestore(&q->lock, flags); in wake_up_page_bit()
1207 spin_lock_irqsave(&q->lock, flags); in wake_up_page_bit()
1213 * hash, so in that case check for a page match. That prevents a long- in wake_up_page_bit()
1230 spin_unlock_irqrestore(&q->lock, flags); in wake_up_page_bit()
1262 if (wait->flags & WQ_FLAG_EXCLUSIVE) { in trylock_page_bit_common()
1263 if (test_and_set_bit(bit_nr, &page->flags)) in trylock_page_bit_common()
1265 } else if (test_bit(bit_nr, &page->flags)) in trylock_page_bit_common()
1268 wait->flags |= WQ_FLAG_WOKEN | WQ_FLAG_DONE; in trylock_page_bit_common()
1296 wait->func = wake_page_function; in wait_on_page_bit_common()
1301 wait->flags = 0; in wait_on_page_bit_common()
1303 wait->flags = WQ_FLAG_EXCLUSIVE; in wait_on_page_bit_common()
1304 if (--unfairness < 0) in wait_on_page_bit_common()
1305 wait->flags |= WQ_FLAG_CUSTOM; in wait_on_page_bit_common()
1322 spin_lock_irq(&q->lock); in wait_on_page_bit_common()
1326 spin_unlock_irq(&q->lock); in wait_on_page_bit_common()
1342 * be very careful with the 'wait->flags', because in wait_on_page_bit_common()
1351 flags = smp_load_acquire(&wait->flags); in wait_on_page_bit_common()
1360 /* If we were non-exclusive, we're done */ in wait_on_page_bit_common()
1374 if (unlikely(test_and_set_bit(bit_nr, &page->flags))) in wait_on_page_bit_common()
1377 wait->flags |= WQ_FLAG_DONE; in wait_on_page_bit_common()
1383 * waiter from the wait-queues, but the PageWaiters bit will remain in wait_on_page_bit_common()
1396 * NOTE! The wait->flags weren't stable until we've done the in wait_on_page_bit_common()
1405 * Also note that WQ_FLAG_WOKEN is sufficient for a non-exclusive in wait_on_page_bit_common()
1409 return wait->flags & WQ_FLAG_DONE ? 0 : -EINTR; in wait_on_page_bit_common()
1411 return wait->flags & WQ_FLAG_WOKEN ? 0 : -EINTR; in wait_on_page_bit_common()
1429 * put_and_wait_on_page_locked - Drop a reference and wait for it to be unlocked
1439 * Return: 0 if the page was unlocked or -EINTR if interrupted by a signal.
1451 * add_page_wait_queue - Add an arbitrary waiter to a page's wait queue
1462 spin_lock_irqsave(&q->lock, flags); in add_page_wait_queue()
1465 spin_unlock_irqrestore(&q->lock, flags); in add_page_wait_queue()
1493 * unlock_page - unlock a locked page
1499 * But that's OK - sleepers in wait_on_page_writeback() just go back to sleep.
1502 * that contains PG_locked - thus the BUILD_BUG_ON(). That allows us to
1512 if (clear_bit_unlock_is_negative_byte(PG_locked, &page->flags)) in unlock_page()
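
unlock_page() is the wake-up half of the machinery described above. The
sleeping side usually looks like the following generic pattern (a sketch,
assuming page and mapping come from a prior pagecache lookup):

	lock_page(page);		/* may sleep in wait_on_page_bit_common() */
	if (page->mapping != mapping) {	/* raced with truncation */
		unlock_page(page);
		put_page(page);
		return NULL;		/* caller retries the lookup */
	}
	/* ... operate on the page under PG_locked ... */
	unlock_page(page);		/* clears the bit, wakes the next waiter */
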
1518 * end_page_private_2 - Clear PG_private_2 and release any waiters
1532 clear_bit_unlock(PG_private_2, &page->flags); in end_page_private_2()
1539 * wait_on_page_private_2 - Wait for PG_private_2 to be cleared on a page
1553 * wait_on_page_private_2_killable - Wait for PG_private_2 to be cleared on a page
1560 * - 0 if successful.
1561 * - -EINTR if a fatal signal was encountered.
1579 * end_page_writeback - end writeback against a page
1641 * __lock_page - get a lock on the page, assuming we need to sleep to get it
1667 wait->page = page; in __lock_page_async()
1668 wait->bit_nr = PG_locked; in __lock_page_async()
1670 spin_lock_irq(&q->lock); in __lock_page_async()
1671 __add_wait_queue_entry_tail(q, &wait->wait); in __lock_page_async()
1681 __remove_wait_queue(q, &wait->wait); in __lock_page_async()
1683 ret = -EIOCBQUEUED; in __lock_page_async()
1684 spin_unlock_irq(&q->lock); in __lock_page_async()
1690 * 1 - page is locked; mmap_lock is still held.
1691 * 0 - page is not locked.
1733 * page_cache_next_miss() - Find the next gap in the page cache.
1738 * Search the range [index, min(index + max_scan - 1, ULONG_MAX)] for the
1748 * range specified (in which case 'return - index >= max_scan' will be true).
1749 * In the rare case of index wrap-around, 0 will be returned.
1754 XA_STATE(xas, &mapping->i_pages, index); in page_cache_next_miss()
1756 while (max_scan--) { in page_cache_next_miss()
1769 * page_cache_prev_miss() - Find the previous gap in the page cache.
1774 * Search the range [max(index - max_scan + 1, 0), index] for the
1784 * range specified (in which case 'index - return >= max_scan' will be true).
1785 * In the rare case of wrap-around, ULONG_MAX will be returned.
1790 XA_STATE(xas, &mapping->i_pages, index); in page_cache_prev_miss()
1792 while (max_scan--) { in page_cache_prev_miss()
1805 * mapping_get_entry - Get a page cache entry.
1820 XA_STATE(xas, &mapping->i_pages, index); in mapping_get_entry()
1855 * pagecache_get_page - Find and get a reference to a page.
1865 * * %FGP_ACCESSED - The page will be marked accessed.
1866 * * %FGP_LOCK - The page is returned locked.
1867 * * %FGP_HEAD - If the page is present and a THP, return the head page
1869 * * %FGP_ENTRY - If there is a shadow / swap / DAX entry, return it
1871 * * %FGP_CREAT - If no page is present then a new page is allocated using
1874 * * %FGP_FOR_MMAP - The caller wants to do its own locking dance if the
1877 * * %FGP_WRITE - The page will be written
1878 * * %FGP_NOFS - __GFP_FS will get cleared in gfp mask
1879 * * %FGP_NOWAIT - Don't get blocked by page lock
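
A common combination of these flags is find-or-create with the result
returned locked. A sketch of such a call, with error handling abbreviated:

	page = pagecache_get_page(mapping, index,
				  FGP_LOCK | FGP_ACCESSED | FGP_CREAT,
				  mapping_gfp_mask(mapping));
	if (!page)
		return -ENOMEM;		/* allocation or insertion failed */
	/* ... page is locked and referenced here ... */
	unlock_page(page);
	put_page(page);
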
1914 if (unlikely(page->mapping != mapping)) { in pagecache_get_page()
1955 if (err == -EEXIST) in pagecache_get_page()
2008 * find_get_entries - gang pagecache lookup
2019 * The search returns a group of mapping-contiguous page cache entries
2021 * not-present pages.
2036 XA_STATE(xas, &mapping->i_pages, start); in find_get_entries()
2054 pvec->pages[ret] = page; in find_get_entries()
2060 pvec->nr = ret; in find_get_entries()
2065 * find_lock_entries - Find a batch of pagecache entries.
2080 * due to not-present entries, THP pages, pages which could not be locked
2088 XA_STATE(xas, &mapping->i_pages, start); in find_lock_entries()
2094 if (page->index < start) in find_lock_entries()
2096 VM_BUG_ON_PAGE(page->index != xas.xa_index, page); in find_lock_entries()
2097 if (page->index + thp_nr_pages(page) - 1 > end) in find_lock_entries()
2101 if (page->mapping != mapping || PageWriteback(page)) in find_lock_entries()
2106 indices[pvec->nr] = xas.xa_index; in find_lock_entries()
2118 /* Final THP may cross MAX_LFS_FILESIZE on 32-bit */ in find_lock_entries()
2119 xas_set(&xas, page->index + nr_pages); in find_lock_entries()
2130 * find_get_pages_range - gang pagecache lookup
2142 * The search returns a group of mapping-contiguous pages with ascending
2143 * indexes. There may be holes in the indices due to not-present pages.
2154 XA_STATE(xas, &mapping->i_pages, *start); in find_get_pages_range()
2177 * breaks the iteration when there is a page at index -1 but that is in find_get_pages_range()
2180 if (end == (pgoff_t)-1) in find_get_pages_range()
2181 *start = (pgoff_t)-1; in find_get_pages_range()
2191 * find_get_pages_contig - gang contiguous pagecache lookup
2205 XA_STATE(xas, &mapping->i_pages, index); in find_get_pages_contig()
2245 * find_get_pages_range_tag - Find and return head pages matching @tag.
2263 XA_STATE(xas, &mapping->i_pages, *index); in find_get_pages_range_tag()
2282 *index = page->index + thp_nr_pages(page); in find_get_pages_range_tag()
2290 * iteration when there is a page at index -1 but that is already in find_get_pages_range_tag()
2293 if (end == (pgoff_t)-1) in find_get_pages_range_tag()
2294 *index = (pgoff_t)-1; in find_get_pages_range_tag()
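
find_get_pages_range_tag() is the workhorse under write_cache_pages()-style
loops. A condensed sketch of that usage via the pagevec wrapper
(simplified, no locking or error handling):

	struct pagevec pvec;
	pgoff_t index = start;

	pagevec_init(&pvec);
	while (index <= end &&
	       pagevec_lookup_range_tag(&pvec, mapping, &index, end,
					PAGECACHE_TAG_DIRTY)) {
		unsigned i;

		for (i = 0; i < pagevec_count(&pvec); i++) {
			/* ... lock the page, clear dirty, submit I/O ... */
		}
		pagevec_release(&pvec);
		cond_resched();
	}
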
2308 * ---R__________________________________________B__________
2321 ra->ra_pages /= 4; in shrink_readahead_size_eio()
2325 * filemap_get_read_batch - Get a batch of pages for read
2336 XA_STATE(xas, &mapping->i_pages, index); in filemap_get_read_batch()
2358 xas.xa_index = head->index + thp_nr_pages(head) - 1; in filemap_get_read_batch()
2381 error = mapping->a_ops->readpage(file, page); in filemap_read_page()
2390 shrink_readahead_size_eio(&file->f_ra); in filemap_read_page()
2391 return -EIO; in filemap_read_page()
2404 if (!mapping->a_ops->is_partially_uptodate) in filemap_range_uptodate()
2406 if (mapping->host->i_blkbits >= (PAGE_SHIFT + thp_order(page))) in filemap_range_uptodate()
2409 count = iter->count; in filemap_range_uptodate()
2411 count -= page_offset(page) - pos; in filemap_range_uptodate()
2414 pos -= page_offset(page); in filemap_range_uptodate()
2417 return mapping->a_ops->is_partially_uptodate(page, pos, count); in filemap_range_uptodate()
2426 if (iocb->ki_flags & IOCB_NOWAIT) { in filemap_update_page()
2428 return -EAGAIN; in filemap_update_page()
2434 error = -EAGAIN; in filemap_update_page()
2435 if (iocb->ki_flags & (IOCB_NOWAIT | IOCB_NOIO)) in filemap_update_page()
2437 if (!(iocb->ki_flags & IOCB_WAITQ)) { in filemap_update_page()
2442 error = __lock_page_async(page, iocb->ki_waitq); in filemap_update_page()
2448 if (!page->mapping) in filemap_update_page()
2452 if (filemap_range_uptodate(mapping, iocb->ki_pos, iter, page)) in filemap_update_page()
2455 error = -EAGAIN; in filemap_update_page()
2456 if (iocb->ki_flags & (IOCB_NOIO | IOCB_NOWAIT | IOCB_WAITQ)) in filemap_update_page()
2459 error = filemap_read_page(iocb->ki_filp, mapping, page); in filemap_update_page()
2479 return -ENOMEM; in filemap_create_page()
2489 * ->readpages() that need to hold invalidate_lock while mapping blocks in filemap_create_page()
2496 if (error == -EEXIST) in filemap_create_page()
2518 if (iocb->ki_flags & IOCB_NOIO) in filemap_readahead()
2519 return -EAGAIN; in filemap_readahead()
2520 page_cache_async_readahead(mapping, &file->f_ra, file, page, in filemap_readahead()
2521 page->index, last_index - page->index); in filemap_readahead()
2528 struct file *filp = iocb->ki_filp; in filemap_get_pages()
2529 struct address_space *mapping = filp->f_mapping; in filemap_get_pages()
2530 struct file_ra_state *ra = &filp->f_ra; in filemap_get_pages()
2531 pgoff_t index = iocb->ki_pos >> PAGE_SHIFT; in filemap_get_pages()
2536 last_index = DIV_ROUND_UP(iocb->ki_pos + iter->count, PAGE_SIZE); in filemap_get_pages()
2539 return -EINTR; in filemap_get_pages()
2543 if (iocb->ki_flags & IOCB_NOIO) in filemap_get_pages()
2544 return -EAGAIN; in filemap_get_pages()
2546 last_index - index); in filemap_get_pages()
2550 if (iocb->ki_flags & (IOCB_NOWAIT | IOCB_WAITQ)) in filemap_get_pages()
2551 return -EAGAIN; in filemap_get_pages()
2553 iocb->ki_pos >> PAGE_SHIFT, pvec); in filemap_get_pages()
2559 page = pvec->pages[pagevec_count(pvec) - 1]; in filemap_get_pages()
2566 if ((iocb->ki_flags & IOCB_WAITQ) && pagevec_count(pvec) > 1) in filemap_get_pages()
2567 iocb->ki_flags |= IOCB_NOWAIT; in filemap_get_pages()
2577 if (likely(--pvec->nr)) in filemap_get_pages()
2585 * filemap_read - Read data from the page cache.
2595 * a negative error number.
2600 struct file *filp = iocb->ki_filp; in filemap_read()
2601 struct file_ra_state *ra = &filp->f_ra; in filemap_read()
2602 struct address_space *mapping = filp->f_mapping; in filemap_read()
2603 struct inode *inode = mapping->host; in filemap_read()
2609 if (unlikely(iocb->ki_pos >= inode->i_sb->s_maxbytes)) in filemap_read()
2614 iov_iter_truncate(iter, inode->i_sb->s_maxbytes); in filemap_read()
2622 * can no longer safely return -EIOCBQUEUED. Hence mark in filemap_read()
2625 if ((iocb->ki_flags & IOCB_WAITQ) && already_read) in filemap_read()
2626 iocb->ki_flags |= IOCB_NOWAIT; in filemap_read()
2636 * the correct value for "nr", which means the zero-filled in filemap_read()
2638 * another truncate extends the file - this is desired though). in filemap_read()
2641 if (unlikely(iocb->ki_pos >= isize)) in filemap_read()
2643 end_offset = min_t(loff_t, isize, iocb->ki_pos + iter->count); in filemap_read()
2655 if (iocb->ki_pos >> PAGE_SHIFT != in filemap_read()
2656 ra->prev_pos >> PAGE_SHIFT) in filemap_read()
2662 size_t offset = iocb->ki_pos & (page_size - 1); in filemap_read()
2663 size_t bytes = min_t(loff_t, end_offset - iocb->ki_pos, in filemap_read()
2664 page_size - offset); in filemap_read()
2686 iocb->ki_pos += copied; in filemap_read()
2687 ra->prev_pos = iocb->ki_pos; in filemap_read()
2690 error = -EFAULT; in filemap_read()
2698 } while (iov_iter_count(iter) && iocb->ki_pos < isize && !error); in filemap_read()
2707 * generic_file_read_iter - generic filesystem read routine
2714 * The IOCB_NOWAIT flag in iocb->ki_flags indicates that -EAGAIN shall
2718 * The IOCB_NOIO flag in iocb->ki_flags indicates that no new I/O
2720 * can be read, -EAGAIN shall be returned. When readahead would be
2725 * * negative error code (or 0 if IOCB_NOIO) if nothing was read
2736 if (iocb->ki_flags & IOCB_DIRECT) { in generic_file_read_iter()
2737 struct file *file = iocb->ki_filp; in generic_file_read_iter()
2738 struct address_space *mapping = file->f_mapping; in generic_file_read_iter()
2739 struct inode *inode = mapping->host; in generic_file_read_iter()
2743 if (iocb->ki_flags & IOCB_NOWAIT) { in generic_file_read_iter()
2744 if (filemap_range_needs_writeback(mapping, iocb->ki_pos, in generic_file_read_iter()
2745 iocb->ki_pos + count - 1)) in generic_file_read_iter()
2746 return -EAGAIN; in generic_file_read_iter()
2749 iocb->ki_pos, in generic_file_read_iter()
2750 iocb->ki_pos + count - 1); in generic_file_read_iter()
2757 retval = mapping->a_ops->direct_IO(iocb, iter); in generic_file_read_iter()
2759 iocb->ki_pos += retval; in generic_file_read_iter()
2760 count -= retval; in generic_file_read_iter()
2762 if (retval != -EIOCBQUEUED) in generic_file_read_iter()
2763 iov_iter_revert(iter, count - iov_iter_count(iter)); in generic_file_read_iter()
2770 * and return. Otherwise fallthrough to buffered io for in generic_file_read_iter()
2771 * the rest of the read. Buffered reads will not work for in generic_file_read_iter()
2774 if (retval < 0 || !count || iocb->ki_pos >= size || in generic_file_read_iter()
2787 const struct address_space_operations *ops = mapping->a_ops; in page_seek_hole_data()
2788 size_t offset, bsz = i_blocksize(mapping->host); in page_seek_hole_data()
2792 if (!ops->is_partially_uptodate) in page_seek_hole_data()
2798 if (unlikely(page->mapping != mapping)) in page_seek_hole_data()
2801 offset = offset_in_thp(page, start) & ~(bsz - 1); in page_seek_hole_data()
2804 if (ops->is_partially_uptodate(page, offset, bsz) == seek_data) in page_seek_hole_data()
2806 start = (start + bsz) & ~(bsz - 1); in page_seek_hole_data()
2819 return PAGE_SIZE << xa_get_order(xas->xa, xas->xa_index); in seek_page_size()
2824 * mapping_seek_hole_data - Seek for SEEK_DATA / SEEK_HOLE in the page cache.
2833 * entirely memory-based such as tmpfs, and filesystems which support
2836 * Return: The requested offset on success, or -ENXIO if @whence specifies
2838 * after @end - 1, so SEEK_HOLE returns @end if all the bytes between @start
2844 XA_STATE(xas, &mapping->i_pages, start >> PAGE_SHIFT); in mapping_seek_hole_data()
2845 pgoff_t max = (end - 1) >> PAGE_SHIFT; in mapping_seek_hole_data()
2850 return -ENXIO; in mapping_seek_hole_data()
2877 start = -ENXIO; in mapping_seek_hole_data()
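
A filesystem whose data lives entirely in the page cache can implement
SEEK_HOLE/SEEK_DATA directly on this helper, as the comment notes for
tmpfs. A hypothetical ->llseek() fragment ('whence' is SEEK_DATA or
SEEK_HOLE):

	case SEEK_DATA:
	case SEEK_HOLE:
		inode_lock_shared(inode);
		offset = mapping_seek_hole_data(inode->i_mapping, offset,
						i_size_read(inode), whence);
		inode_unlock_shared(inode);
		if (offset < 0)
			return offset;
		return vfs_setpos(file, offset, MAX_LFS_FILESIZE);
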
2890 * lock_page_maybe_drop_mmap - lock the page, possibly dropping the mmap_lock
2891 * @vmf: the vm_fault for this fault.
2892 * @page: the page to lock.
2893 * @fpin: the pointer to the file we may pin (or is already pinned).
2911 if (vmf->flags & FAULT_FLAG_RETRY_NOWAIT) in lock_page_maybe_drop_mmap()
2915 if (vmf->flags & FAULT_FLAG_KILLABLE) { in lock_page_maybe_drop_mmap()
2924 mmap_read_unlock(vmf->vma->vm_mm); in lock_page_maybe_drop_mmap()
2942 struct file *file = vmf->vma->vm_file; in do_sync_mmap_readahead()
2943 struct file_ra_state *ra = &file->f_ra; in do_sync_mmap_readahead()
2944 struct address_space *mapping = file->f_mapping; in do_sync_mmap_readahead()
2945 DEFINE_READAHEAD(ractl, file, ra, mapping, vmf->pgoff); in do_sync_mmap_readahead()
2949 /* If we don't want any read-ahead, don't bother */ in do_sync_mmap_readahead()
2950 if (vmf->vma->vm_flags & VM_RAND_READ) in do_sync_mmap_readahead()
2952 if (!ra->ra_pages) in do_sync_mmap_readahead()
2955 if (vmf->vma->vm_flags & VM_SEQ_READ) { in do_sync_mmap_readahead()
2957 page_cache_sync_ra(&ractl, ra->ra_pages); in do_sync_mmap_readahead()
2962 mmap_miss = READ_ONCE(ra->mmap_miss); in do_sync_mmap_readahead()
2964 WRITE_ONCE(ra->mmap_miss, ++mmap_miss); in do_sync_mmap_readahead()
2968 * stop bothering with read-ahead. It will only hurt. in do_sync_mmap_readahead()
2974 * mmap read-around in do_sync_mmap_readahead()
2977 ra->start = max_t(long, 0, vmf->pgoff - ra->ra_pages / 2); in do_sync_mmap_readahead()
2978 ra->size = ra->ra_pages; in do_sync_mmap_readahead()
2979 ra->async_size = ra->ra_pages / 4; in do_sync_mmap_readahead()
2980 ractl._index = ra->start; in do_sync_mmap_readahead()
2981 do_page_cache_ra(&ractl, ra->size, ra->async_size); in do_sync_mmap_readahead()
2993 struct file *file = vmf->vma->vm_file; in do_async_mmap_readahead()
2994 struct file_ra_state *ra = &file->f_ra; in do_async_mmap_readahead()
2995 struct address_space *mapping = file->f_mapping; in do_async_mmap_readahead()
2998 pgoff_t offset = vmf->pgoff; in do_async_mmap_readahead()
3000 /* If we don't want any read-ahead, don't bother */ in do_async_mmap_readahead()
3001 if (vmf->vma->vm_flags & VM_RAND_READ || !ra->ra_pages) in do_async_mmap_readahead()
3003 mmap_miss = READ_ONCE(ra->mmap_miss); in do_async_mmap_readahead()
3005 WRITE_ONCE(ra->mmap_miss, --mmap_miss); in do_async_mmap_readahead()
3009 page, offset, ra->ra_pages); in do_async_mmap_readahead()
3015 * filemap_fault - read in file data for page fault handling
3025 * vma->vm_mm->mmap_lock must be held on entry.
3035 * Return: bitwise-OR of %VM_FAULT_ codes.
3040 struct file *file = vmf->vma->vm_file; in filemap_fault()
3042 struct address_space *mapping = file->f_mapping; in filemap_fault()
3043 struct inode *inode = mapping->host; in filemap_fault()
3044 pgoff_t offset = vmf->pgoff; in filemap_fault()
3063 if (!(vmf->flags & FAULT_FLAG_TRIED)) in filemap_fault()
3072 count_memcg_event_mm(vmf->vma->vm_mm, PGMAJFAULT); in filemap_fault()
3086 vmf->gfp_mask); in filemap_fault()
3099 if (unlikely(compound_head(page)->mapping != mapping)) { in filemap_fault()
3108 * that it's up-to-date. If not, it is going to be due to an error. in filemap_fault()
3127 * time to return to the upper layer and have it re-find the vma and in filemap_fault()
3148 vmf->page = page; in filemap_fault()
3153 * Umm, take care of errors if the page isn't up-to-date. in filemap_fault()
3154 * Try to re-read it _once_. We do this synchronously, in filemap_fault()
3173 * re-find the vma and come back and find our hopefully still populated in filemap_fault()
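
filemap_fault(), filemap_map_pages() and filemap_page_mkwrite() are
normally installed together; generic_file_vm_ops in this file is the
canonical instance of the following wiring (sketch):

	static const struct vm_operations_struct example_file_vm_ops = {
		.fault		= filemap_fault,
		.map_pages	= filemap_map_pages,
		.page_mkwrite	= filemap_page_mkwrite,
	};
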
3188 struct mm_struct *mm = vmf->vma->vm_mm; in filemap_map_pmd()
3191 if (pmd_trans_huge(*vmf->pmd)) { in filemap_map_pmd()
3197 if (pmd_none(*vmf->pmd) && PageTransHuge(page)) { in filemap_map_pmd()
3206 if (pmd_none(*vmf->pmd)) { in filemap_map_pmd()
3207 vmf->ptl = pmd_lock(mm, vmf->pmd); in filemap_map_pmd()
3208 if (likely(pmd_none(*vmf->pmd))) { in filemap_map_pmd()
3210 pmd_populate(mm, vmf->pmd, vmf->prealloc_pte); in filemap_map_pmd()
3211 vmf->prealloc_pte = NULL; in filemap_map_pmd()
3213 spin_unlock(vmf->ptl); in filemap_map_pmd()
3217 if (pmd_devmap_trans_unstable(vmf->pmd)) { in filemap_map_pmd()
3252 if (page->mapping != mapping) in next_uptodate_page()
3256 max_idx = DIV_ROUND_UP(i_size_read(mapping->host), PAGE_SIZE); in next_uptodate_page()
3257 if (xas->xa_index >= max_idx) in next_uptodate_page()
3288 struct vm_area_struct *vma = vmf->vma; in filemap_map_pages()
3289 struct file *file = vma->vm_file; in filemap_map_pages()
3290 struct address_space *mapping = file->f_mapping; in filemap_map_pages()
3293 XA_STATE(xas, &mapping->i_pages, start_pgoff); in filemap_map_pages()
3295 unsigned int mmap_miss = READ_ONCE(file->f_ra.mmap_miss); in filemap_map_pages()
3308 addr = vma->vm_start + ((start_pgoff - vma->vm_pgoff) << PAGE_SHIFT); in filemap_map_pages()
3309 vmf->pte = pte_offset_map_lock(vma->vm_mm, vmf->pmd, addr, &vmf->ptl); in filemap_map_pages()
3316 mmap_miss--; in filemap_map_pages()
3318 addr += (xas.xa_index - last_pgoff) << PAGE_SHIFT; in filemap_map_pages()
3319 vmf->pte += xas.xa_index - last_pgoff; in filemap_map_pages()
3322 if (!pte_none(*vmf->pte)) in filemap_map_pages()
3326 if (vmf->address == addr) in filemap_map_pages()
3330 /* no need to invalidate: a not-present page won't be cached */ in filemap_map_pages()
3331 update_mmu_cache(vma, addr, vmf->pte); in filemap_map_pages()
3338 pte_unmap_unlock(vmf->pte, vmf->ptl); in filemap_map_pages()
3341 WRITE_ONCE(file->f_ra.mmap_miss, mmap_miss); in filemap_map_pages()
3348 struct address_space *mapping = vmf->vma->vm_file->f_mapping; in filemap_page_mkwrite()
3349 struct page *page = vmf->page; in filemap_page_mkwrite()
3352 sb_start_pagefault(mapping->host->i_sb); in filemap_page_mkwrite()
3353 file_update_time(vmf->vma->vm_file); in filemap_page_mkwrite()
3355 if (page->mapping != mapping) { in filemap_page_mkwrite()
3368 sb_end_pagefault(mapping->host->i_sb); in filemap_page_mkwrite()
3382 struct address_space *mapping = file->f_mapping; in generic_file_mmap()
3384 if (!mapping->a_ops->readpage) in generic_file_mmap()
3385 return -ENOEXEC; in generic_file_mmap()
3387 vma->vm_ops = &generic_file_vm_ops; in generic_file_mmap()
3392 * This is for filesystems which do not implement ->writepage.
3396 if ((vma->vm_flags & VM_SHARED) && (vma->vm_flags & VM_MAYWRITE)) in generic_file_readonly_mmap()
3397 return -EINVAL; in generic_file_readonly_mmap()
3407 return -ENOSYS; in generic_file_mmap()
3411 return -ENOSYS; in generic_file_readonly_mmap()
3425 page = ERR_PTR(-EIO); in wait_on_page_read()
3444 return ERR_PTR(-ENOMEM); in do_read_cache_page()
3448 if (err == -EEXIST) in do_read_cache_page()
3458 err = mapping->a_ops->readpage(data, page); in do_read_cache_page()
3512 if (!page->mapping) { in do_read_cache_page()
3539 * read_cache_page - read into page cache, fill it if needed
3548 * If the page does not get brought uptodate, return -EIO.
3550 * The function expects mapping->invalidate_lock to be already held.
3565 * read_cache_page_gfp - read into page cache, using specified page allocation flags.
3573 * If the page does not get brought uptodate, return -EIO.
3575 * The function expects mapping->invalidate_lock to be already held.
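
Typical use of read_cache_page() is to pull a single page into the cache
and wait for it to become uptodate. A sketch (a NULL filler means the
mapping's ->readpage is used; 'file' is passed through to it):

	struct page *page;

	page = read_cache_page(mapping, index, NULL, file);
	if (IS_ERR(page))
		return PTR_ERR(page);
	/* ... the page is uptodate and referenced here ... */
	put_page(page);
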
3591 const struct address_space_operations *aops = mapping->a_ops; in pagecache_write_begin()
3593 return aops->write_begin(file, mapping, pos, len, flags, in pagecache_write_begin()
3602 const struct address_space_operations *aops = mapping->a_ops; in pagecache_write_end()
3604 return aops->write_end(file, mapping, pos, len, copied, page, fsdata); in pagecache_write_end()
3617 errseq_set(&filp->f_mapping->wb_err, -EIO); in dio_warn_stale_pagecache()
3622 pr_crit("Page cache invalidation failure on direct I/O. Possible data corruption due to collision with buffered I/O!\n"); in dio_warn_stale_pagecache()
3623 pr_crit("File: %s PID: %d Comm: %.20s\n", path, current->pid, in dio_warn_stale_pagecache()
3624 current->comm); in dio_warn_stale_pagecache()
3631 struct file *file = iocb->ki_filp; in generic_file_direct_write()
3632 struct address_space *mapping = file->f_mapping; in generic_file_direct_write()
3633 struct inode *inode = mapping->host; in generic_file_direct_write()
3634 loff_t pos = iocb->ki_pos; in generic_file_direct_write()
3640 end = (pos + write_len - 1) >> PAGE_SHIFT; in generic_file_direct_write()
3642 if (iocb->ki_flags & IOCB_NOWAIT) { in generic_file_direct_write()
3644 if (filemap_range_has_page(file->f_mapping, pos, in generic_file_direct_write()
3645 pos + write_len - 1)) in generic_file_direct_write()
3646 return -EAGAIN; in generic_file_direct_write()
3649 pos + write_len - 1); in generic_file_direct_write()
3655 * After a write we want buffered reads to be sure to go to disk to get in generic_file_direct_write()
3658 * without clobbering -EIOCBQUEUED from ->direct_IO(). in generic_file_direct_write()
3664 * to buffered write. in generic_file_direct_write()
3667 if (written == -EBUSY) in generic_file_direct_write()
3672 written = mapping->a_ops->direct_IO(iocb, from); in generic_file_direct_write()
3676 * cached by non-direct readahead, or faulted in by get_user_pages() in generic_file_direct_write()
3691 if (written > 0 && mapping->nrpages && in generic_file_direct_write()
3697 write_len -= written; in generic_file_direct_write()
3698 if (pos > i_size_read(inode) && !S_ISBLK(inode->i_mode)) { in generic_file_direct_write()
3702 iocb->ki_pos = pos; in generic_file_direct_write()
3704 if (written != -EIOCBQUEUED) in generic_file_direct_write()
3705 iov_iter_revert(from, write_len - iov_iter_count(from)); in generic_file_direct_write()
3713 * page. This function is specifically for buffered writes.
3736 struct address_space *mapping = file->f_mapping; in generic_perform_write()
3737 const struct address_space_operations *a_ops = mapping->a_ops; in generic_perform_write()
3749 offset = (pos & (PAGE_SIZE - 1)); in generic_perform_write()
3750 bytes = min_t(unsigned long, PAGE_SIZE - offset, in generic_perform_write()
3758 * up-to-date. in generic_perform_write()
3761 status = -EFAULT; in generic_perform_write()
3766 status = -EINTR; in generic_perform_write()
3770 status = a_ops->write_begin(file, mapping, pos, bytes, flags, in generic_perform_write()
3781 status = a_ops->write_end(file, mapping, pos, bytes, copied, in generic_perform_write()
3784 iov_iter_revert(i, copied - max(status, 0L)); in generic_perform_write()
3792 * A short copy made ->write_end() reject the in generic_perform_write()
3812 * __generic_file_write_iter - write data to a file
3819 * do direct IO or a standard buffered write.
3830 * * negative error code if no data has been written at all
3834 struct file *file = iocb->ki_filp; in __generic_file_write_iter()
3835 struct address_space *mapping = file->f_mapping; in __generic_file_write_iter()
3836 struct inode *inode = mapping->host; in __generic_file_write_iter()
3842 current->backing_dev_info = inode_to_bdi(inode); in __generic_file_write_iter()
3851 if (iocb->ki_flags & IOCB_DIRECT) { in __generic_file_write_iter()
3857 * buffered writes. Some filesystems do this for writes to in __generic_file_write_iter()
3858 * holes, for example. For DAX files, a buffered write will in __generic_file_write_iter()
3860 * page-cache pages correctly). in __generic_file_write_iter()
3865 status = generic_perform_write(file, from, pos = iocb->ki_pos); in __generic_file_write_iter()
3869 * direct-written, or the error code if that was zero. Note in __generic_file_write_iter()
3870 * that this differs from normal direct-io semantics, which in __generic_file_write_iter()
3871 * will return -EFOO even if some bytes were written. in __generic_file_write_iter()
3882 endbyte = pos + status - 1; in __generic_file_write_iter()
3885 iocb->ki_pos = endbyte + 1; in __generic_file_write_iter()
3893 * the number of bytes which were direct-written in __generic_file_write_iter()
3897 written = generic_perform_write(file, from, iocb->ki_pos); in __generic_file_write_iter()
3899 iocb->ki_pos += written; in __generic_file_write_iter()
3902 current->backing_dev_info = NULL; in __generic_file_write_iter()
3908 * generic_file_write_iter - write data to a file
3916 * * negative error code if no data has been written at all
3922 struct file *file = iocb->ki_filp; in generic_file_write_iter()
3923 struct inode *inode = file->f_mapping->host; in generic_file_write_iter()
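
Both generic iterators are normally exported wholesale into a filesystem's
file_operations. A sketch of the usual wiring (hypothetical
example_file_operations, fields a simple pagecache-backed filesystem would
pick):

	static const struct file_operations example_file_operations = {
		.llseek		= generic_file_llseek,
		.read_iter	= generic_file_read_iter,
		.write_iter	= generic_file_write_iter,
		.mmap		= generic_file_mmap,
		.splice_read	= generic_file_splice_read,
	};
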
3939 * try_to_release_page() - release old fs-specific metadata on a page
3945 * (presumably at page->private).
3957 struct address_space * const mapping = page->mapping; in try_to_release_page()
3963 if (mapping && mapping->a_ops->releasepage) in try_to_release_page()
3964 return mapping->a_ops->releasepage(page, gfp_mask); in try_to_release_page()