Blame view
mm/fadvise.c
4 KB
1da177e4c
|
1 2 3 4 5 |
/* * mm/fadvise.c * * Copyright (C) 2002, Linus Torvalds * |
e1f8e8744
|
6 |
* 11Jan2003 Andrew Morton |
1da177e4c
|
7 8 9 10 11 12 13 14 15 16 17 |
* Initial version. */ #include <linux/kernel.h> #include <linux/file.h> #include <linux/fs.h> #include <linux/mm.h> #include <linux/pagemap.h> #include <linux/backing-dev.h> #include <linux/pagevec.h> #include <linux/fadvise.h> |
ebcf28e1c
|
18 |
#include <linux/writeback.h> |
1da177e4c
|
19 |
#include <linux/syscalls.h> |
67d46b296
|
20 |
#include <linux/swap.h> |
1da177e4c
|
21 22 23 24 25 26 27 |
#include <asm/unistd.h> /* * POSIX_FADV_WILLNEED could set PG_Referenced, and POSIX_FADV_NOREUSE could * deactivate the pages and clear PG_Referenced. */ |
4a0fd5bf0
|
28 |
SYSCALL_DEFINE4(fadvise64_64, int, fd, loff_t, offset, loff_t, len, int, advice) |
1da177e4c
|
29 |
{ |
2903ff019
|
30 |
struct fd f = fdget(fd); |
e748dcd09
|
31 |
struct inode *inode; |
1da177e4c
|
32 33 |
struct address_space *mapping; struct backing_dev_info *bdi; |
ebcf28e1c
|
34 |
loff_t endbyte; /* inclusive */ |
1da177e4c
|
35 36 37 38 |
pgoff_t start_index; pgoff_t end_index; unsigned long nrpages; int ret = 0; |
2903ff019
|
39 |
if (!f.file) |
1da177e4c
|
40 |
return -EBADF; |
e748dcd09
|
41 42 |
inode = file_inode(f.file); if (S_ISFIFO(inode->i_mode)) { |
87ba81dba
|
43 44 45 |
ret = -ESPIPE; goto out; } |
2903ff019
|
46 |
mapping = f.file->f_mapping; |
1da177e4c
|
47 48 49 50 |
if (!mapping || len < 0) { ret = -EINVAL; goto out; } |
e748dcd09
|
51 |
if (IS_DAX(inode)) { |
b5beb1caf
|
52 53 54 55 56 57 58 59 60 61 62 63 |
switch (advice) { case POSIX_FADV_NORMAL: case POSIX_FADV_RANDOM: case POSIX_FADV_SEQUENTIAL: case POSIX_FADV_WILLNEED: case POSIX_FADV_NOREUSE: case POSIX_FADV_DONTNEED: /* no bad return value, but ignore advice */ break; default: ret = -EINVAL; } |
fe77ba6f4
|
64 |
goto out; |
b5beb1caf
|
65 |
} |
fe77ba6f4
|
66 |
|
1da177e4c
|
67 68 69 70 |
/* Careful about overflows. Len == 0 means "as much as possible" */ endbyte = offset + len; if (!len || endbyte < len) endbyte = -1; |
ebcf28e1c
|
71 72 |
else endbyte--; /* inclusive */ |
1da177e4c
|
73 |
|
de1414a65
|
74 |
bdi = inode_to_bdi(mapping->host); |
1da177e4c
|
75 76 77 |
switch (advice) { case POSIX_FADV_NORMAL: |
2903ff019
|
78 79 80 81 |
f.file->f_ra.ra_pages = bdi->ra_pages; spin_lock(&f.file->f_lock); f.file->f_mode &= ~FMODE_RANDOM; spin_unlock(&f.file->f_lock); |
1da177e4c
|
82 83 |
break; case POSIX_FADV_RANDOM: |
2903ff019
|
84 85 86 |
spin_lock(&f.file->f_lock); f.file->f_mode |= FMODE_RANDOM; spin_unlock(&f.file->f_lock); |
1da177e4c
|
87 88 |
break; case POSIX_FADV_SEQUENTIAL: |
2903ff019
|
89 90 91 92 |
f.file->f_ra.ra_pages = bdi->ra_pages * 2; spin_lock(&f.file->f_lock); f.file->f_mode &= ~FMODE_RANDOM; spin_unlock(&f.file->f_lock); |
1da177e4c
|
93 94 |
break; case POSIX_FADV_WILLNEED: |
1da177e4c
|
95 |
/* First and last PARTIAL page! */ |
09cbfeaf1
|
96 97 |
start_index = offset >> PAGE_SHIFT; end_index = endbyte >> PAGE_SHIFT; |
1da177e4c
|
98 99 100 101 102 |
/* Careful about overflow on the "+1" */ nrpages = end_index - start_index + 1; if (!nrpages) nrpages = ~0UL; |
3d3727cdb
|
103 104 105 106 107 |
/* * Ignore return value because fadvise() shall return * success even if filesystem can't retrieve a hint, */ |
2903ff019
|
108 |
force_page_cache_readahead(mapping, f.file, start_index, |
3d3727cdb
|
109 |
nrpages); |
1da177e4c
|
110 |
break; |
60c371bc7
|
111 112 |
case POSIX_FADV_NOREUSE: break; |
1da177e4c
|
113 |
case POSIX_FADV_DONTNEED: |
703c27088
|
114 |
if (!inode_write_congested(mapping->host)) |
ad8a1b558
|
115 116 |
__filemap_fdatawrite_range(mapping, offset, endbyte, WB_SYNC_NONE); |
1da177e4c
|
117 |
|
441c228f8
|
118 119 120 121 122 |
/* * First and last FULL page! Partial pages are deliberately * preserved on the expectation that it is better to preserve * needed memory than to discard unneeded memory. */ |
09cbfeaf1
|
123 124 |
start_index = (offset+(PAGE_SIZE-1)) >> PAGE_SHIFT; end_index = (endbyte >> PAGE_SHIFT); |
18aba41cb
|
125 126 127 128 129 130 131 132 133 134 135 |
if ((endbyte & ~PAGE_MASK) != ~PAGE_MASK) { /* First page is tricky as 0 - 1 = -1, but pgoff_t * is unsigned, so the end_index >= start_index * check below would be true and we'll discard the whole * file cache which is not what was asked. */ if (end_index == 0) break; end_index--; } |
1da177e4c
|
136 |
|
67d46b296
|
137 138 139 140 141 142 143 144 145 146 147 148 149 |
if (end_index >= start_index) { unsigned long count = invalidate_mapping_pages(mapping, start_index, end_index); /* * If fewer pages were invalidated than expected then * it is possible that some of the pages were on * a per-cpu pagevec for a remote CPU. Drain all * pagevecs and try again. */ if (count < (end_index - start_index + 1)) { lru_add_drain_all(); invalidate_mapping_pages(mapping, start_index, |
ebcf28e1c
|
150 |
end_index); |
67d46b296
|
151 152 |
} } |
ebcf28e1c
|
153 |
break; |
1da177e4c
|
154 155 156 157 |
default: ret = -EINVAL; } out: |
2903ff019
|
158 |
fdput(f); |
1da177e4c
|
159 160 161 162 |
return ret; } #ifdef __ARCH_WANT_SYS_FADVISE64 |
4a0fd5bf0
|
163 |
SYSCALL_DEFINE4(fadvise64, int, fd, loff_t, offset, size_t, len, int, advice) |
1da177e4c
|
164 165 166 167 168 |
{ return sys_fadvise64_64(fd, offset, len, advice); } #endif |