Commit | Line | Data |
---|---|---|
1da177e4 | 1 | /* |
7b718769 NS |
2 | * Copyright (c) 2000-2005 Silicon Graphics, Inc. |
3 | * All Rights Reserved. | |
1da177e4 | 4 | * |
7b718769 NS |
5 | * This program is free software; you can redistribute it and/or |
6 | * modify it under the terms of the GNU General Public License as | |
1da177e4 LT |
7 | * published by the Free Software Foundation. |
8 | * | |
7b718769 NS |
9 | * This program is distributed in the hope that it would be useful, |
10 | * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
11 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
12 | * GNU General Public License for more details. | |
1da177e4 | 13 | * |
7b718769 NS |
14 | * You should have received a copy of the GNU General Public License |
15 | * along with this program; if not, write the Free Software Foundation, | |
16 | * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA | |
1da177e4 LT |
17 | */ |
18 | #ifndef __XFS_LINUX__ | |
19 | #define __XFS_LINUX__ | |
20 | ||
21 | #include <linux/types.h> | |
22 | #include <linux/config.h> | |
23 | ||
/*
 * Width-dependent feature switches.
 *
 * XFS_BIG_BLKNOS needs block layer disk addresses to be 64 bits wide: that
 * is the case when long is 64 bits, or when CONFIG_LBD is set.
 * XFS_BIG_INUMS needs the VFS inode number to be 64 bits wide and also
 * requires XFS_BIG_BLKNOS; it is only switched on when long is 64 bits.
 */
#if BITS_PER_LONG == 64
# define XFS_BIG_BLKNOS	1
# define XFS_BIG_INUMS	1
#elif defined(CONFIG_LBD)
# define XFS_BIG_BLKNOS	1
# define XFS_BIG_INUMS	0
#else
# define XFS_BIG_BLKNOS	0
# define XFS_BIG_INUMS	0
#endif
41 | ||
42 | #include <xfs_types.h> | |
43 | #include <xfs_arch.h> | |
44 | ||
45 | #include <kmem.h> | |
46 | #include <mrlock.h> | |
47 | #include <spin.h> | |
48 | #include <sv.h> | |
49 | #include <mutex.h> | |
50 | #include <sema.h> | |
51 | #include <time.h> | |
52 | ||
1da177e4 LT |
53 | #include <support/ktrace.h> |
54 | #include <support/debug.h> | |
55 | #include <support/move.h> | |
56 | #include <support/uuid.h> | |
57 | ||
58 | #include <linux/mm.h> | |
59 | #include <linux/kernel.h> | |
60 | #include <linux/blkdev.h> | |
61 | #include <linux/slab.h> | |
62 | #include <linux/module.h> | |
63 | #include <linux/file.h> | |
64 | #include <linux/swap.h> | |
65 | #include <linux/errno.h> | |
66 | #include <linux/sched.h> | |
67 | #include <linux/bitops.h> | |
68 | #include <linux/major.h> | |
69 | #include <linux/pagemap.h> | |
70 | #include <linux/vfs.h> | |
71 | #include <linux/seq_file.h> | |
72 | #include <linux/init.h> | |
73 | #include <linux/list.h> | |
74 | #include <linux/proc_fs.h> | |
1da177e4 | 75 | #include <linux/sort.h> |
e8234a68 DC |
76 | #include <linux/cpu.h> |
77 | #include <linux/notifier.h> | |
01e1b69c | 78 | #include <linux/delay.h> |
1da177e4 LT |
79 | |
80 | #include <asm/page.h> | |
81 | #include <asm/div64.h> | |
82 | #include <asm/param.h> | |
83 | #include <asm/uaccess.h> | |
84 | #include <asm/byteorder.h> | |
85 | #include <asm/unaligned.h> | |
86 | ||
87 | #include <xfs_behavior.h> | |
88 | #include <xfs_vfs.h> | |
89 | #include <xfs_cred.h> | |
90 | #include <xfs_vnode.h> | |
91 | #include <xfs_stats.h> | |
92 | #include <xfs_sysctl.h> | |
93 | #include <xfs_iops.h> | |
0829c360 | 94 | #include <xfs_aops.h> |
1da177e4 LT |
95 | #include <xfs_super.h> |
96 | #include <xfs_globals.h> | |
97 | #include <xfs_fs_subr.h> | |
98 | #include <xfs_lrw.h> | |
99 | #include <xfs_buf.h> | |
100 | ||
/*
 * Feature switches: each optional facility is either defined (enabled)
 * or explicitly undefined (disabled) here.
 */
#undef  HAVE_REFCACHE	/* reference cache not needed for NFS in 2.6 */
#define HAVE_SENDFILE	/* sendfile(2) exists in 2.6, but not in 2.4 */
#define HAVE_SPLICE	/* splice(2) exists in 2.6, but not in 2.4 */

/* per cpu superblock counters are a 2.6 feature; enabled on SMP builds only */
#undef HAVE_PERCPU_SB
#ifdef CONFIG_SMP
# define HAVE_PERCPU_SB
#endif
1da177e4 LT |
112 | |
113 | /* | |
114 | * State flag for unwritten extent buffers. | |
115 | * | |
116 | * We need to be able to distinguish between these and delayed | |
117 | * allocate buffers within XFS. The generic IO path code does | |
118 | * not need to distinguish - we use the BH_Delay flag for both | |
119 | * delalloc and these ondisk-uninitialised buffers. | |
120 | */ | |
/*
 * Instantiate BUFFER_FNS for the PrivateStart bit under the name "unwritten".
 * NOTE(review): BUFFER_FNS is defined outside this file; presumably it emits
 * the set/clear/test helpers for that buffer state bit - confirm.
 */
121 | BUFFER_FNS(PrivateStart, unwritten); | |
1da177e4 LT |
122 | |
/*
 * Short names for the tunables stored in xfs_params.  Every alias expands
 * to the .val member of the matching xfs_params entry, so it can be used
 * both to read and to assign the current value.
 */

/* entries that are not inherit_* or xfs_buf_* */
#define restricted_chown	xfs_params.restrict_chown.val
#define irix_sgid_inherit	xfs_params.sgid_inherit.val
#define irix_symlink_mode	xfs_params.symlink_mode.val
#define xfs_panic_mask		xfs_params.panic_mask.val
#define xfs_error_level		xfs_params.error_level.val
#define xfs_syncd_centisecs	xfs_params.syncd_timer.val
#define xfs_stats_clear		xfs_params.stats_clear.val
#define xfs_rotorstep		xfs_params.rotorstep.val

/* inherit_* entries */
#define xfs_inherit_sync	xfs_params.inherit_sync.val
#define xfs_inherit_nodump	xfs_params.inherit_nodump.val
#define xfs_inherit_noatime	xfs_params.inherit_noatim.val
#define xfs_inherit_nosymlinks	xfs_params.inherit_nosym.val
#define xfs_inherit_nodefrag	xfs_params.inherit_nodfrg.val

/* xfs_buf_* entries */
#define xfs_buf_timer_centisecs	xfs_params.xfs_buf_timer.val
#define xfs_buf_age_centisecs	xfs_params.xfs_buf_age.val
1da177e4 | 138 | |
/*
 * Accessors for the currently running task.
 *
 * current_set_flags() and current_clear_flags() update current->flags in
 * place and evaluate to the new flag word; current_test_flags() only reads
 * it.  The *_nested variants first store the whole flag word in *(sp), so
 * that current_restore_flags_nested() can later put back just the bits
 * selected by (f) while leaving all other bits as they are now.
 *
 * The cred argument of current_fsuid()/current_fsgid() is ignored.
 */
#define current_cpu()		(raw_smp_processor_id())
#define current_pid()		(current->pid)
#define current_fsuid(cred)	(current->fsuid)
#define current_fsgid(cred)	(current->fsgid)
#define current_set_flags(f)	(current->flags |= (f))
#define current_test_flags(f)	(current->flags & (f))
/* must be &=: a plain & only computes the value and clears nothing */
#define current_clear_flags(f)	(current->flags &= ~(f))
#define current_set_flags_nested(sp, f)		\
		(*(sp) = current->flags, current->flags |= (f))
#define current_clear_flags_nested(sp, f)	\
		(*(sp) = current->flags, current->flags &= ~(f))
#define current_restore_flags_nested(sp, f)	\
		(current->flags = ((current->flags & ~(f)) | (*(sp) & (f))))
1da177e4 LT |
152 | |
/*
 * Page ("click") geometry and conversion helpers.
 *
 * A click is one page: NBPC is PAGE_SIZE and BPCSHIFT is PAGE_SHIFT.
 * DPPSHFT is PAGE_SHIFT - 9, i.e. the shift between 512-byte units and
 * pages, and NDPP is the number of such units in one page.
 *
 * Each macro is defined exactly once; btoc() and btoct() used to be
 * repeated further down with identical bodies.
 */
#define NBPP		PAGE_SIZE
#define DPPSHFT		(PAGE_SHIFT - 9)
#define NDPP		(1 << (PAGE_SHIFT - 9))
#define dtop(DD)	(((DD) + NDPP - 1) >> DPPSHFT)	/* rounds up */
#define dtopt(DD)	((DD) >> DPPSHFT)		/* truncates */
#define dpoff(DD)	((DD) & (NDPP-1))		/* offset within page */

#define NBBY		8		/* number of bits per byte */
#define NBPC		PAGE_SIZE	/* Number of bytes per click */
#define BPCSHIFT	PAGE_SHIFT	/* LOG2(NBPC) if exact */

/*
 * Size of block device i/o is parameterized here.
 * Currently the system supports page-sized i/o.
 */
#define BLKDEV_IOSHIFT		BPCSHIFT
#define BLKDEV_IOSIZE		(1<<BLKDEV_IOSHIFT)
/* number of BB's per block device block */
#define BLKDEV_BB		BTOBB(BLKDEV_IOSIZE)

/* bytes to clicks: the plain forms round up, the ...ct forms truncate */
#define btoc(x)		(((__psunsigned_t)(x)+(NBPC-1))>>BPCSHIFT)
#define btoct(x)	((__psunsigned_t)(x)>>BPCSHIFT)
#define btoc64(x)	(((__uint64_t)(x)+(NBPC-1))>>BPCSHIFT)
#define btoct64(x)	((__uint64_t)(x)>>BPCSHIFT)
#define io_btoc(x)	(((__psunsigned_t)(x)+(IO_NBPC-1))>>IO_BPCSHIFT)
#define io_btoct(x)	((__psunsigned_t)(x)>>IO_BPCSHIFT)

/* off_t bytes to clicks */
#define offtoc(x)	(((__uint64_t)(x)+(NBPC-1))>>BPCSHIFT)
#define offtoct(x)	((xfs_off_t)(x)>>BPCSHIFT)

/* clicks to off_t bytes */
#define ctooff(x)	((xfs_off_t)(x)<<BPCSHIFT)

/* clicks to bytes */
#define ctob(x)		((__psunsigned_t)(x)<<BPCSHIFT)
#define ctob64(x)	((__uint64_t)(x)<<BPCSHIFT)
#define io_ctob(x)	((__psunsigned_t)(x)<<IO_BPCSHIFT)
196 | ||
1da177e4 LT |
#if !defined(ENOATTR)
# define ENOATTR	ENODATA		/* Attribute not found */
#endif

/*
 * Mount with wrong filesystem type.
 * Note: EWRONGFS never visible outside the kernel.
 */
#define EWRONGFS	EINVAL

/*
 * Filesystem is corrupted.
 *
 * XXX EFSCORRUPTED needs a real value in errno.h.  asm-i386/errno.h won't
 *     return codes out of its known range in errno.
 * XXX Also note: needs to be < 1000 and fairly unique on Linux (mustn't
 *     conflict with any code we use already or any code a driver may use)
 * XXX Some options (currently we do #2):
 *	1/ New error code ["Filesystem is corrupted", _after_ glibc updated]
 *	2/ 990 ["Unknown error 990"]
 *	3/ EUCLEAN ["Structure needs cleaning"]
 *	4/ Convert EFSCORRUPTED to EIO [just prior to return into userspace]
 */
#define EFSCORRUPTED	990

/* SYNCHRONIZE() is simply barrier() */
#define SYNCHRONIZE()	barrier()
/* return address of the function that expands this macro */
#define __return_address __builtin_return_address(0)
219 | ||
/*
 * Group and project quota commands.
 *
 * IRIX (BSD) quotactl uses a separate command for each of user/group,
 * whereas the Linux syscall encodes that information into the cmd field
 * (see the QCMD macro in quota.h).  These macros help keep the code
 * portable - they are not visible from the syscall interface.
 */
#define Q_XSETGQLIM	XQM_CMD(8)	/* set groups disk limits */
#define Q_XGETGQUOTA	XQM_CMD(9)	/* get groups disk limits */
#define Q_XSETPQLIM	XQM_CMD(10)	/* set projects disk limits */
#define Q_XGETPQUOTA	XQM_CMD(11)	/* get projects disk limits */
1da177e4 | 230 | |
#define dfltprid	0
#define MAXPATHLEN	1024

/* thin wrappers: min() and max() have to be provided elsewhere */
#define MIN(a,b)	(min(a,b))
#define MAX(a,b)	(max(a,b))

/*
 * howmany(): number of y-sized units needed to cover x.
 * roundup(): x rounded up to the next multiple of y.
 * Both evaluate y more than once.
 */
#define howmany(x, y)	(((x)+((y)-1))/(y))
#define roundup(x, y)	(howmany(x, y)*(y))
238 | ||
cde410a9 NS |
/*
 * Glue for platform dependent services that have no better home.
 */

/* sort() with its last argument fixed to NULL */
#define xfs_sort(a,n,s,fn)	sort(a,n,s,fn,NULL)

#define xfs_stack_trace()	dump_stack()

/* the result of vmtruncate() is negated before it is handed back */
#define xfs_itruncate_data(ip, off)	\
	(-vmtruncate(vn_to_inode(XFS_ITOV(ip)), (off)))

/*
 * Store the huge-encoded data device number of mp in statp->f_fsid:
 * the low 32 bits go to val[0], the high 32 bits to val[1].
 */
#define xfs_statvfs_fsid(statp, mp)	\
	({ u64 id = huge_encode_dev((mp)->m_ddev_targp->bt_dev);	\
	   __kernel_fsid_t *fsid = &(statp)->f_fsid;			\
	   fsid->val[0] = (u32)id;					\
	   fsid->val[1] = (u32)(id >> 32); })
1da177e4 LT |
250 | |
251 | ||
252 | /* Move the kernel do_div definition off to one side */ | |
253 | ||
254 | #if defined __i386__ | |
255 | /* For ia32 we need to pull some tricks to get past various versions | |
256 | * of the compiler which do not like us using do_div in the middle | |
257 | * of large functions. | |
258 | */ | |
259 | static inline __u32 xfs_do_div(void *a, __u32 b, int n) | |
260 | { | |
261 | __u32 mod; | |
262 | ||
263 | switch (n) { | |
264 | case 4: | |
265 | mod = *(__u32 *)a % b; | |
266 | *(__u32 *)a = *(__u32 *)a / b; | |
267 | return mod; | |
268 | case 8: | |
269 | { | |
270 | unsigned long __upper, __low, __high, __mod; | |
271 | __u64 c = *(__u64 *)a; | |
272 | __upper = __high = c >> 32; | |
273 | __low = c; | |
274 | if (__high) { | |
275 | __upper = __high % (b); | |
276 | __high = __high / (b); | |
277 | } | |
278 | asm("divl %2":"=a" (__low), "=d" (__mod):"rm" (b), "0" (__low), "1" (__upper)); | |
279 | asm("":"=A" (c):"a" (__low),"d" (__high)); | |
280 | *(__u64 *)a = c; | |
281 | return __mod; | |
282 | } | |
283 | } | |
284 | ||
285 | /* NOTREACHED */ | |
286 | return 0; | |
287 | } | |
288 | ||
289 | /* Side effect free 64 bit mod operation */ | |
290 | static inline __u32 xfs_do_mod(void *a, __u32 b, int n) | |
291 | { | |
292 | switch (n) { | |
293 | case 4: | |
294 | return *(__u32 *)a % b; | |
295 | case 8: | |
296 | { | |
297 | unsigned long __upper, __low, __high, __mod; | |
298 | __u64 c = *(__u64 *)a; | |
299 | __upper = __high = c >> 32; | |
300 | __low = c; | |
301 | if (__high) { | |
302 | __upper = __high % (b); | |
303 | __high = __high / (b); | |
304 | } | |
305 | asm("divl %2":"=a" (__low), "=d" (__mod):"rm" (b), "0" (__low), "1" (__upper)); | |
306 | asm("":"=A" (c):"a" (__low),"d" (__high)); | |
307 | return __mod; | |
308 | } | |
309 | } | |
310 | ||
311 | /* NOTREACHED */ | |
312 | return 0; | |
313 | } | |
314 | #else | |
315 | static inline __u32 xfs_do_div(void *a, __u32 b, int n) | |
316 | { | |
317 | __u32 mod; | |
318 | ||
319 | switch (n) { | |
320 | case 4: | |
321 | mod = *(__u32 *)a % b; | |
322 | *(__u32 *)a = *(__u32 *)a / b; | |
323 | return mod; | |
324 | case 8: | |
325 | mod = do_div(*(__u64 *)a, b); | |
326 | return mod; | |
327 | } | |
328 | ||
329 | /* NOTREACHED */ | |
330 | return 0; | |
331 | } | |
332 | ||
333 | /* Side effect free 64 bit mod operation */ | |
334 | static inline __u32 xfs_do_mod(void *a, __u32 b, int n) | |
335 | { | |
336 | switch (n) { | |
337 | case 4: | |
338 | return *(__u32 *)a % b; | |
339 | case 8: | |
340 | { | |
341 | __u64 c = *(__u64 *)a; | |
342 | return do_div(c, b); | |
343 | } | |
344 | } | |
345 | ||
346 | /* NOTREACHED */ | |
347 | return 0; | |
348 | } | |
349 | #endif | |
350 | ||
/*
 * From here on do_div() and do_mod() go through the XFS helpers, which
 * pick the 4 or 8 byte variant from sizeof(a).  (a) must be an lvalue
 * because its address is taken.
 */
#ifdef do_div
# undef do_div
#endif
#define do_div(a, b)	xfs_do_div(&(a), (b), sizeof(a))
#define do_mod(a, b)	xfs_do_mod(&(a), (b), sizeof(a))
354 | ||
355 | static inline __uint64_t roundup_64(__uint64_t x, __uint32_t y) | |
356 | { | |
357 | x += y - 1; | |
358 | do_div(x, y); | |
359 | return(x * y); | |
360 | } | |
361 | ||
1da177e4 | 362 | #endif /* __XFS_LINUX__ */ |