Commit | Line | Data |
---|---|---|
1da177e4 LT |
1 | /* |
2 | * Copyright (c) 2000-2004 Silicon Graphics, Inc. All Rights Reserved. | |
3 | * | |
4 | * This program is free software; you can redistribute it and/or modify it | |
5 | * under the terms of version 2 of the GNU General Public License as | |
6 | * published by the Free Software Foundation. | |
7 | * | |
8 | * This program is distributed in the hope that it would be useful, but | |
9 | * WITHOUT ANY WARRANTY; without even the implied warranty of | |
10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. | |
11 | * | |
12 | * Further, this software is distributed without any warranty that it is | |
13 | * free of the rightful claim of any third person regarding infringement | |
14 | * or the like. Any license provided herein, whether implied or | |
15 | * otherwise, applies only to this software file. Patent licenses, if | |
16 | * any, provided herein do not apply to combinations of this program with | |
17 | * other software, or any other product whatsoever. | |
18 | * | |
19 | * You should have received a copy of the GNU General Public License along | |
20 | * with this program; if not, write the Free Software Foundation, Inc., 59 | |
21 | * Temple Place - Suite 330, Boston MA 02111-1307, USA. | |
22 | * | |
23 | * Contact information: Silicon Graphics, Inc., 1600 Amphitheatre Pkwy, | |
24 | * Mountain View, CA 94043, or: | |
25 | * | |
26 | * http://www.sgi.com | |
27 | * | |
28 | * For further information regarding this notice, see: | |
29 | * | |
30 | * http://oss.sgi.com/projects/GenInfo/SGIGPLNoticeExplan/ | |
31 | */ | |
32 | #ifndef __XFS_LINUX__ | |
33 | #define __XFS_LINUX__ | |
34 | ||
35 | #include <linux/types.h> | |
36 | #include <linux/config.h> | |
37 | ||
/*
 * Target-dependent type widths.
 *
 * XFS_BIG_BLKNOS needs block layer disk addresses to be 64 bits wide:
 * that is the case on 64-bit builds, or when CONFIG_LBD is enabled.
 * XFS_BIG_INUMS needs the VFS inode number to be 64 bits wide and also
 * requires XFS_BIG_BLKNOS; it is switched on for 64-bit builds only.
 */
#if BITS_PER_LONG == 64
# define XFS_BIG_BLKNOS	1
# define XFS_BIG_INUMS	1
#elif defined(CONFIG_LBD)
# define XFS_BIG_BLKNOS	1
# define XFS_BIG_INUMS	0
#else
# define XFS_BIG_BLKNOS	0
# define XFS_BIG_INUMS	0
#endif
55 | ||
56 | #include <xfs_types.h> | |
57 | #include <xfs_arch.h> | |
58 | ||
59 | #include <kmem.h> | |
60 | #include <mrlock.h> | |
61 | #include <spin.h> | |
62 | #include <sv.h> | |
63 | #include <mutex.h> | |
64 | #include <sema.h> | |
65 | #include <time.h> | |
66 | ||
67 | #include <support/qsort.h> | |
68 | #include <support/ktrace.h> | |
69 | #include <support/debug.h> | |
70 | #include <support/move.h> | |
71 | #include <support/uuid.h> | |
72 | ||
73 | #include <linux/mm.h> | |
74 | #include <linux/kernel.h> | |
75 | #include <linux/blkdev.h> | |
76 | #include <linux/slab.h> | |
77 | #include <linux/module.h> | |
78 | #include <linux/file.h> | |
79 | #include <linux/swap.h> | |
80 | #include <linux/errno.h> | |
81 | #include <linux/sched.h> | |
82 | #include <linux/bitops.h> | |
83 | #include <linux/major.h> | |
84 | #include <linux/pagemap.h> | |
85 | #include <linux/vfs.h> | |
86 | #include <linux/seq_file.h> | |
87 | #include <linux/init.h> | |
88 | #include <linux/list.h> | |
89 | #include <linux/proc_fs.h> | |
90 | #include <linux/version.h> | |
91 | #include <linux/sort.h> | |
92 | ||
93 | #include <asm/page.h> | |
94 | #include <asm/div64.h> | |
95 | #include <asm/param.h> | |
96 | #include <asm/uaccess.h> | |
97 | #include <asm/byteorder.h> | |
98 | #include <asm/unaligned.h> | |
99 | ||
100 | #include <xfs_behavior.h> | |
101 | #include <xfs_vfs.h> | |
102 | #include <xfs_cred.h> | |
103 | #include <xfs_vnode.h> | |
104 | #include <xfs_stats.h> | |
105 | #include <xfs_sysctl.h> | |
106 | #include <xfs_iops.h> | |
0829c360 | 107 | #include <xfs_aops.h> |
1da177e4 LT |
108 | #include <xfs_super.h> |
109 | #include <xfs_globals.h> | |
110 | #include <xfs_fs_subr.h> | |
111 | #include <xfs_lrw.h> | |
112 | #include <xfs_buf.h> | |
113 | ||
/*
 * Feature switches: a feature is disabled with #undef and enabled
 * with #define.
 */
#undef  HAVE_REFCACHE	/* reference cache not needed for NFS in 2.6 */
#define HAVE_SENDFILE	/* sendfile(2) exists in 2.6, but not in 2.4 */
119 | ||
120 | /* | |
121 | * State flag for unwritten extent buffers. | |
122 | * | |
123 | * We need to be able to distinguish between these and delayed | |
124 | * allocate buffers within XFS. The generic IO path code does | |
125 | * not need to distinguish - we use the BH_Delay flag for both | |
126 | * delalloc and these ondisk-uninitialised buffers. | |
127 | */ | |
128 | BUFFER_FNS(PrivateStart, unwritten); | |
129 | static inline void set_buffer_unwritten_io(struct buffer_head *bh) | |
130 | { | |
131 | bh->b_end_io = linvfs_unwritten_done; | |
132 | } | |
133 | ||
/*
 * Short names for the ".val" member of each tunable held in xfs_params.
 */
#define restricted_chown		xfs_params.restrict_chown.val
#define irix_sgid_inherit		xfs_params.sgid_inherit.val
#define irix_symlink_mode		xfs_params.symlink_mode.val
#define xfs_panic_mask			xfs_params.panic_mask.val
#define xfs_error_level			xfs_params.error_level.val
#define xfs_syncd_centisecs		xfs_params.syncd_timer.val
#define xfs_stats_clear			xfs_params.stats_clear.val
#define xfs_inherit_sync		xfs_params.inherit_sync.val
#define xfs_inherit_nodump		xfs_params.inherit_nodump.val
#define xfs_inherit_noatime		xfs_params.inherit_noatim.val
#define xfs_buf_timer_centisecs		xfs_params.xfs_buf_timer.val
#define xfs_buf_age_centisecs		xfs_params.xfs_buf_age.val
#define xfs_inherit_nosymlinks		xfs_params.inherit_nosym.val
#define xfs_rotorstep			xfs_params.rotorstep.val
148 | ||
39c715b7 IM |
/* Fall back to smp_processor_id() where raw_smp_processor_id is not provided. */
#if !defined(raw_smp_processor_id)
# define raw_smp_processor_id()	smp_processor_id()
#endif

/*
 * Accessors for the executing CPU and for fields of "current".
 * The cred argument of current_fsuid()/current_fsgid() is not used.
 */
#define current_cpu()		raw_smp_processor_id()
#define current_pid()		(current->pid)
#define current_fsuid(cred)	(current->fsuid)
#define current_fsgid(cred)	(current->fsgid)
156 | ||
/*
 * Page geometry.  DPPSHFT is PAGE_SHIFT - 9, so dtop(), dtopt() and
 * dpoff() operate on counts of 512-byte (1 << 9) units.
 */
#define NBPP		PAGE_SIZE
#define DPPSHFT		(PAGE_SHIFT - 9)
#define NDPP		(1 << (PAGE_SHIFT - 9))
#define dtop(DD)	(((DD) + NDPP - 1) >> DPPSHFT)	/* to pages, rounding up */
#define dtopt(DD)	((DD) >> DPPSHFT)		/* to pages, truncating */
#define dpoff(DD)	((DD) & (NDPP-1))		/* remainder within a page */

#define NBBY		8		/* number of bits per byte */
#define NBPC		PAGE_SIZE	/* Number of bytes per click */
#define BPCSHIFT	PAGE_SHIFT	/* LOG2(NBPC) if exact */

/*
 * Size of block device i/o is parameterized here.
 * Currently the system supports page-sized i/o.
 */
#define BLKDEV_IOSHIFT	BPCSHIFT
#define BLKDEV_IOSIZE	(1<<BLKDEV_IOSHIFT)
/* number of BB's per block device block */
#define BLKDEV_BB	BTOBB(BLKDEV_IOSIZE)

/*
 * bytes to clicks: the btoc*() forms round up to a whole click, the
 * btoct*() forms truncate.
 *
 * NOTE(review): IO_NBPC and IO_BPCSHIFT, used by the io_*() variants, are
 * not defined in this header - confirm a definition is in scope before
 * using them.
 */
#define btoc(x)		(((__psunsigned_t)(x)+(NBPC-1))>>BPCSHIFT)
#define btoct(x)	((__psunsigned_t)(x)>>BPCSHIFT)
#define btoc64(x)	(((__uint64_t)(x)+(NBPC-1))>>BPCSHIFT)
#define btoct64(x)	((__uint64_t)(x)>>BPCSHIFT)
#define io_btoc(x)	(((__psunsigned_t)(x)+(IO_NBPC-1))>>IO_BPCSHIFT)
#define io_btoct(x)	((__psunsigned_t)(x)>>IO_BPCSHIFT)

/* off_t bytes to clicks (offtoc rounds up, offtoct truncates) */
#define offtoc(x)	(((__uint64_t)(x)+(NBPC-1))>>BPCSHIFT)
#define offtoct(x)	((xfs_off_t)(x)>>BPCSHIFT)

/* clicks to off_t bytes */
#define ctooff(x)	((xfs_off_t)(x)<<BPCSHIFT)

/* clicks to bytes */
#define ctob(x)		((__psunsigned_t)(x)<<BPCSHIFT)
#define ctob64(x)	((__uint64_t)(x)<<BPCSHIFT)
#define io_ctob(x)	((__psunsigned_t)(x)<<IO_BPCSHIFT)
200 | ||
/* Expands to nothing unless CELL_CAPABLE is defined. */
#if !defined(CELL_CAPABLE)
#define FSC_NOTIFY_NAME_CHANGED(vp)
#endif

#if !defined(ENOATTR)
#define ENOATTR		ENODATA	/* Attribute not found */
#endif

/* Note: EWRONGFS never visible outside the kernel */
#define EWRONGFS	EINVAL	/* Mount with wrong filesystem type */

/*
 * XXX EFSCORRUPTED needs a real value in errno.h.  asm-i386/errno.h won't
 *     return codes out of its known range in errno.
 * XXX The value also has to be < 1000 and fairly unique on Linux: it
 *     mustn't conflict with any code we use already or any code a driver
 *     may use.
 * XXX Options considered (option 2 is what is currently done):
 *	1/ New error code ["Filesystem is corrupted", _after_ glibc updated]
 *	2/ 990 ["Unknown error 990"]
 *	3/ EUCLEAN ["Structure needs cleaning"]
 *	4/ Convert EFSCORRUPTED to EIO [just prior to return into userspace]
 */
#define EFSCORRUPTED	990	/* Filesystem is corrupted */

#define SYNCHRONIZE()		barrier()
#define __return_address	__builtin_return_address(0)
227 | ||
/*
 * Group and project quota commands.
 *
 * IRIX (BSD) quotactl has separate commands for user and group quota,
 * whereas the Linux syscall encodes that information in the cmd field
 * (see the QCMD macro in quota.h).  These macros help keep the code
 * portable - they are not visible from the syscall interface.
 */
#define Q_XSETGQLIM	XQM_CMD(8)	/* set groups disk limits */
#define Q_XGETGQUOTA	XQM_CMD(9)	/* get groups disk limits */
#define Q_XSETPQLIM	XQM_CMD(10)	/* set projects disk limits */
#define Q_XGETPQUOTA	XQM_CMD(11)	/* get projects disk limits */

/*
 * IRIX uses a dynamic sizing algorithm (ndquot = 200 + numprocs*2);
 * a fixed value is used here and may well need fine-tuning if it ever
 * becomes an issue.
 */
#define DQUOT_MAX_HEURISTIC	1024	/* NR_DQUOTS */
#define ndquot			DQUOT_MAX_HEURISTIC

/*
 * IRIX uses the current size of the name cache to guess a good value;
 * this isn't the same but is a good enough starting point for now.
 */
#define DQUOT_HASH_HEURISTIC	files_stat.nr_files

/* IRIX inodes maintain the project ID also, zero this field on Linux */
#define DEFAULT_PROJID		0
#define dfltprid		DEFAULT_PROJID
251 | ||
#define MAXPATHLEN	1024

/* Upper-case spellings of min()/max(), which must be in scope. */
#define MIN(a,b)	(min(a,b))
#define MAX(a,b)	(max(a,b))

/*
 * howmany(): number of y-sized units needed to hold x.
 * roundup(): x rounded up to the next multiple of y.
 * Both evaluate y more than once.
 */
#define howmany(x, y)	(((x)+((y)-1))/(y))
#define roundup(x, y)	((((x)+((y)-1))/(y))*(y))

#define xfs_stack_trace()	dump_stack()

/* Calls vmtruncate() on the Linux inode behind ip and negates its result. */
#define xfs_itruncate_data(ip, off)	\
	(-vmtruncate(LINVFS_GET_IP(XFS_ITOV(ip)), (off)))
263 | ||
264 | ||
265 | /* Move the kernel do_div definition off to one side */ | |
266 | ||
267 | #if defined __i386__ | |
268 | /* For ia32 we need to pull some tricks to get past various versions | |
269 | * of the compiler which do not like us using do_div in the middle | |
270 | * of large functions. | |
271 | */ | |
/*
 * xfs_do_div - divide the unsigned value at @a by @b in place (ia32 version).
 * @a: points at a __u32 when @n is 4, at a __u64 when @n is 8
 * @b: 32-bit divisor
 * @n: size in bytes of the object @a points at
 *
 * The quotient is stored back through @a and the remainder is returned.
 * Any other @n leaves *@a alone and returns 0.
 *
 * For the 64-bit case the high word is divided first; its remainder and
 * the low word are then fed to a single divl, and the two quotient halves
 * are recombined into a 64-bit value through the "A" (edx:eax) constraint.
 */
static inline __u32 xfs_do_div(void *a, __u32 b, int n)
{
	if (n == 4) {
		__u32	*val32 = a;
		__u32	rem32 = *val32 % b;

		*val32 = *val32 / b;
		return rem32;
	}

	if (n == 8) {
		unsigned long	hi_rem, lo, hi, rem;
		__u64		wide = *(__u64 *)a;

		hi = wide >> 32;
		hi_rem = hi;
		lo = wide;
		if (hi) {
			hi_rem = hi % (b);
			hi = hi / (b);
		}
		__asm__("divl %2":"=a" (lo), "=d" (rem):"rm" (b), "0" (lo), "1" (hi_rem));
		__asm__("":"=A" (wide):"a" (lo),"d" (hi));
		*(__u64 *)a = wide;
		return rem;
	}

	/* NOTREACHED */
	return 0;
}
301 | ||
/*
 * xfs_do_mod - side effect free remainder of an unsigned value (ia32 version).
 * @a: points at a __u32 when @n is 4, at a __u64 when @n is 8
 * @b: 32-bit divisor
 * @n: size in bytes of the object @a points at
 *
 * Returns the value at @a modulo @b without modifying it.  Any other @n
 * returns 0.
 *
 * Only the remainder is wanted, so the 64-bit case reduces the high word
 * modulo @b and then lets one divl divide (reduced high word : low word).
 * No quotient is assembled, because nothing would read it.
 */
static inline __u32 xfs_do_mod(void *a, __u32 b, int n)
{
	switch (n) {
	case 4:
		return *(__u32 *)a % b;
	case 8:
		{
		unsigned long	hi_rem, lo, rem;
		__u64		c = *(__u64 *)a;

		hi_rem = c >> 32;
		lo = c;
		if (hi_rem)
			hi_rem = hi_rem % (b);	/* keeps the divl quotient within 32 bits */
		/* lo receives the quotient only because divl always writes eax */
		__asm__("divl %2":"=a" (lo), "=d" (rem):"rm" (b), "0" (lo), "1" (hi_rem));
		return rem;
		}
	}

	/* NOTREACHED */
	return 0;
}
327 | #else | |
/*
 * xfs_do_div - divide the unsigned value at @a by @b in place.
 * @a: points at a __u32 when @n is 4, at a __u64 when @n is 8
 * @b: 32-bit divisor
 * @n: size in bytes of the object @a points at
 *
 * The quotient is stored back through @a and the remainder is returned.
 * The 64-bit case is handed to the kernel's do_div().  Any other @n
 * leaves *@a alone and returns 0.
 */
static inline __u32 xfs_do_div(void *a, __u32 b, int n)
{
	if (n == 4) {
		__u32	*val32 = a;
		__u32	rem32 = *val32 % b;

		*val32 = *val32 / b;
		return rem32;
	}

	if (n == 8)
		return do_div(*(__u64 *)a, b);

	/* NOTREACHED */
	return 0;
}
345 | ||
/*
 * xfs_do_mod - side effect free remainder of an unsigned value.
 * @a: points at a __u32 when @n is 4, at a __u64 when @n is 8
 * @b: 32-bit divisor
 * @n: size in bytes of the object @a points at
 *
 * Returns the value at @a modulo @b.  The 64-bit case runs do_div() on a
 * local copy so that the caller's value is left untouched.  Any other @n
 * returns 0.
 */
static inline __u32 xfs_do_mod(void *a, __u32 b, int n)
{
	if (n == 4)
		return *(__u32 *)a % b;

	if (n == 8) {
		__u64	scratch = *(__u64 *)a;

		return do_div(scratch, b);
	}

	/* NOTREACHED */
	return 0;
}
362 | #endif | |
363 | ||
/*
 * From here on do_div() resolves to the XFS helper rather than the kernel
 * definition; do_mod() is its non-modifying counterpart.  Both pass the
 * address and the size of their first argument, so it must be an lvalue.
 */
#undef do_div
#define do_div(a, b)	xfs_do_div(&(a), (b), sizeof(a))
#define do_mod(a, b)	xfs_do_mod(&(a), (b), sizeof(a))
367 | ||
368 | static inline __uint64_t roundup_64(__uint64_t x, __uint32_t y) | |
369 | { | |
370 | x += y - 1; | |
371 | do_div(x, y); | |
372 | return(x * y); | |
373 | } | |
374 | ||
/* qsort() forwards to sort() with NULL appended as the fifth argument. */
#define qsort(a, n, s, cmp)	sort(a, n, s, cmp, NULL)
376 | ||
377 | #endif /* __XFS_LINUX__ */ |