2005-04-16 18:20:36 -04:00
|
|
|
/*
|
2005-11-01 22:58:39 -05:00
|
|
|
* Copyright (c) 2000-2005 Silicon Graphics, Inc.
|
|
|
|
* All Rights Reserved.
|
2005-04-16 18:20:36 -04:00
|
|
|
*
|
2005-11-01 22:58:39 -05:00
|
|
|
* This program is free software; you can redistribute it and/or
|
|
|
|
* modify it under the terms of the GNU General Public License as
|
2005-04-16 18:20:36 -04:00
|
|
|
* published by the Free Software Foundation.
|
|
|
|
*
|
2005-11-01 22:58:39 -05:00
|
|
|
* This program is distributed in the hope that it would be useful,
|
|
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
* GNU General Public License for more details.
|
2005-04-16 18:20:36 -04:00
|
|
|
*
|
2005-11-01 22:58:39 -05:00
|
|
|
* You should have received a copy of the GNU General Public License
|
|
|
|
* along with this program; if not, write the Free Software Foundation,
|
|
|
|
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA
|
2005-04-16 18:20:36 -04:00
|
|
|
*/
|
|
|
|
#ifndef __XFS_LINUX__
|
|
|
|
#define __XFS_LINUX__
|
|
|
|
|
|
|
|
#include <linux/types.h>
|
|
|
|
#include <linux/config.h>
|
|
|
|
|
|
|
|
/*
 * Target-dependent type widths.
 *
 * XFS_BIG_BLKNOS: block layer disk addresses are 64 bits wide, which is
 * the case when CONFIG_LBD is set or when long is 64 bits.
 *
 * XFS_BIG_INUMS: the VFS inode number is 64 bits wide.  This is only
 * enabled when long is 64 bits, a condition that also switches on
 * XFS_BIG_BLKNOS, so XFS_BIG_INUMS is never set without it.
 */
#if defined(CONFIG_LBD) || (BITS_PER_LONG == 64)
# define XFS_BIG_BLKNOS	1
#else
# define XFS_BIG_BLKNOS	0
#endif

#if BITS_PER_LONG == 64
# define XFS_BIG_INUMS	1
#else
# define XFS_BIG_INUMS	0
#endif
|
|
|
|
|
|
|
|
#include <xfs_types.h>
|
|
|
|
#include <xfs_arch.h>
|
|
|
|
|
|
|
|
#include <kmem.h>
|
|
|
|
#include <mrlock.h>
|
|
|
|
#include <spin.h>
|
|
|
|
#include <sv.h>
|
|
|
|
#include <mutex.h>
|
|
|
|
#include <sema.h>
|
|
|
|
#include <time.h>
|
|
|
|
|
|
|
|
#include <support/ktrace.h>
|
|
|
|
#include <support/debug.h>
|
|
|
|
#include <support/move.h>
|
|
|
|
#include <support/uuid.h>
|
|
|
|
|
|
|
|
#include <linux/mm.h>
|
|
|
|
#include <linux/kernel.h>
|
|
|
|
#include <linux/blkdev.h>
|
|
|
|
#include <linux/slab.h>
|
|
|
|
#include <linux/module.h>
|
|
|
|
#include <linux/file.h>
|
|
|
|
#include <linux/swap.h>
|
|
|
|
#include <linux/errno.h>
|
|
|
|
#include <linux/sched.h>
|
|
|
|
#include <linux/bitops.h>
|
|
|
|
#include <linux/major.h>
|
|
|
|
#include <linux/pagemap.h>
|
|
|
|
#include <linux/vfs.h>
|
|
|
|
#include <linux/seq_file.h>
|
|
|
|
#include <linux/init.h>
|
|
|
|
#include <linux/list.h>
|
|
|
|
#include <linux/proc_fs.h>
|
|
|
|
#include <linux/sort.h>
|
|
|
|
|
|
|
|
#include <asm/page.h>
|
|
|
|
#include <asm/div64.h>
|
|
|
|
#include <asm/param.h>
|
|
|
|
#include <asm/uaccess.h>
|
|
|
|
#include <asm/byteorder.h>
|
|
|
|
#include <asm/unaligned.h>
|
|
|
|
|
|
|
|
#include <xfs_behavior.h>
|
|
|
|
#include <xfs_vfs.h>
|
|
|
|
#include <xfs_cred.h>
|
|
|
|
#include <xfs_vnode.h>
|
|
|
|
#include <xfs_stats.h>
|
|
|
|
#include <xfs_sysctl.h>
|
|
|
|
#include <xfs_iops.h>
|
2005-09-02 02:58:49 -04:00
|
|
|
#include <xfs_aops.h>
|
2005-04-16 18:20:36 -04:00
|
|
|
#include <xfs_super.h>
|
|
|
|
#include <xfs_globals.h>
|
|
|
|
#include <xfs_fs_subr.h>
|
|
|
|
#include <xfs_lrw.h>
|
|
|
|
#include <xfs_buf.h>
|
|
|
|
|
|
|
|
/*
 * Compile-time feature switches: #undef disables, #define enables.
 */
#undef  HAVE_REFCACHE	/* 2.6 NFS does not need the reference cache */
#define HAVE_SENDFILE	/* sendfile(2) is present in 2.6 (absent in 2.4) */
|
|
|
|
|
|
|
|
/*
 * Buffer state flag marking unwritten extent buffers.
 *
 * Inside XFS these must be told apart from delayed allocate buffers.
 * The generic IO path code has no such need: there the BH_Delay flag
 * stands for both delalloc and these ondisk-uninitialised buffers.
 */
BUFFER_FNS(PrivateStart, unwritten);
|
|
|
|
|
|
|
|
/*
 * Shorthand names for the current value (.val) of individual members
 * of xfs_params.
 */
#define restricted_chown	xfs_params.restrict_chown.val
#define irix_sgid_inherit	xfs_params.sgid_inherit.val
#define irix_symlink_mode	xfs_params.symlink_mode.val
#define xfs_panic_mask		xfs_params.panic_mask.val
#define xfs_error_level		xfs_params.error_level.val
#define xfs_syncd_centisecs	xfs_params.syncd_timer.val
#define xfs_stats_clear		xfs_params.stats_clear.val
#define xfs_inherit_sync	xfs_params.inherit_sync.val
#define xfs_inherit_nodump	xfs_params.inherit_nodump.val
#define xfs_inherit_noatime	xfs_params.inherit_noatim.val
#define xfs_buf_timer_centisecs	xfs_params.xfs_buf_timer.val
#define xfs_buf_age_centisecs	xfs_params.xfs_buf_age.val
#define xfs_inherit_nosymlinks	xfs_params.inherit_nosym.val
#define xfs_rotorstep		xfs_params.rotorstep.val
|
|
|
|
|
2005-06-21 20:14:34 -04:00
|
|
|
/*
 * Accessors for the running CPU and the current task.
 *
 * raw_smp_processor_id() is mapped onto smp_processor_id() only when
 * nothing has defined it already.
 */
#ifndef raw_smp_processor_id
#define raw_smp_processor_id()	smp_processor_id()
#endif
#define current_cpu()		raw_smp_processor_id()
#define current_pid()		(current->pid)
/* The cred argument is accepted but not used by the two macros below. */
#define current_fsuid(cred)	(current->fsuid)
#define current_fsgid(cred)	(current->fsgid)
|
|
|
|
|
|
|
|
/*
 * Page ("click") geometry and unit conversions.
 *
 * A "click" is one page (NBPC == PAGE_SIZE).  The DD arguments of the
 * dtop family are counts of 512-byte units, as implied by the
 * (PAGE_SHIFT - 9) shift.
 */
#define NBPP		PAGE_SIZE
#define DPPSHFT		(PAGE_SHIFT - 9)
#define NDPP		(1 << DPPSHFT)
#define dtop(DD)	(((DD) + NDPP - 1) >> DPPSHFT)	/* round up */
#define dtopt(DD)	((DD) >> DPPSHFT)		/* truncate */
#define dpoff(DD)	((DD) & (NDPP-1))		/* offset within page */

#define NBBY		8		/* number of bits per byte */
#define	NBPC		PAGE_SIZE	/* Number of bytes per click */
#define	BPCSHIFT	PAGE_SHIFT	/* LOG2(NBPC) if exact */

/*
 * Size of block device i/o is parameterized here.
 * Currently the system supports page-sized i/o.
 */
#define	BLKDEV_IOSHIFT		BPCSHIFT
#define	BLKDEV_IOSIZE		(1<<BLKDEV_IOSHIFT)
/* number of BB's per block device block */
#define	BLKDEV_BB		BTOBB(BLKDEV_IOSIZE)

/*
 * bytes to clicks: the plain form rounds up, the "t" form truncates.
 *
 * NOTE(review): IO_NBPC and IO_BPCSHIFT are not defined in this file;
 * confirm a definition is in scope before using the io_* variants.
 */
#define	btoc(x)		(((__psunsigned_t)(x)+(NBPC-1))>>BPCSHIFT)
#define	btoct(x)	((__psunsigned_t)(x)>>BPCSHIFT)
#define	btoc64(x)	(((__uint64_t)(x)+(NBPC-1))>>BPCSHIFT)
#define	btoct64(x)	((__uint64_t)(x)>>BPCSHIFT)
#define	io_btoc(x)	(((__psunsigned_t)(x)+(IO_NBPC-1))>>IO_BPCSHIFT)
#define	io_btoct(x)	((__psunsigned_t)(x)>>IO_BPCSHIFT)

/* off_t bytes to clicks */
#define offtoc(x)	(((__uint64_t)(x)+(NBPC-1))>>BPCSHIFT)
#define offtoct(x)	((xfs_off_t)(x)>>BPCSHIFT)

/* clicks to off_t bytes */
#define	ctooff(x)	((xfs_off_t)(x)<<BPCSHIFT)

/* clicks to bytes */
#define	ctob(x)		((__psunsigned_t)(x)<<BPCSHIFT)
#define	ctob64(x)	((__uint64_t)(x)<<BPCSHIFT)
#define	io_ctob(x)	((__psunsigned_t)(x)<<IO_BPCSHIFT)
|
|
|
|
|
|
|
|
/* Fall back to ENODATA when the platform provides no ENOATTR. */
#ifndef ENOATTR
#define ENOATTR		ENODATA	/* Attribute not found */
#endif

/* Note: EWRONGFS never visible outside the kernel */
#define EWRONGFS	EINVAL	/* Mount with wrong filesystem type */

/*
 * XXX EFSCORRUPTED still lacks a real value in errno.h; asm-i386/errno.h
 *     won't return codes out of its known range in errno.
 * XXX The value has to stay below 1000 and be fairly unique on Linux:
 *     it must not clash with any code we already use or any code a
 *     driver may use.
 * XXX Candidate approaches (number 2 is what we do today):
 *	1/ New error code ["Filesystem is corrupted", _after_ glibc updated]
 *	2/ 990 ["Unknown error 990"]
 *	3/ EUCLEAN ["Structure needs cleaning"]
 *	4/ Convert EFSCORRUPTED to EIO [just prior to return into userspace]
 */
#define EFSCORRUPTED	990	/* Filesystem is corrupted */
|
|
|
|
|
|
|
|
/* SYNCHRONIZE() is simply barrier(). */
#define SYNCHRONIZE()		barrier()
/* Return address of the function in which the macro is expanded. */
#define __return_address	__builtin_return_address(0)
|
|
|
|
|
|
|
|
/*
 * The IRIX (BSD) quotactl has distinct commands for user and group
 * quota, while the Linux syscall folds that information into the cmd
 * field (see the QCMD macro in quota.h).  The macros below help keep
 * the code portable; they are not visible from the syscall interface.
 */
#define Q_XSETGQLIM	XQM_CMD(8)	/* set groups disk limits */
#define Q_XGETGQUOTA	XQM_CMD(9)	/* get groups disk limits */
#define Q_XSETPQLIM	XQM_CMD(10)	/* set projects disk limits */
#define Q_XGETPQUOTA	XQM_CMD(11)	/* get projects disk limits */
|
2005-04-16 18:20:36 -04:00
|
|
|
|
2005-11-01 23:08:25 -05:00
|
|
|
#define dfltprid	0
#define MAXPATHLEN	1024

/* Upper-case spellings of min()/max(). */
#define MIN(a,b)	(min(a,b))
#define MAX(a,b)	(max(a,b))

/*
 * howmany(x, y): x divided by y, after first adding (y - 1) to x.
 * roundup(x, y): that same quotient multiplied back by y.
 * Both expand y more than once, so avoid arguments with side effects.
 */
#define howmany(x, y)	(((x)+((y)-1))/(y))
#define roundup(x, y)	((((x)+((y)-1))/(y))*(y))
|
|
|
|
|
2005-09-04 21:47:01 -04:00
|
|
|
/*
 * Various platform dependent calls that don't fit anywhere else
 */

/* sort() with NULL passed as its final argument. */
#define xfs_sort(a,n,s,fn)	sort(a,n,s,fn,NULL)

#define xfs_stack_trace()	dump_stack()

/* Evaluates to the negated return value of vmtruncate(). */
#define xfs_itruncate_data(ip, off)	\
	(-vmtruncate(LINVFS_GET_IP(XFS_ITOV(ip)), (off)))

/*
 * Fill statp->f_fsid from the huge_encode_dev() value of the mount's
 * data device: val[0] takes the low 32 bits, val[1] the high 32 bits.
 */
#define xfs_statvfs_fsid(statp, mp)	\
	({ u64 devid = huge_encode_dev((mp)->m_ddev_targp->bt_dev);	\
	   __kernel_fsid_t *fsidp = &(statp)->f_fsid;			\
	   (fsidp->val[0] = (u32)devid,					\
	    fsidp->val[1] = (u32)(devid >> 32)); })
|
2005-04-16 18:20:36 -04:00
|
|
|
|
|
|
|
|
|
|
|
/* Move the kernel do_div definition off to one side */
|
|
|
|
|
|
|
|
#if defined __i386__
|
|
|
|
/* For ia32 we need to pull some tricks to get past various versions
|
|
|
|
* of the compiler which do not like us using do_div in the middle
|
|
|
|
* of large functions.
|
|
|
|
*/
|
|
|
|
/*
 * ia32 flavour: divide the unsigned value at @a by @b in place.
 *
 * @a: points at the dividend; it is overwritten with the quotient
 * @b: 32-bit divisor
 * @n: size in bytes of the object at @a (4 or 8)
 *
 * Returns the remainder.  Any other @n leaves *@a alone and returns 0.
 */
static inline __u32 xfs_do_div(void *a, __u32 b, int n)
{
	if (n == 4) {
		__u32	*word = (__u32 *)a;
		__u32	rem = *word % b;

		*word = *word / b;
		return rem;
	}

	if (n == 8) {
		unsigned long	__upper, __low, __high, __mod;
		__u64		c = *(__u64 *)a;

		__high = c >> 32;
		__upper = __high;
		__low = c;
		/*
		 * Pre-divide the high word: its remainder becomes the upper
		 * half of divl's dividend and its quotient becomes the high
		 * word of the result.
		 */
		if (__high) {
			__upper = __high % (b);
			__high = __high / (b);
		}
		asm("divl %2":"=a" (__low), "=d" (__mod):"rm" (b), "0" (__low), "1" (__upper));
		/* Glue the two quotient halves back together in edx:eax. */
		asm("":"=A" (c):"a" (__low),"d" (__high));
		*(__u64 *)a = c;
		return __mod;
	}

	/* NOTREACHED */
	return 0;
}
|
|
|
|
|
|
|
|
/* Side effect free 64 bit mod operation */
|
|
|
|
/*
 * ia32 flavour: side effect free mod operation.
 *
 * @a: points at the unsigned dividend; it is only read
 * @b: 32-bit divisor
 * @n: size in bytes of the object at @a (4 or 8)
 *
 * Returns the remainder of *@a / @b, or 0 for any other @n.
 *
 * Only the remainder is wanted, so the quotient of the high word and
 * the recombination of the 64-bit quotient done by xfs_do_div() are
 * not computed here.
 */
static inline __u32 xfs_do_mod(void *a, __u32 b, int n)
{
	switch (n) {
		case 4:
			return *(__u32 *)a % b;
		case 8:
			{
			unsigned long __upper, __low, __mod;
			__u64	c = *(__u64 *)a;

			__upper = c >> 32;
			__low = c;
			/*
			 * Reduce the high word first; its remainder is the
			 * upper half of the dividend handed to divl.
			 */
			if (__upper)
				__upper = __upper % (b);
			/* __low receives the (unused) quotient; __mod the remainder. */
			asm("divl %2":"=a" (__low), "=d" (__mod):"rm" (b), "0" (__low), "1" (__upper));
			return __mod;
			}
	}

	/* NOTREACHED */
	return 0;
}
|
|
|
|
#else
|
|
|
|
/*
 * Generic flavour: divide the unsigned value at @a by @b in place.
 *
 * @a: points at the dividend; it is overwritten with the quotient
 * @b: 32-bit divisor
 * @n: size in bytes of the object at @a (4 or 8)
 *
 * Returns the remainder.  Any other @n leaves *@a alone and returns 0.
 * The 8-byte case is handed to do_div(), which at this point in the
 * file has not yet been redefined by this header.
 */
static inline __u32 xfs_do_div(void *a, __u32 b, int n)
{
	if (n == 4) {
		__u32	*word = (__u32 *)a;
		__u32	rem = *word % b;

		*word = *word / b;
		return rem;
	}

	if (n == 8) {
		__u32	rem = do_div(*(__u64 *)a, b);

		return rem;
	}

	/* NOTREACHED */
	return 0;
}
|
|
|
|
|
|
|
|
/* Side effect free 64 bit mod operation */
|
|
|
|
/*
 * Generic flavour: side effect free mod operation.
 *
 * @a: points at the unsigned dividend; it is only read
 * @b: 32-bit divisor
 * @n: size in bytes of the object at @a (4 or 8)
 *
 * Returns the remainder of *@a / @b, or 0 for any other @n.
 */
static inline __u32 xfs_do_mod(void *a, __u32 b, int n)
{
	if (n == 4)
		return *(__u32 *)a % b;

	if (n == 8) {
		/* do_div() writes to its first operand, so work on a copy. */
		__u64	scratch = *(__u64 *)a;

		return do_div(scratch, b);
	}

	/* NOTREACHED */
	return 0;
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/*
 * From here on do_div() and do_mod() go through the XFS helpers, which
 * pick the 4- or 8-byte path from sizeof(a).  The operand a must be an
 * lvalue because its address is taken.
 */
#undef do_div
#define do_div(a, b)	xfs_do_div(&(a), (b), sizeof(a))
#define do_mod(a, b)	xfs_do_mod(&(a), (b), sizeof(a))
|
|
|
|
|
|
|
|
/*
 * Round the 64-bit value @x up to a multiple of the 32-bit value @y.
 *
 * (y - 1) is added to x, the sum is divided by y with do_div(), and
 * the resulting quotient is multiplied back by y.
 */
static inline __uint64_t roundup_64(__uint64_t x, __uint32_t y)
{
	__uint64_t	quotient = x + (y - 1);

	do_div(quotient, y);
	return quotient * y;
}
|
|
|
|
|
|
|
|
#endif /* __XFS_LINUX__ */
|