forked from Minki/linux
817e9b4d9e
Sparse lead me to the dev_map_desc one and Al Viro lead me to the bufmap one. Signed-off-by: Mike Marshall <hubcap@omnibond.com>
363 lines
11 KiB
C
363 lines
11 KiB
C
/* SPDX-License-Identifier: GPL-2.0 */
|
|
#include <linux/kernel.h>
|
|
#include <linux/types.h>
|
|
#include <linux/spinlock_types.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/ioctl.h>
|
|
|
|
/* khandle stuff ***********************************************************/
|
|
|
|
/*
|
|
* The 2.9 core will put 64 bit handles in here like this:
|
|
* 1234 0000 0000 5678
|
|
* The 3.0 and beyond cores will put 128 bit handles in here like this:
|
|
* 1234 5678 90AB CDEF
|
|
* The kernel module will always use the first four bytes and
|
|
* the last four bytes as an inum.
|
|
*/
|
|
struct orangefs_khandle {
|
|
unsigned char u[16];
|
|
} __aligned(8);
|
|
|
|
/*
|
|
* kernel version of an object ref.
|
|
*/
|
|
struct orangefs_object_kref {
|
|
struct orangefs_khandle khandle;
|
|
__s32 fs_id;
|
|
__s32 __pad1;
|
|
};
|
|
|
|
/*
|
|
* compare 2 khandles assumes little endian thus from large address to
|
|
* small address
|
|
*/
|
|
static inline int ORANGEFS_khandle_cmp(const struct orangefs_khandle *kh1,
|
|
const struct orangefs_khandle *kh2)
|
|
{
|
|
int i;
|
|
|
|
for (i = 15; i >= 0; i--) {
|
|
if (kh1->u[i] > kh2->u[i])
|
|
return 1;
|
|
if (kh1->u[i] < kh2->u[i])
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static inline void ORANGEFS_khandle_to(const struct orangefs_khandle *kh,
|
|
void *p, int size)
|
|
{
|
|
|
|
memcpy(p, kh->u, 16);
|
|
memset(p + 16, 0, size - 16);
|
|
|
|
}
|
|
|
|
static inline void ORANGEFS_khandle_from(struct orangefs_khandle *kh,
|
|
void *p, int size)
|
|
{
|
|
memset(kh, 0, 16);
|
|
memcpy(kh->u, p, 16);
|
|
|
|
}
|
|
|
|
/* pvfs2-types.h ************************************************************/
|
|
|
|
#define ORANGEFS_SUPER_MAGIC 0x20030528
|
|
|
|
/*
|
|
* ORANGEFS error codes are a signed 32-bit integer. Error codes are negative, but
|
|
* the sign is stripped before decoding.
|
|
*/
|
|
|
|
/* Bit 31 is not used since it is the sign. */
|
|
|
|
/*
|
|
* Bit 30 specifies that this is a ORANGEFS error. A ORANGEFS error is either an
|
|
* encoded errno value or a ORANGEFS protocol error.
|
|
*/
|
|
#define ORANGEFS_ERROR_BIT (1 << 30)
|
|
|
|
/*
|
|
* Bit 29 specifies that this is a ORANGEFS protocol error and not an encoded
|
|
* errno value.
|
|
*/
|
|
#define ORANGEFS_NON_ERRNO_ERROR_BIT (1 << 29)
|
|
|
|
/*
|
|
* Bits 9, 8, and 7 specify the error class, which encodes the section of
|
|
* server code the error originated in for logging purposes. It is not used
|
|
* in the kernel except to be masked out.
|
|
*/
|
|
#define ORANGEFS_ERROR_CLASS_BITS 0x380
|
|
|
|
/* Bits 6 - 0 are reserved for the actual error code. */
|
|
#define ORANGEFS_ERROR_NUMBER_BITS 0x7f
|
|
|
|
/* Encoded errno values decoded by PINT_errno_mapping in orangefs-utils.c. */
|
|
|
|
/* Our own ORANGEFS protocol error codes. */
|
|
#define ORANGEFS_ECANCEL (1|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_EDEVINIT (2|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_EDETAIL (3|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_EHOSTNTFD (4|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_EADDRNTFD (5|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_ENORECVR (6|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_ETRYAGAIN (7|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_ENOTPVFS (8|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
#define ORANGEFS_ESECURITY (9|ORANGEFS_NON_ERRNO_ERROR_BIT|ORANGEFS_ERROR_BIT)
|
|
|
|
/* permission bits */
|
|
#define ORANGEFS_O_EXECUTE (1 << 0)
|
|
#define ORANGEFS_O_WRITE (1 << 1)
|
|
#define ORANGEFS_O_READ (1 << 2)
|
|
#define ORANGEFS_G_EXECUTE (1 << 3)
|
|
#define ORANGEFS_G_WRITE (1 << 4)
|
|
#define ORANGEFS_G_READ (1 << 5)
|
|
#define ORANGEFS_U_EXECUTE (1 << 6)
|
|
#define ORANGEFS_U_WRITE (1 << 7)
|
|
#define ORANGEFS_U_READ (1 << 8)
|
|
/* no ORANGEFS_U_VTX (sticky bit) */
|
|
#define ORANGEFS_G_SGID (1 << 10)
|
|
#define ORANGEFS_U_SUID (1 << 11)
|
|
|
|
#define ORANGEFS_ITERATE_START 2147483646
|
|
#define ORANGEFS_ITERATE_END 2147483645
|
|
#define ORANGEFS_IMMUTABLE_FL FS_IMMUTABLE_FL
|
|
#define ORANGEFS_APPEND_FL FS_APPEND_FL
|
|
#define ORANGEFS_NOATIME_FL FS_NOATIME_FL
|
|
#define ORANGEFS_MIRROR_FL 0x01000000ULL
|
|
#define ORANGEFS_FS_ID_NULL ((__s32)0)
|
|
#define ORANGEFS_ATTR_SYS_UID (1 << 0)
|
|
#define ORANGEFS_ATTR_SYS_GID (1 << 1)
|
|
#define ORANGEFS_ATTR_SYS_PERM (1 << 2)
|
|
#define ORANGEFS_ATTR_SYS_ATIME (1 << 3)
|
|
#define ORANGEFS_ATTR_SYS_CTIME (1 << 4)
|
|
#define ORANGEFS_ATTR_SYS_MTIME (1 << 5)
|
|
#define ORANGEFS_ATTR_SYS_TYPE (1 << 6)
|
|
#define ORANGEFS_ATTR_SYS_ATIME_SET (1 << 7)
|
|
#define ORANGEFS_ATTR_SYS_MTIME_SET (1 << 8)
|
|
#define ORANGEFS_ATTR_SYS_SIZE (1 << 20)
|
|
#define ORANGEFS_ATTR_SYS_LNK_TARGET (1 << 24)
|
|
#define ORANGEFS_ATTR_SYS_DFILE_COUNT (1 << 25)
|
|
#define ORANGEFS_ATTR_SYS_DIRENT_COUNT (1 << 26)
|
|
#define ORANGEFS_ATTR_SYS_BLKSIZE (1 << 28)
|
|
#define ORANGEFS_ATTR_SYS_MIRROR_COPIES_COUNT (1 << 29)
|
|
#define ORANGEFS_ATTR_SYS_COMMON_ALL \
|
|
(ORANGEFS_ATTR_SYS_UID | \
|
|
ORANGEFS_ATTR_SYS_GID | \
|
|
ORANGEFS_ATTR_SYS_PERM | \
|
|
ORANGEFS_ATTR_SYS_ATIME | \
|
|
ORANGEFS_ATTR_SYS_CTIME | \
|
|
ORANGEFS_ATTR_SYS_MTIME | \
|
|
ORANGEFS_ATTR_SYS_TYPE)
|
|
|
|
#define ORANGEFS_ATTR_SYS_ALL_SETABLE \
|
|
(ORANGEFS_ATTR_SYS_COMMON_ALL-ORANGEFS_ATTR_SYS_TYPE)
|
|
|
|
#define ORANGEFS_ATTR_SYS_ALL_NOHINT \
|
|
(ORANGEFS_ATTR_SYS_COMMON_ALL | \
|
|
ORANGEFS_ATTR_SYS_SIZE | \
|
|
ORANGEFS_ATTR_SYS_LNK_TARGET | \
|
|
ORANGEFS_ATTR_SYS_DFILE_COUNT | \
|
|
ORANGEFS_ATTR_SYS_MIRROR_COPIES_COUNT | \
|
|
ORANGEFS_ATTR_SYS_DIRENT_COUNT | \
|
|
ORANGEFS_ATTR_SYS_BLKSIZE)
|
|
|
|
#define ORANGEFS_XATTR_REPLACE 0x2
|
|
#define ORANGEFS_XATTR_CREATE 0x1
|
|
#define ORANGEFS_MAX_SERVER_ADDR_LEN 256
|
|
#define ORANGEFS_NAME_MAX 256
|
|
/*
|
|
* max extended attribute name len as imposed by the VFS and exploited for the
|
|
* upcall request types.
|
|
* NOTE: Please retain them as multiples of 8 even if you wish to change them
|
|
* This is *NECESSARY* for supporting 32 bit user-space binaries on a 64-bit
|
|
* kernel. Due to implementation within DBPF, this really needs to be
|
|
* ORANGEFS_NAME_MAX, which it was the same value as, but no reason to let it
|
|
* break if that changes in the future.
|
|
*/
|
|
#define ORANGEFS_MAX_XATTR_NAMELEN ORANGEFS_NAME_MAX /* Not the same as
|
|
* XATTR_NAME_MAX defined
|
|
* by <linux/xattr.h>
|
|
*/
|
|
#define ORANGEFS_MAX_XATTR_VALUELEN 8192 /* Not the same as XATTR_SIZE_MAX
|
|
* defined by <linux/xattr.h>
|
|
*/
|
|
#define ORANGEFS_MAX_XATTR_LISTLEN 16 /* Not the same as XATTR_LIST_MAX
|
|
* defined by <linux/xattr.h>
|
|
*/
|
|
/*
|
|
* ORANGEFS I/O operation types, used in both system and server interfaces.
|
|
*/
|
|
enum ORANGEFS_io_type {
|
|
ORANGEFS_IO_READ = 1,
|
|
ORANGEFS_IO_WRITE = 2
|
|
};
|
|
|
|
/*
|
|
* If this enum is modified the server parameters related to the precreate pool
|
|
* batch and low threshold sizes may need to be modified to reflect this
|
|
* change.
|
|
*/
|
|
enum orangefs_ds_type {
|
|
ORANGEFS_TYPE_NONE = 0,
|
|
ORANGEFS_TYPE_METAFILE = (1 << 0),
|
|
ORANGEFS_TYPE_DATAFILE = (1 << 1),
|
|
ORANGEFS_TYPE_DIRECTORY = (1 << 2),
|
|
ORANGEFS_TYPE_SYMLINK = (1 << 3),
|
|
ORANGEFS_TYPE_DIRDATA = (1 << 4),
|
|
ORANGEFS_TYPE_INTERNAL = (1 << 5) /* for the server's private use */
|
|
};
|
|
|
|
/* This structure is used by the VFS-client interaction alone */
|
|
struct ORANGEFS_keyval_pair {
|
|
char key[ORANGEFS_MAX_XATTR_NAMELEN];
|
|
__s32 key_sz; /* __s32 for portable, fixed-size structures */
|
|
__s32 val_sz;
|
|
char val[ORANGEFS_MAX_XATTR_VALUELEN];
|
|
};
|
|
|
|
/* pvfs2-sysint.h ***********************************************************/
|
|
/* Describes attributes for a file, directory, or symlink. */
|
|
struct ORANGEFS_sys_attr_s {
|
|
__u32 owner;
|
|
__u32 group;
|
|
__u32 perms;
|
|
__u64 atime;
|
|
__u64 mtime;
|
|
__u64 ctime;
|
|
__s64 size;
|
|
|
|
/* NOTE: caller must free if valid */
|
|
char *link_target;
|
|
|
|
/* Changed to __s32 so that size of structure does not change */
|
|
__s32 dfile_count;
|
|
|
|
/* Changed to __s32 so that size of structure does not change */
|
|
__s32 distr_dir_servers_initial;
|
|
|
|
/* Changed to __s32 so that size of structure does not change */
|
|
__s32 distr_dir_servers_max;
|
|
|
|
/* Changed to __s32 so that size of structure does not change */
|
|
__s32 distr_dir_split_size;
|
|
|
|
__u32 mirror_copies_count;
|
|
|
|
/* NOTE: caller must free if valid */
|
|
char *dist_name;
|
|
|
|
/* NOTE: caller must free if valid */
|
|
char *dist_params;
|
|
|
|
__s64 dirent_count;
|
|
enum orangefs_ds_type objtype;
|
|
__u64 flags;
|
|
__u32 mask;
|
|
__s64 blksize;
|
|
};
|
|
|
|
#define ORANGEFS_LOOKUP_LINK_NO_FOLLOW 0
|
|
|
|
/* pint-dev.h ***************************************************************/
|
|
|
|
/* parameter structure used in ORANGEFS_DEV_DEBUG ioctl command */
|
|
struct dev_mask_info_s {
|
|
enum {
|
|
KERNEL_MASK,
|
|
CLIENT_MASK,
|
|
} mask_type;
|
|
__u64 mask_value;
|
|
};
|
|
|
|
struct dev_mask2_info_s {
|
|
__u64 mask1_value;
|
|
__u64 mask2_value;
|
|
};
|
|
|
|
/* pvfs2-util.h *************************************************************/
|
|
__s32 ORANGEFS_util_translate_mode(int mode);
|
|
|
|
/* pvfs2-debug.h ************************************************************/
|
|
#include "orangefs-debug.h"
|
|
|
|
/* pvfs2-internal.h *********************************************************/
|
|
#define llu(x) (unsigned long long)(x)
|
|
#define lld(x) (long long)(x)
|
|
|
|
/* pint-dev-shared.h ********************************************************/
|
|
#define ORANGEFS_DEV_MAGIC 'k'
|
|
|
|
#define ORANGEFS_READDIR_DEFAULT_DESC_COUNT 5
|
|
|
|
#define DEV_GET_MAGIC 0x1
|
|
#define DEV_GET_MAX_UPSIZE 0x2
|
|
#define DEV_GET_MAX_DOWNSIZE 0x3
|
|
#define DEV_MAP 0x4
|
|
#define DEV_REMOUNT_ALL 0x5
|
|
#define DEV_DEBUG 0x6
|
|
#define DEV_UPSTREAM 0x7
|
|
#define DEV_CLIENT_MASK 0x8
|
|
#define DEV_CLIENT_STRING 0x9
|
|
#define DEV_MAX_NR 0xa
|
|
|
|
/* supported ioctls, codes are with respect to user-space */
|
|
enum {
|
|
ORANGEFS_DEV_GET_MAGIC = _IOW(ORANGEFS_DEV_MAGIC, DEV_GET_MAGIC, __s32),
|
|
ORANGEFS_DEV_GET_MAX_UPSIZE =
|
|
_IOW(ORANGEFS_DEV_MAGIC, DEV_GET_MAX_UPSIZE, __s32),
|
|
ORANGEFS_DEV_GET_MAX_DOWNSIZE =
|
|
_IOW(ORANGEFS_DEV_MAGIC, DEV_GET_MAX_DOWNSIZE, __s32),
|
|
ORANGEFS_DEV_MAP = _IO(ORANGEFS_DEV_MAGIC, DEV_MAP),
|
|
ORANGEFS_DEV_REMOUNT_ALL = _IO(ORANGEFS_DEV_MAGIC, DEV_REMOUNT_ALL),
|
|
ORANGEFS_DEV_DEBUG = _IOR(ORANGEFS_DEV_MAGIC, DEV_DEBUG, __s32),
|
|
ORANGEFS_DEV_UPSTREAM = _IOW(ORANGEFS_DEV_MAGIC, DEV_UPSTREAM, int),
|
|
ORANGEFS_DEV_CLIENT_MASK = _IOW(ORANGEFS_DEV_MAGIC,
|
|
DEV_CLIENT_MASK,
|
|
struct dev_mask2_info_s),
|
|
ORANGEFS_DEV_CLIENT_STRING = _IOW(ORANGEFS_DEV_MAGIC,
|
|
DEV_CLIENT_STRING,
|
|
char *),
|
|
ORANGEFS_DEV_MAXNR = DEV_MAX_NR,
|
|
};
|
|
|
|
/*
|
|
* version number for use in communicating between kernel space and user
|
|
* space. Zero signifies the upstream version of the kernel module.
|
|
*/
|
|
#define ORANGEFS_KERNEL_PROTO_VERSION 0
|
|
#define ORANGEFS_MINIMUM_USERSPACE_VERSION 20903
|
|
|
|
/*
|
|
* describes memory regions to map in the ORANGEFS_DEV_MAP ioctl.
|
|
* NOTE: See devorangefs-req.c for 32 bit compat structure.
|
|
* Since this structure has a variable-sized layout that is different
|
|
* on 32 and 64 bit platforms, we need to normalize to a 64 bit layout
|
|
* on such systems before servicing ioctl calls from user-space binaries
|
|
* that may be 32 bit!
|
|
*/
|
|
struct ORANGEFS_dev_map_desc {
|
|
void __user *ptr;
|
|
__s32 total_size;
|
|
__s32 size;
|
|
__s32 count;
|
|
};
|
|
|
|
/* gossip.h *****************************************************************/
|
|
|
|
extern __u64 orangefs_gossip_debug_mask;
|
|
|
|
/* try to avoid function call overhead by checking masks in macro */
|
|
#define gossip_debug(mask, fmt, ...) \
|
|
do { \
|
|
if (orangefs_gossip_debug_mask & (mask)) \
|
|
printk(KERN_DEBUG fmt, ##__VA_ARGS__); \
|
|
} while (0)
|
|
|
|
#define gossip_err pr_err
|