Commit eca281aa authored by Linus Torvalds's avatar Linus Torvalds

Merge branch 'upstream-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/jlbec/ocfs2

* 'upstream-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/jlbec/ocfs2: (36 commits)
  Ocfs2: Move ocfs2 ioctl definitions from ocfs2_fs.h to newly added ocfs2_ioctl.h
  ocfs2: send SIGXFSZ if new filesize exceeds limit -v2
  ocfs2/userdlm: Add tracing in userdlm
  ocfs2: Use a separate masklog for AST and BASTs
  dlm: allow dlm do recovery during shutdown
  ocfs2: Only bug out in direct io write for reflinked extent.
  ocfs2: fix warning in ocfs2_file_aio_write()
  ocfs2_dlmfs: Enable the use of user cluster stacks.
  ocfs2_dlmfs: Use the stackglue.
  ocfs2_dlmfs: Don't honor truncate.  The size of a dlmfs file is LVB_LEN
  ocfs2: Pass the locking protocol into ocfs2_cluster_connect().
  ocfs2: Remove the ast pointers from ocfs2_stack_plugins
  ocfs2: Hang the locking proto on the cluster conn and use it in asts.
  ocfs2: Attach the connection to the lksb
  ocfs2: Pass lksbs back from stackglue ast/bast functions.
  ocfs2_dlmfs: Move to its own directory
  ocfs2_dlmfs: Use poll() to signify BASTs.
  ocfs2_dlmfs: Add capabilities parameter.
  ocfs2: Handle errors while setting external xattr values.
  ocfs2: Set inline xattr entries with ocfs2_xa_set()
  ...
parents 7f5b09c1 9df5778e
...@@ -46,6 +46,7 @@ ocfs2_stackglue-objs := stackglue.o ...@@ -46,6 +46,7 @@ ocfs2_stackglue-objs := stackglue.o
ocfs2_stack_o2cb-objs := stack_o2cb.o ocfs2_stack_o2cb-objs := stack_o2cb.o
ocfs2_stack_user-objs := stack_user.o ocfs2_stack_user-objs := stack_user.o
obj-$(CONFIG_OCFS2_FS) += dlmfs/
# cluster/ is always needed when OCFS2_FS for masklog support # cluster/ is always needed when OCFS2_FS for masklog support
obj-$(CONFIG_OCFS2_FS) += cluster/ obj-$(CONFIG_OCFS2_FS) += cluster/
obj-$(CONFIG_OCFS2_FS_O2CB) += dlm/ obj-$(CONFIG_OCFS2_FS_O2CB) += dlm/
...@@ -1050,7 +1050,8 @@ static int ocfs2_create_new_meta_bhs(handle_t *handle, ...@@ -1050,7 +1050,8 @@ static int ocfs2_create_new_meta_bhs(handle_t *handle,
strcpy(eb->h_signature, OCFS2_EXTENT_BLOCK_SIGNATURE); strcpy(eb->h_signature, OCFS2_EXTENT_BLOCK_SIGNATURE);
eb->h_blkno = cpu_to_le64(first_blkno); eb->h_blkno = cpu_to_le64(first_blkno);
eb->h_fs_generation = cpu_to_le32(osb->fs_generation); eb->h_fs_generation = cpu_to_le32(osb->fs_generation);
eb->h_suballoc_slot = cpu_to_le16(osb->slot_num); eb->h_suballoc_slot =
cpu_to_le16(meta_ac->ac_alloc_slot);
eb->h_suballoc_bit = cpu_to_le16(suballoc_bit_start); eb->h_suballoc_bit = cpu_to_le16(suballoc_bit_start);
eb->h_list.l_count = eb->h_list.l_count =
cpu_to_le16(ocfs2_extent_recs_per_eb(osb->sb)); cpu_to_le16(ocfs2_extent_recs_per_eb(osb->sb));
...@@ -6037,7 +6038,7 @@ static void ocfs2_truncate_log_worker(struct work_struct *work) ...@@ -6037,7 +6038,7 @@ static void ocfs2_truncate_log_worker(struct work_struct *work)
if (status < 0) if (status < 0)
mlog_errno(status); mlog_errno(status);
else else
ocfs2_init_inode_steal_slot(osb); ocfs2_init_steal_slots(osb);
mlog_exit(status); mlog_exit(status);
} }
......
...@@ -577,8 +577,9 @@ static int ocfs2_direct_IO_get_blocks(struct inode *inode, sector_t iblock, ...@@ -577,8 +577,9 @@ static int ocfs2_direct_IO_get_blocks(struct inode *inode, sector_t iblock,
goto bail; goto bail;
} }
/* We should already CoW the refcounted extent. */ /* We should already CoW the refcounted extent in case of create. */
BUG_ON(ext_flags & OCFS2_EXT_REFCOUNTED); BUG_ON(create && (ext_flags & OCFS2_EXT_REFCOUNTED));
/* /*
* get_more_blocks() expects us to describe a hole by clearing * get_more_blocks() expects us to describe a hole by clearing
* the mapped bit on bh_result(). * the mapped bit on bh_result().
......
...@@ -112,6 +112,7 @@ static struct mlog_attribute mlog_attrs[MLOG_MAX_BITS] = { ...@@ -112,6 +112,7 @@ static struct mlog_attribute mlog_attrs[MLOG_MAX_BITS] = {
define_mask(XATTR), define_mask(XATTR),
define_mask(QUOTA), define_mask(QUOTA),
define_mask(REFCOUNT), define_mask(REFCOUNT),
define_mask(BASTS),
define_mask(ERROR), define_mask(ERROR),
define_mask(NOTICE), define_mask(NOTICE),
define_mask(KTHREAD), define_mask(KTHREAD),
......
...@@ -114,6 +114,7 @@ ...@@ -114,6 +114,7 @@
#define ML_XATTR 0x0000000020000000ULL /* ocfs2 extended attributes */ #define ML_XATTR 0x0000000020000000ULL /* ocfs2 extended attributes */
#define ML_QUOTA 0x0000000040000000ULL /* ocfs2 quota operations */ #define ML_QUOTA 0x0000000040000000ULL /* ocfs2 quota operations */
#define ML_REFCOUNT 0x0000000080000000ULL /* refcount tree operations */ #define ML_REFCOUNT 0x0000000080000000ULL /* refcount tree operations */
#define ML_BASTS 0x0000001000000000ULL /* dlmglue asts and basts */
/* bits that are infrequently given and frequently matched in the high word */ /* bits that are infrequently given and frequently matched in the high word */
#define ML_ERROR 0x0000000100000000ULL /* sent to KERN_ERR */ #define ML_ERROR 0x0000000100000000ULL /* sent to KERN_ERR */
#define ML_NOTICE 0x0000000200000000ULL /* setn to KERN_NOTICE */ #define ML_NOTICE 0x0000000200000000ULL /* setn to KERN_NOTICE */
...@@ -194,9 +195,9 @@ extern struct mlog_bits mlog_and_bits, mlog_not_bits; ...@@ -194,9 +195,9 @@ extern struct mlog_bits mlog_and_bits, mlog_not_bits;
* previous token if args expands to nothing. * previous token if args expands to nothing.
*/ */
#define __mlog_printk(level, fmt, args...) \ #define __mlog_printk(level, fmt, args...) \
printk(level "(%u,%lu):%s:%d " fmt, task_pid_nr(current), \ printk(level "(%s,%u,%lu):%s:%d " fmt, current->comm, \
__mlog_cpu_guess, __PRETTY_FUNCTION__, __LINE__ , \ task_pid_nr(current), __mlog_cpu_guess, \
##args) __PRETTY_FUNCTION__, __LINE__ , ##args)
#define mlog(mask, fmt, args...) do { \ #define mlog(mask, fmt, args...) do { \
u64 __m = MLOG_MASK_PREFIX | (mask); \ u64 __m = MLOG_MASK_PREFIX | (mask); \
......
...@@ -2439,7 +2439,7 @@ static int ocfs2_dx_dir_attach_index(struct ocfs2_super *osb, ...@@ -2439,7 +2439,7 @@ static int ocfs2_dx_dir_attach_index(struct ocfs2_super *osb,
dx_root = (struct ocfs2_dx_root_block *)dx_root_bh->b_data; dx_root = (struct ocfs2_dx_root_block *)dx_root_bh->b_data;
memset(dx_root, 0, osb->sb->s_blocksize); memset(dx_root, 0, osb->sb->s_blocksize);
strcpy(dx_root->dr_signature, OCFS2_DX_ROOT_SIGNATURE); strcpy(dx_root->dr_signature, OCFS2_DX_ROOT_SIGNATURE);
dx_root->dr_suballoc_slot = cpu_to_le16(osb->slot_num); dx_root->dr_suballoc_slot = cpu_to_le16(meta_ac->ac_alloc_slot);
dx_root->dr_suballoc_bit = cpu_to_le16(dr_suballoc_bit); dx_root->dr_suballoc_bit = cpu_to_le16(dr_suballoc_bit);
dx_root->dr_fs_generation = cpu_to_le32(osb->fs_generation); dx_root->dr_fs_generation = cpu_to_le32(osb->fs_generation);
dx_root->dr_blkno = cpu_to_le64(dr_blkno); dx_root->dr_blkno = cpu_to_le64(dr_blkno);
......
EXTRA_CFLAGS += -Ifs/ocfs2 EXTRA_CFLAGS += -Ifs/ocfs2
obj-$(CONFIG_OCFS2_FS_O2CB) += ocfs2_dlm.o ocfs2_dlmfs.o obj-$(CONFIG_OCFS2_FS_O2CB) += ocfs2_dlm.o
ocfs2_dlm-objs := dlmdomain.o dlmdebug.o dlmthread.o dlmrecovery.o \ ocfs2_dlm-objs := dlmdomain.o dlmdebug.o dlmthread.o dlmrecovery.o \
dlmmaster.o dlmast.o dlmconvert.o dlmlock.o dlmunlock.o dlmver.o dlmmaster.o dlmast.o dlmconvert.o dlmlock.o dlmunlock.o dlmver.o
ocfs2_dlmfs-objs := userdlm.o dlmfs.o dlmfsver.o
...@@ -310,7 +310,7 @@ static int dlm_recovery_thread(void *data) ...@@ -310,7 +310,7 @@ static int dlm_recovery_thread(void *data)
mlog(0, "dlm thread running for %s...\n", dlm->name); mlog(0, "dlm thread running for %s...\n", dlm->name);
while (!kthread_should_stop()) { while (!kthread_should_stop()) {
if (dlm_joined(dlm)) { if (dlm_domain_fully_joined(dlm)) {
status = dlm_do_recovery(dlm); status = dlm_do_recovery(dlm);
if (status == -EAGAIN) { if (status == -EAGAIN) {
/* do not sleep, recheck immediately. */ /* do not sleep, recheck immediately. */
......
EXTRA_CFLAGS += -Ifs/ocfs2
obj-$(CONFIG_OCFS2_FS) += ocfs2_dlmfs.o
ocfs2_dlmfs-objs := userdlm.o dlmfs.o dlmfsver.o
...@@ -43,24 +43,17 @@ ...@@ -43,24 +43,17 @@
#include <linux/init.h> #include <linux/init.h>
#include <linux/string.h> #include <linux/string.h>
#include <linux/backing-dev.h> #include <linux/backing-dev.h>
#include <linux/poll.h>
#include <asm/uaccess.h> #include <asm/uaccess.h>
#include "stackglue.h"
#include "cluster/nodemanager.h"
#include "cluster/heartbeat.h"
#include "cluster/tcp.h"
#include "dlmapi.h"
#include "userdlm.h" #include "userdlm.h"
#include "dlmfsver.h" #include "dlmfsver.h"
#define MLOG_MASK_PREFIX ML_DLMFS #define MLOG_MASK_PREFIX ML_DLMFS
#include "cluster/masklog.h" #include "cluster/masklog.h"
#include "ocfs2_lockingver.h"
static const struct super_operations dlmfs_ops; static const struct super_operations dlmfs_ops;
static const struct file_operations dlmfs_file_operations; static const struct file_operations dlmfs_file_operations;
...@@ -71,15 +64,46 @@ static struct kmem_cache *dlmfs_inode_cache; ...@@ -71,15 +64,46 @@ static struct kmem_cache *dlmfs_inode_cache;
struct workqueue_struct *user_dlm_worker; struct workqueue_struct *user_dlm_worker;
/* /*
* This is the userdlmfs locking protocol version. * These are the ABI capabilities of dlmfs.
*
* Over time, dlmfs has added some features that were not part of the
* initial ABI. Unfortunately, some of these features are not detectable
* via standard usage. For example, Linux's default poll always returns
* POLLIN, so there is no way for a caller of poll(2) to know when dlmfs
* added poll support. Instead, we provide this list of new capabilities.
*
* Capabilities is a read-only attribute. We do it as a module parameter
* so we can discover it whether dlmfs is built in, loaded, or even not
* loaded.
* *
* See fs/ocfs2/dlmglue.c for more details on locking versions. * The ABI features are local to this machine's dlmfs mount. This is
* distinct from the locking protocol, which is concerned with inter-node
* interaction.
*
* Capabilities:
* - bast : POLLIN against the file descriptor of a held lock
* signifies a bast fired on the lock.
*/ */
static const struct dlm_protocol_version user_locking_protocol = { #define DLMFS_CAPABILITIES "bast stackglue"
.pv_major = OCFS2_LOCKING_PROTOCOL_MAJOR, extern int param_set_dlmfs_capabilities(const char *val,
.pv_minor = OCFS2_LOCKING_PROTOCOL_MINOR, struct kernel_param *kp)
}; {
printk(KERN_ERR "%s: readonly parameter\n", kp->name);
return -EINVAL;
}
static int param_get_dlmfs_capabilities(char *buffer,
struct kernel_param *kp)
{
return strlcpy(buffer, DLMFS_CAPABILITIES,
strlen(DLMFS_CAPABILITIES) + 1);
}
module_param_call(capabilities, param_set_dlmfs_capabilities,
param_get_dlmfs_capabilities, NULL, 0444);
MODULE_PARM_DESC(capabilities, DLMFS_CAPABILITIES);
/* /*
* decodes a set of open flags into a valid lock level and a set of flags. * decodes a set of open flags into a valid lock level and a set of flags.
...@@ -179,13 +203,46 @@ static int dlmfs_file_release(struct inode *inode, ...@@ -179,13 +203,46 @@ static int dlmfs_file_release(struct inode *inode,
return 0; return 0;
} }
/*
* We do ->setattr() just to override size changes. Our size is the size
* of the LVB and nothing else.
*/
static int dlmfs_file_setattr(struct dentry *dentry, struct iattr *attr)
{
int error;
struct inode *inode = dentry->d_inode;
attr->ia_valid &= ~ATTR_SIZE;
error = inode_change_ok(inode, attr);
if (!error)
error = inode_setattr(inode, attr);
return error;
}
static unsigned int dlmfs_file_poll(struct file *file, poll_table *wait)
{
int event = 0;
struct inode *inode = file->f_path.dentry->d_inode;
struct dlmfs_inode_private *ip = DLMFS_I(inode);
poll_wait(file, &ip->ip_lockres.l_event, wait);
spin_lock(&ip->ip_lockres.l_lock);
if (ip->ip_lockres.l_flags & USER_LOCK_BLOCKED)
event = POLLIN | POLLRDNORM;
spin_unlock(&ip->ip_lockres.l_lock);
return event;
}
static ssize_t dlmfs_file_read(struct file *filp, static ssize_t dlmfs_file_read(struct file *filp,
char __user *buf, char __user *buf,
size_t count, size_t count,
loff_t *ppos) loff_t *ppos)
{ {
int bytes_left; int bytes_left;
ssize_t readlen; ssize_t readlen, got;
char *lvb_buf; char *lvb_buf;
struct inode *inode = filp->f_path.dentry->d_inode; struct inode *inode = filp->f_path.dentry->d_inode;
...@@ -211,9 +268,13 @@ static ssize_t dlmfs_file_read(struct file *filp, ...@@ -211,9 +268,13 @@ static ssize_t dlmfs_file_read(struct file *filp,
if (!lvb_buf) if (!lvb_buf)
return -ENOMEM; return -ENOMEM;
user_dlm_read_lvb(inode, lvb_buf, readlen); got = user_dlm_read_lvb(inode, lvb_buf, readlen);
bytes_left = __copy_to_user(buf, lvb_buf, readlen); if (got) {
readlen -= bytes_left; BUG_ON(got != readlen);
bytes_left = __copy_to_user(buf, lvb_buf, readlen);
readlen -= bytes_left;
} else
readlen = 0;
kfree(lvb_buf); kfree(lvb_buf);
...@@ -272,7 +333,7 @@ static void dlmfs_init_once(void *foo) ...@@ -272,7 +333,7 @@ static void dlmfs_init_once(void *foo)
struct dlmfs_inode_private *ip = struct dlmfs_inode_private *ip =
(struct dlmfs_inode_private *) foo; (struct dlmfs_inode_private *) foo;
ip->ip_dlm = NULL; ip->ip_conn = NULL;
ip->ip_parent = NULL; ip->ip_parent = NULL;
inode_init_once(&ip->ip_vfs_inode); inode_init_once(&ip->ip_vfs_inode);
...@@ -314,14 +375,14 @@ static void dlmfs_clear_inode(struct inode *inode) ...@@ -314,14 +375,14 @@ static void dlmfs_clear_inode(struct inode *inode)
goto clear_fields; goto clear_fields;
} }
mlog(0, "we're a directory, ip->ip_dlm = 0x%p\n", ip->ip_dlm); mlog(0, "we're a directory, ip->ip_conn = 0x%p\n", ip->ip_conn);
/* we must be a directory. If required, lets unregister the /* we must be a directory. If required, lets unregister the
* dlm context now. */ * dlm context now. */
if (ip->ip_dlm) if (ip->ip_conn)
user_dlm_unregister_context(ip->ip_dlm); user_dlm_unregister(ip->ip_conn);
clear_fields: clear_fields:
ip->ip_parent = NULL; ip->ip_parent = NULL;
ip->ip_dlm = NULL; ip->ip_conn = NULL;
} }
static struct backing_dev_info dlmfs_backing_dev_info = { static struct backing_dev_info dlmfs_backing_dev_info = {
...@@ -371,7 +432,7 @@ static struct inode *dlmfs_get_inode(struct inode *parent, ...@@ -371,7 +432,7 @@ static struct inode *dlmfs_get_inode(struct inode *parent,
inode->i_atime = inode->i_mtime = inode->i_ctime = CURRENT_TIME; inode->i_atime = inode->i_mtime = inode->i_ctime = CURRENT_TIME;
ip = DLMFS_I(inode); ip = DLMFS_I(inode);
ip->ip_dlm = DLMFS_I(parent)->ip_dlm; ip->ip_conn = DLMFS_I(parent)->ip_conn;
switch (mode & S_IFMT) { switch (mode & S_IFMT) {
default: default:
...@@ -425,13 +486,12 @@ static int dlmfs_mkdir(struct inode * dir, ...@@ -425,13 +486,12 @@ static int dlmfs_mkdir(struct inode * dir,
struct inode *inode = NULL; struct inode *inode = NULL;
struct qstr *domain = &dentry->d_name; struct qstr *domain = &dentry->d_name;
struct dlmfs_inode_private *ip; struct dlmfs_inode_private *ip;
struct dlm_ctxt *dlm; struct ocfs2_cluster_connection *conn;
struct dlm_protocol_version proto = user_locking_protocol;
mlog(0, "mkdir %.*s\n", domain->len, domain->name); mlog(0, "mkdir %.*s\n", domain->len, domain->name);
/* verify that we have a proper domain */ /* verify that we have a proper domain */
if (domain->len >= O2NM_MAX_NAME_LEN) { if (domain->len >= GROUP_NAME_MAX) {
status = -EINVAL; status = -EINVAL;
mlog(ML_ERROR, "invalid domain name for directory.\n"); mlog(ML_ERROR, "invalid domain name for directory.\n");
goto bail; goto bail;
...@@ -446,14 +506,14 @@ static int dlmfs_mkdir(struct inode * dir, ...@@ -446,14 +506,14 @@ static int dlmfs_mkdir(struct inode * dir,
ip = DLMFS_I(inode); ip = DLMFS_I(inode);
dlm = user_dlm_register_context(domain, &proto); conn = user_dlm_register(domain);
if (IS_ERR(dlm)) { if (IS_ERR(conn)) {
status = PTR_ERR(dlm); status = PTR_ERR(conn);
mlog(ML_ERROR, "Error %d could not register domain \"%.*s\"\n", mlog(ML_ERROR, "Error %d could not register domain \"%.*s\"\n",
status, domain->len, domain->name); status, domain->len, domain->name);
goto bail; goto bail;
} }
ip->ip_dlm = dlm; ip->ip_conn = conn;
inc_nlink(dir); inc_nlink(dir);
d_instantiate(dentry, inode); d_instantiate(dentry, inode);
...@@ -549,6 +609,7 @@ static int dlmfs_fill_super(struct super_block * sb, ...@@ -549,6 +609,7 @@ static int dlmfs_fill_super(struct super_block * sb,
static const struct file_operations dlmfs_file_operations = { static const struct file_operations dlmfs_file_operations = {
.open = dlmfs_file_open, .open = dlmfs_file_open,
.release = dlmfs_file_release, .release = dlmfs_file_release,
.poll = dlmfs_file_poll,
.read = dlmfs_file_read, .read = dlmfs_file_read,
.write = dlmfs_file_write, .write = dlmfs_file_write,
}; };
...@@ -576,6 +637,7 @@ static const struct super_operations dlmfs_ops = { ...@@ -576,6 +637,7 @@ static const struct super_operations dlmfs_ops = {
static const struct inode_operations dlmfs_file_inode_operations = { static const struct inode_operations dlmfs_file_inode_operations = {
.getattr = simple_getattr, .getattr = simple_getattr,
.setattr = dlmfs_file_setattr,
}; };
static int dlmfs_get_sb(struct file_system_type *fs_type, static int dlmfs_get_sb(struct file_system_type *fs_type,
...@@ -620,6 +682,7 @@ static int __init init_dlmfs_fs(void) ...@@ -620,6 +682,7 @@ static int __init init_dlmfs_fs(void)
} }
cleanup_worker = 1; cleanup_worker = 1;
user_dlm_set_locking_protocol();
status = register_filesystem(&dlmfs_fs_type); status = register_filesystem(&dlmfs_fs_type);
bail: bail:
if (status) { if (status) {
......
...@@ -57,7 +57,7 @@ struct user_lock_res { ...@@ -57,7 +57,7 @@ struct user_lock_res {
int l_level; int l_level;
unsigned int l_ro_holders; unsigned int l_ro_holders;
unsigned int l_ex_holders; unsigned int l_ex_holders;
struct dlm_lockstatus l_lksb; struct ocfs2_dlm_lksb l_lksb;
int l_requested; int l_requested;
int l_blocking; int l_blocking;
...@@ -80,15 +80,15 @@ void user_dlm_cluster_unlock(struct user_lock_res *lockres, ...@@ -80,15 +80,15 @@ void user_dlm_cluster_unlock(struct user_lock_res *lockres,
void user_dlm_write_lvb(struct inode *inode, void user_dlm_write_lvb(struct inode *inode,
const char *val, const char *val,
unsigned int len); unsigned int len);
void user_dlm_read_lvb(struct inode *inode, ssize_t user_dlm_read_lvb(struct inode *inode,
char *val, char *val,
unsigned int len); unsigned int len);
struct dlm_ctxt *user_dlm_register_context(struct qstr *name, struct ocfs2_cluster_connection *user_dlm_register(struct qstr *name);
struct dlm_protocol_version *proto); void user_dlm_unregister(struct ocfs2_cluster_connection *conn);
void user_dlm_unregister_context(struct dlm_ctxt *dlm); void user_dlm_set_locking_protocol(void);
struct dlmfs_inode_private { struct dlmfs_inode_private {
struct dlm_ctxt *ip_dlm; struct ocfs2_cluster_connection *ip_conn;
struct user_lock_res ip_lockres; /* unused for directories. */ struct user_lock_res ip_lockres; /* unused for directories. */
struct inode *ip_parent; struct inode *ip_parent;
......
This diff is collapsed.
...@@ -993,10 +993,9 @@ int ocfs2_setattr(struct dentry *dentry, struct iattr *attr) ...@@ -993,10 +993,9 @@ int ocfs2_setattr(struct dentry *dentry, struct iattr *attr)
} }
if (size_change && attr->ia_size != i_size_read(inode)) { if (size_change && attr->ia_size != i_size_read(inode)) {
if (attr->ia_size > sb->s_maxbytes) { status = inode_newsize_ok(inode, attr->ia_size);
status = -EFBIG; if (status)
goto bail_unlock; goto bail_unlock;
}
if (i_size_read(inode) > attr->ia_size) { if (i_size_read(inode) > attr->ia_size) {
if (ocfs2_should_order_data(inode)) { if (ocfs2_should_order_data(inode)) {
...@@ -1836,6 +1835,8 @@ static int ocfs2_prepare_inode_for_write(struct dentry *dentry, ...@@ -1836,6 +1835,8 @@ static int ocfs2_prepare_inode_for_write(struct dentry *dentry,
&meta_level); &meta_level);
if (has_refcount) if (has_refcount)
*has_refcount = 1; *has_refcount = 1;
if (direct_io)
*direct_io = 0;
} }
if (ret < 0) { if (ret < 0) {
...@@ -1859,10 +1860,6 @@ static int ocfs2_prepare_inode_for_write(struct dentry *dentry, ...@@ -1859,10 +1860,6 @@ static int ocfs2_prepare_inode_for_write(struct dentry *dentry,
break; break;
} }
if (has_refcount && *has_refcount == 1) {
*direct_io = 0;
break;
}
/* /*
* Allowing concurrent direct writes means * Allowing concurrent direct writes means
* i_size changes wouldn't be synchronized, so * i_size changes wouldn't be synchronized, so
...@@ -2043,7 +2040,7 @@ static ssize_t ocfs2_file_aio_write(struct kiocb *iocb, ...@@ -2043,7 +2040,7 @@ static ssize_t ocfs2_file_aio_write(struct kiocb *iocb,
* async dio is going to do it in the future or an end_io after an * async dio is going to do it in the future or an end_io after an
* error has already done it. * error has already done it.
*/ */
if (ret == -EIOCBQUEUED || !ocfs2_iocb_is_rw_locked(iocb)) { if ((ret == -EIOCBQUEUED) || (!ocfs2_iocb_is_rw_locked(iocb))) {
rw_level = -1; rw_level = -1;
have_alloc_sem = 0; have_alloc_sem = 0;
} }
......
...@@ -7,10 +7,10 @@ ...@@ -7,10 +7,10 @@
* *
*/ */
#ifndef OCFS2_IOCTL_H #ifndef OCFS2_IOCTL_PROTO_H
#define OCFS2_IOCTL_H #define OCFS2_IOCTL_PROTO_H
long ocfs2_ioctl(struct file *filp, unsigned int cmd, unsigned long arg); long ocfs2_ioctl(struct file *filp, unsigned int cmd, unsigned long arg);
long ocfs2_compat_ioctl(struct file *file, unsigned cmd, unsigned long arg); long ocfs2_compat_ioctl(struct file *file, unsigned cmd, unsigned long arg);
#endif /* OCFS2_IOCTL_H */ #endif /* OCFS2_IOCTL_PROTO_H */
...@@ -476,7 +476,7 @@ int ocfs2_complete_local_alloc_recovery(struct ocfs2_super *osb, ...@@ -476,7 +476,7 @@ int ocfs2_complete_local_alloc_recovery(struct ocfs2_super *osb,
out: out:
if (!status) if (!status)
ocfs2_init_inode_steal_slot(osb); ocfs2_init_steal_slots(osb);
mlog_exit(status); mlog_exit(status);
return status; return status;
} }
......
...@@ -42,6 +42,7 @@ ...@@ -42,6 +42,7 @@
#include "ocfs2_fs.h" #include "ocfs2_fs.h"
#include "ocfs2_lockid.h" #include "ocfs2_lockid.h"
#include "ocfs2_ioctl.h"
/* For struct ocfs2_blockcheck_stats */ /* For struct ocfs2_blockcheck_stats */
#include "blockcheck.h" #include "blockcheck.h"
...@@ -159,7 +160,7 @@ struct ocfs2_lock_res { ...@@ -159,7 +160,7 @@ struct ocfs2_lock_res {
int l_level; int l_level;
unsigned int l_ro_holders; unsigned int l_ro_holders;
unsigned int l_ex_holders; unsigned int l_ex_holders;
union ocfs2_dlm_lksb l_lksb; struct ocfs2_dlm_lksb l_lksb;
/* used from AST/BAST funcs. */ /* used from AST/BAST funcs. */
enum ocfs2_ast_action l_action; enum ocfs2_ast_action l_action;
...@@ -305,7 +306,9 @@ struct ocfs2_super ...@@ -305,7 +306,9 @@ struct ocfs2_super
u32 s_next_generation; u32 s_next_generation;
unsigned long osb_flags; unsigned long osb_flags;
s16 s_inode_steal_slot; s16 s_inode_steal_slot;
s16 s_meta_steal_slot;
atomic_t s_num_inodes_stolen; atomic_t s_num_inodes_stolen;
atomic_t s_num_meta_stolen;
unsigned long s_mount_opt; unsigned long s_mount_opt;
unsigned int s_atime_quantum; unsigned int s_atime_quantum;
...@@ -760,33 +763,6 @@ static inline unsigned int ocfs2_megabytes_to_clusters(struct super_block *sb, ...@@ -760,33 +763,6 @@ static inline unsigned int ocfs2_megabytes_to_clusters(struct super_block *sb,
return megs << (20 - OCFS2_SB(sb)->s_clustersize_bits); return megs << (20 - OCFS2_SB(sb)->s_clustersize_bits);
} }
static inline void ocfs2_init_inode_steal_slot(struct ocfs2_super *osb)
{
spin_lock(&osb->osb_lock);
osb->s_inode_steal_slot = OCFS2_INVALID_SLOT;
spin_unlock(&osb->osb_lock);
atomic_set(&osb->s_num_inodes_stolen, 0);
}
static inline void ocfs2_set_inode_steal_slot(struct ocfs2_super *osb,
s16 slot)
{
spin_lock(&osb->osb_lock);
osb->s_inode_steal_slot = slot;
spin_unlock(&osb->osb_lock);
}
static inline s16 ocfs2_get_inode_steal_slot(struct ocfs2_super *osb)
{
s16 slot;
spin_lock(&osb->osb_lock);
slot = osb->s_inode_steal_slot;
spin_unlock(&osb->osb_lock);
return slot;
}
#define ocfs2_set_bit ext2_set_bit #define ocfs2_set_bit ext2_set_bit
#define ocfs2_clear_bit ext2_clear_bit #define ocfs2_clear_bit ext2_clear_bit
#define ocfs2_test_bit ext2_test_bit #define ocfs2_test_bit ext2_test_bit
......
...@@ -253,63 +253,6 @@ ...@@ -253,63 +253,6 @@
* counted in an associated * counted in an associated
* refcount tree */ * refcount tree */
/*
* ioctl commands
*/
#define OCFS2_IOC_GETFLAGS _IOR('f', 1, long)
#define OCFS2_IOC_SETFLAGS _IOW('f', 2, long)
#define OCFS2_IOC32_GETFLAGS _IOR('f', 1, int)
#define OCFS2_IOC32_SETFLAGS _IOW('f', 2, int)
/*
* Space reservation / allocation / free ioctls and argument structure
* are designed to be compatible with XFS.
*
* ALLOCSP* and FREESP* are not and will never be supported, but are
* included here for completeness.
*/
struct ocfs2_space_resv {
__s16 l_type;
__s16 l_whence;
__s64 l_start;
__s64 l_len; /* len == 0 means until end of file */
__s32 l_sysid;
__u32 l_pid;
__s32 l_pad[4]; /* reserve area */
};
#define OCFS2_IOC_ALLOCSP _IOW ('X', 10, struct ocfs2_space_resv)
#define OCFS2_IOC_FREESP _IOW ('X', 11, struct ocfs2_space_resv)
#define OCFS2_IOC_RESVSP _IOW ('X', 40, struct ocfs2_space_resv)
#define OCFS2_IOC_UNRESVSP _IOW ('X', 41, struct ocfs2_space_resv)
#define OCFS2_IOC_ALLOCSP64 _IOW ('X', 36, struct ocfs2_space_resv)
#define OCFS2_IOC_FREESP64 _IOW ('X', 37, struct ocfs2_space_resv)
#define OCFS2_IOC_RESVSP64 _IOW ('X', 42, struct ocfs2_space_resv)
#define OCFS2_IOC_UNRESVSP64 _IOW ('X', 43, struct ocfs2_space_resv)
/* Used to pass group descriptor data when online resize is done */
struct ocfs2_new_group_input {
__u64 group; /* Group descriptor's blkno. */
__u32 clusters; /* Total number of clusters in this group */
__u32 frees; /* Total free clusters in this group */
__u16 chain; /* Chain for this group */
__u16 reserved1;
__u32 reserved2;
};
#define OCFS2_IOC_GROUP_EXTEND _IOW('o', 1, int)
#define OCFS2_IOC_GROUP_ADD _IOW('o', 2,struct ocfs2_new_group_input)
#define OCFS2_IOC_GROUP_ADD64 _IOW('o', 3,struct ocfs2_new_group_input)
/* Used to pass 2 file names to reflink. */
struct reflink_arguments {
__u64 old_path;
__u64 new_path;
__u64 preserve;
};
#define OCFS2_IOC_REFLINK _IOW('o', 4, struct reflink_arguments)
/* /*
* Journal Flags (ocfs2_dinode.id1.journal1.i_flags) * Journal Flags (ocfs2_dinode.id1.journal1.i_flags)
*/ */
......
/* -*- mode: c; c-basic-offset: 8; -*-
* vim: noexpandtab sw=8 ts=8 sts=0:
*
* ocfs2_ioctl.h
*
* Defines OCFS2 ioctls.
*
* Copyright (C) 2010 Oracle. All rights reserved.
*
* This program is free software; you can redistribute it and/or
* modify it under the terms of the GNU General Public
* License, version 2, as published by the Free Software Foundation.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* General Public License for more details.
*/
#ifndef OCFS2_IOCTL_H
#define OCFS2_IOCTL_H
/*
* ioctl commands
*/
#define OCFS2_IOC_GETFLAGS _IOR('f', 1, long)
#define OCFS2_IOC_SETFLAGS _IOW('f', 2, long)
#define OCFS2_IOC32_GETFLAGS _IOR('f', 1, int)
#define OCFS2_IOC32_SETFLAGS _IOW('f', 2, int)
/*
* Space reservation / allocation / free ioctls and argument structure
* are designed to be compatible with XFS.
*
* ALLOCSP* and FREESP* are not and will never be supported, but are
* included here for completeness.
*/
struct ocfs2_space_resv {
__s16 l_type;
__s16 l_whence;
__s64 l_start;
__s64 l_len; /* len == 0 means until end of file */
__s32 l_sysid;
__u32 l_pid;
__s32 l_pad[4]; /* reserve area */
};
#define OCFS2_IOC_ALLOCSP _IOW ('X', 10, struct ocfs2_space_resv)
#define OCFS2_IOC_FREESP _IOW ('X', 11, struct ocfs2_space_resv)
#define OCFS2_IOC_RESVSP _IOW ('X', 40, struct ocfs2_space_resv)
#define OCFS2_IOC_UNRESVSP _IOW ('X', 41, struct ocfs2_space_resv)
#define OCFS2_IOC_ALLOCSP64 _IOW ('X', 36, struct ocfs2_space_resv)
#define OCFS2_IOC_FREESP64 _IOW ('X', 37, struct ocfs2_space_resv)
#define OCFS2_IOC_RESVSP64 _IOW ('X', 42, struct ocfs2_space_resv)
#define OCFS2_IOC_UNRESVSP64 _IOW ('X', 43, struct ocfs2_space_resv)
/* Used to pass group descriptor data when online resize is done */
struct ocfs2_new_group_input {
__u64 group; /* Group descriptor's blkno. */
__u32 clusters; /* Total number of clusters in this group */
__u32 frees; /* Total free clusters in this group */
__u16 chain; /* Chain for this group */
__u16 reserved1;
__u32 reserved2;
};
#define OCFS2_IOC_GROUP_EXTEND _IOW('o', 1, int)
#define OCFS2_IOC_GROUP_ADD _IOW('o', 2,struct ocfs2_new_group_input)
#define OCFS2_IOC_GROUP_ADD64 _IOW('o', 3,struct ocfs2_new_group_input)
/* Used to pass 2 file names to reflink. */
struct reflink_arguments {
__u64 old_path;
__u64 new_path;
__u64 preserve;
};
#define OCFS2_IOC_REFLINK _IOW('o', 4, struct reflink_arguments)
#endif /* OCFS2_IOCTL_H */
...@@ -23,6 +23,8 @@ ...@@ -23,6 +23,8 @@
/* /*
* The protocol version for ocfs2 cluster locking. See dlmglue.c for * The protocol version for ocfs2 cluster locking. See dlmglue.c for
* more details. * more details.
*
* 1.0 - Initial locking version from ocfs2 1.4.
*/ */
#define OCFS2_LOCKING_PROTOCOL_MAJOR 1 #define OCFS2_LOCKING_PROTOCOL_MAJOR 1
#define OCFS2_LOCKING_PROTOCOL_MINOR 0 #define OCFS2_LOCKING_PROTOCOL_MINOR 0
......
...@@ -626,7 +626,7 @@ static int ocfs2_create_refcount_tree(struct inode *inode, ...@@ -626,7 +626,7 @@ static int ocfs2_create_refcount_tree(struct inode *inode,
rb = (struct ocfs2_refcount_block *)new_bh->b_data; rb = (struct ocfs2_refcount_block *)new_bh->b_data;
memset(rb, 0, inode->i_sb->s_blocksize); memset(rb, 0, inode->i_sb->s_blocksize);
strcpy((void *)rb, OCFS2_REFCOUNT_BLOCK_SIGNATURE); strcpy((void *)rb, OCFS2_REFCOUNT_BLOCK_SIGNATURE);
rb->rf_suballoc_slot = cpu_to_le16(osb->slot_num); rb->rf_suballoc_slot = cpu_to_le16(meta_ac->ac_alloc_slot);
rb->rf_suballoc_bit = cpu_to_le16(suballoc_bit_start); rb->rf_suballoc_bit = cpu_to_le16(suballoc_bit_start);
rb->rf_fs_generation = cpu_to_le32(osb->fs_generation); rb->rf_fs_generation = cpu_to_le32(osb->fs_generation);
rb->rf_blkno = cpu_to_le64(first_blkno); rb->rf_blkno = cpu_to_le64(first_blkno);
...@@ -1330,7 +1330,7 @@ static int ocfs2_expand_inline_ref_root(handle_t *handle, ...@@ -1330,7 +1330,7 @@ static int ocfs2_expand_inline_ref_root(handle_t *handle,
memcpy(new_bh->b_data, ref_root_bh->b_data, sb->s_blocksize); memcpy(new_bh->b_data, ref_root_bh->b_data, sb->s_blocksize);
new_rb = (struct ocfs2_refcount_block *)new_bh->b_data; new_rb = (struct ocfs2_refcount_block *)new_bh->b_data;
new_rb->rf_suballoc_slot = cpu_to_le16(OCFS2_SB(sb)->slot_num); new_rb->rf_suballoc_slot = cpu_to_le16(meta_ac->ac_alloc_slot);
new_rb->rf_suballoc_bit = cpu_to_le16(suballoc_bit_start); new_rb->rf_suballoc_bit = cpu_to_le16(suballoc_bit_start);
new_rb->rf_blkno = cpu_to_le64(blkno); new_rb->rf_blkno = cpu_to_le64(blkno);
new_rb->rf_cpos = cpu_to_le32(0); new_rb->rf_cpos = cpu_to_le32(0);
...@@ -1576,7 +1576,7 @@ static int ocfs2_new_leaf_refcount_block(handle_t *handle, ...@@ -1576,7 +1576,7 @@ static int ocfs2_new_leaf_refcount_block(handle_t *handle,
new_rb = (struct ocfs2_refcount_block *)new_bh->b_data; new_rb = (struct ocfs2_refcount_block *)new_bh->b_data;
memset(new_rb, 0, sb->s_blocksize); memset(new_rb, 0, sb->s_blocksize);
strcpy((void *)new_rb, OCFS2_REFCOUNT_BLOCK_SIGNATURE); strcpy((void *)new_rb, OCFS2_REFCOUNT_BLOCK_SIGNATURE);
new_rb->rf_suballoc_slot = cpu_to_le16(OCFS2_SB(sb)->slot_num); new_rb->rf_suballoc_slot = cpu_to_le16(meta_ac->ac_alloc_slot);
new_rb->rf_suballoc_bit = cpu_to_le16(suballoc_bit_start); new_rb->rf_suballoc_bit = cpu_to_le16(suballoc_bit_start);
new_rb->rf_fs_generation = cpu_to_le32(OCFS2_SB(sb)->fs_generation); new_rb->rf_fs_generation = cpu_to_le32(OCFS2_SB(sb)->fs_generation);
new_rb->rf_blkno = cpu_to_le64(blkno); new_rb->rf_blkno = cpu_to_le64(blkno);
......
...@@ -161,24 +161,23 @@ static int dlm_status_to_errno(enum dlm_status status) ...@@ -161,24 +161,23 @@ static int dlm_status_to_errno(enum dlm_status status)
static void o2dlm_lock_ast_wrapper(void *astarg) static void o2dlm_lock_ast_wrapper(void *astarg)
{ {
BUG_ON(o2cb_stack.sp_proto == NULL); struct ocfs2_dlm_lksb *lksb = astarg;
o2cb_stack.sp_proto->lp_lock_ast(astarg); lksb->lksb_conn->cc_proto->lp_lock_ast(lksb);
} }
static void o2dlm_blocking_ast_wrapper(void *astarg, int level) static void o2dlm_blocking_ast_wrapper(void *astarg, int level)
{ {
BUG_ON(o2cb_stack.sp_proto == NULL); struct ocfs2_dlm_lksb *lksb = astarg;
o2cb_stack.sp_proto->lp_blocking_ast(astarg, level); lksb->lksb_conn->cc_proto->lp_blocking_ast(lksb, level);
} }
static void o2dlm_unlock_ast_wrapper(void *astarg, enum dlm_status status) static void o2dlm_unlock_ast_wrapper(void *astarg, enum dlm_status status)
{ {
struct ocfs2_dlm_lksb *lksb = astarg;
int error = dlm_status_to_errno(status); int error = dlm_status_to_errno(status);
BUG_ON(o2cb_stack.sp_proto == NULL);
/* /*
* In o2dlm, you can get both the lock_ast() for the lock being * In o2dlm, you can get both the lock_ast() for the lock being
* granted and the unlock_ast() for the CANCEL failing. A * granted and the unlock_ast() for the CANCEL failing. A
...@@ -193,16 +192,15 @@ static void o2dlm_unlock_ast_wrapper(void *astarg, enum dlm_status status) ...@@ -193,16 +192,15 @@ static void o2dlm_unlock_ast_wrapper(void *astarg, enum dlm_status status)
if (status == DLM_CANCELGRANT) if (status == DLM_CANCELGRANT)
return; return;
o2cb_stack.sp_proto->lp_unlock_ast(astarg, error); lksb->lksb_conn->cc_proto->lp_unlock_ast(lksb, error);
} }
static int o2cb_dlm_lock(struct ocfs2_cluster_connection *conn, static int o2cb_dlm_lock(struct ocfs2_cluster_connection *conn,
int mode, int mode,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags,
void *name, void *name,
unsigned int namelen, unsigned int namelen)
void *astarg)
{ {
enum dlm_status status; enum dlm_status status;
int o2dlm_mode = mode_to_o2dlm(mode); int o2dlm_mode = mode_to_o2dlm(mode);
...@@ -211,28 +209,27 @@ static int o2cb_dlm_lock(struct ocfs2_cluster_connection *conn, ...@@ -211,28 +209,27 @@ static int o2cb_dlm_lock(struct ocfs2_cluster_connection *conn,
status = dlmlock(conn->cc_lockspace, o2dlm_mode, &lksb->lksb_o2dlm, status = dlmlock(conn->cc_lockspace, o2dlm_mode, &lksb->lksb_o2dlm,
o2dlm_flags, name, namelen, o2dlm_flags, name, namelen,
o2dlm_lock_ast_wrapper, astarg, o2dlm_lock_ast_wrapper, lksb,
o2dlm_blocking_ast_wrapper); o2dlm_blocking_ast_wrapper);
ret = dlm_status_to_errno(status); ret = dlm_status_to_errno(status);
return ret; return ret;
} }
static int o2cb_dlm_unlock(struct ocfs2_cluster_connection *conn, static int o2cb_dlm_unlock(struct ocfs2_cluster_connection *conn,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags)
void *astarg)
{ {
enum dlm_status status; enum dlm_status status;
int o2dlm_flags = flags_to_o2dlm(flags); int o2dlm_flags = flags_to_o2dlm(flags);
int ret; int ret;
status = dlmunlock(conn->cc_lockspace, &lksb->lksb_o2dlm, status = dlmunlock(conn->cc_lockspace, &lksb->lksb_o2dlm,
o2dlm_flags, o2dlm_unlock_ast_wrapper, astarg); o2dlm_flags, o2dlm_unlock_ast_wrapper, lksb);
ret = dlm_status_to_errno(status); ret = dlm_status_to_errno(status);
return ret; return ret;
} }
static int o2cb_dlm_lock_status(union ocfs2_dlm_lksb *lksb) static int o2cb_dlm_lock_status(struct ocfs2_dlm_lksb *lksb)
{ {
return dlm_status_to_errno(lksb->lksb_o2dlm.status); return dlm_status_to_errno(lksb->lksb_o2dlm.status);
} }
...@@ -242,17 +239,17 @@ static int o2cb_dlm_lock_status(union ocfs2_dlm_lksb *lksb) ...@@ -242,17 +239,17 @@ static int o2cb_dlm_lock_status(union ocfs2_dlm_lksb *lksb)
* contents, it will zero out the LVB. Thus the caller can always trust * contents, it will zero out the LVB. Thus the caller can always trust
* the contents. * the contents.
*/ */
static int o2cb_dlm_lvb_valid(union ocfs2_dlm_lksb *lksb) static int o2cb_dlm_lvb_valid(struct ocfs2_dlm_lksb *lksb)
{ {
return 1; return 1;
} }
static void *o2cb_dlm_lvb(union ocfs2_dlm_lksb *lksb) static void *o2cb_dlm_lvb(struct ocfs2_dlm_lksb *lksb)
{ {
return (void *)(lksb->lksb_o2dlm.lvb); return (void *)(lksb->lksb_o2dlm.lvb);
} }
static void o2cb_dump_lksb(union ocfs2_dlm_lksb *lksb) static void o2cb_dump_lksb(struct ocfs2_dlm_lksb *lksb)
{ {
dlm_print_one_lock(lksb->lksb_o2dlm.lockid); dlm_print_one_lock(lksb->lksb_o2dlm.lockid);
} }
...@@ -280,7 +277,7 @@ static int o2cb_cluster_connect(struct ocfs2_cluster_connection *conn) ...@@ -280,7 +277,7 @@ static int o2cb_cluster_connect(struct ocfs2_cluster_connection *conn)
struct dlm_protocol_version fs_version; struct dlm_protocol_version fs_version;
BUG_ON(conn == NULL); BUG_ON(conn == NULL);
BUG_ON(o2cb_stack.sp_proto == NULL); BUG_ON(conn->cc_proto == NULL);
/* for now we only have one cluster/node, make sure we see it /* for now we only have one cluster/node, make sure we see it
* in the heartbeat universe */ * in the heartbeat universe */
......
...@@ -25,7 +25,6 @@ ...@@ -25,7 +25,6 @@
#include <linux/reboot.h> #include <linux/reboot.h>
#include <asm/uaccess.h> #include <asm/uaccess.h>
#include "ocfs2.h" /* For struct ocfs2_lock_res */
#include "stackglue.h" #include "stackglue.h"
#include <linux/dlm_plock.h> #include <linux/dlm_plock.h>
...@@ -63,8 +62,8 @@ ...@@ -63,8 +62,8 @@
* negotiated by the client. The client negotiates based on the maximum * negotiated by the client. The client negotiates based on the maximum
* version advertised in /sys/fs/ocfs2/max_locking_protocol. The major * version advertised in /sys/fs/ocfs2/max_locking_protocol. The major
* number from the "SETV" message must match * number from the "SETV" message must match
* ocfs2_user_plugin.sp_proto->lp_max_version.pv_major, and the minor number * ocfs2_user_plugin.sp_max_proto.pv_major, and the minor number
* must be less than or equal to ...->lp_max_version.pv_minor. * must be less than or equal to ...sp_max_version.pv_minor.
* *
* Once this information has been set, mounts will be allowed. From this * Once this information has been set, mounts will be allowed. From this
* point on, the "DOWN" message can be sent for node down notification. * point on, the "DOWN" message can be sent for node down notification.
...@@ -401,7 +400,7 @@ static int ocfs2_control_do_setversion_msg(struct file *file, ...@@ -401,7 +400,7 @@ static int ocfs2_control_do_setversion_msg(struct file *file,
char *ptr = NULL; char *ptr = NULL;
struct ocfs2_control_private *p = file->private_data; struct ocfs2_control_private *p = file->private_data;
struct ocfs2_protocol_version *max = struct ocfs2_protocol_version *max =
&ocfs2_user_plugin.sp_proto->lp_max_version; &ocfs2_user_plugin.sp_max_proto;
if (ocfs2_control_get_handshake_state(file) != if (ocfs2_control_get_handshake_state(file) !=
OCFS2_CONTROL_HANDSHAKE_PROTOCOL) OCFS2_CONTROL_HANDSHAKE_PROTOCOL)
...@@ -664,18 +663,10 @@ static void ocfs2_control_exit(void) ...@@ -664,18 +663,10 @@ static void ocfs2_control_exit(void)
-rc); -rc);
} }
static struct dlm_lksb *fsdlm_astarg_to_lksb(void *astarg)
{
struct ocfs2_lock_res *res = astarg;
return &res->l_lksb.lksb_fsdlm;
}
static void fsdlm_lock_ast_wrapper(void *astarg) static void fsdlm_lock_ast_wrapper(void *astarg)
{ {
struct dlm_lksb *lksb = fsdlm_astarg_to_lksb(astarg); struct ocfs2_dlm_lksb *lksb = astarg;
int status = lksb->sb_status; int status = lksb->lksb_fsdlm.sb_status;
BUG_ON(ocfs2_user_plugin.sp_proto == NULL);
/* /*
* For now we're punting on the issue of other non-standard errors * For now we're punting on the issue of other non-standard errors
...@@ -688,25 +679,24 @@ static void fsdlm_lock_ast_wrapper(void *astarg) ...@@ -688,25 +679,24 @@ static void fsdlm_lock_ast_wrapper(void *astarg)
*/ */
if (status == -DLM_EUNLOCK || status == -DLM_ECANCEL) if (status == -DLM_EUNLOCK || status == -DLM_ECANCEL)
ocfs2_user_plugin.sp_proto->lp_unlock_ast(astarg, 0); lksb->lksb_conn->cc_proto->lp_unlock_ast(lksb, 0);
else else
ocfs2_user_plugin.sp_proto->lp_lock_ast(astarg); lksb->lksb_conn->cc_proto->lp_lock_ast(lksb);
} }
static void fsdlm_blocking_ast_wrapper(void *astarg, int level) static void fsdlm_blocking_ast_wrapper(void *astarg, int level)
{ {
BUG_ON(ocfs2_user_plugin.sp_proto == NULL); struct ocfs2_dlm_lksb *lksb = astarg;
ocfs2_user_plugin.sp_proto->lp_blocking_ast(astarg, level); lksb->lksb_conn->cc_proto->lp_blocking_ast(lksb, level);
} }
static int user_dlm_lock(struct ocfs2_cluster_connection *conn, static int user_dlm_lock(struct ocfs2_cluster_connection *conn,
int mode, int mode,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags,
void *name, void *name,
unsigned int namelen, unsigned int namelen)
void *astarg)
{ {
int ret; int ret;
...@@ -716,36 +706,35 @@ static int user_dlm_lock(struct ocfs2_cluster_connection *conn, ...@@ -716,36 +706,35 @@ static int user_dlm_lock(struct ocfs2_cluster_connection *conn,
ret = dlm_lock(conn->cc_lockspace, mode, &lksb->lksb_fsdlm, ret = dlm_lock(conn->cc_lockspace, mode, &lksb->lksb_fsdlm,
flags|DLM_LKF_NODLCKWT, name, namelen, 0, flags|DLM_LKF_NODLCKWT, name, namelen, 0,
fsdlm_lock_ast_wrapper, astarg, fsdlm_lock_ast_wrapper, lksb,
fsdlm_blocking_ast_wrapper); fsdlm_blocking_ast_wrapper);
return ret; return ret;
} }
static int user_dlm_unlock(struct ocfs2_cluster_connection *conn, static int user_dlm_unlock(struct ocfs2_cluster_connection *conn,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags)
void *astarg)
{ {
int ret; int ret;
ret = dlm_unlock(conn->cc_lockspace, lksb->lksb_fsdlm.sb_lkid, ret = dlm_unlock(conn->cc_lockspace, lksb->lksb_fsdlm.sb_lkid,
flags, &lksb->lksb_fsdlm, astarg); flags, &lksb->lksb_fsdlm, lksb);
return ret; return ret;
} }
static int user_dlm_lock_status(union ocfs2_dlm_lksb *lksb) static int user_dlm_lock_status(struct ocfs2_dlm_lksb *lksb)
{ {
return lksb->lksb_fsdlm.sb_status; return lksb->lksb_fsdlm.sb_status;
} }
static int user_dlm_lvb_valid(union ocfs2_dlm_lksb *lksb) static int user_dlm_lvb_valid(struct ocfs2_dlm_lksb *lksb)
{ {
int invalid = lksb->lksb_fsdlm.sb_flags & DLM_SBF_VALNOTVALID; int invalid = lksb->lksb_fsdlm.sb_flags & DLM_SBF_VALNOTVALID;
return !invalid; return !invalid;
} }
static void *user_dlm_lvb(union ocfs2_dlm_lksb *lksb) static void *user_dlm_lvb(struct ocfs2_dlm_lksb *lksb)
{ {
if (!lksb->lksb_fsdlm.sb_lvbptr) if (!lksb->lksb_fsdlm.sb_lvbptr)
lksb->lksb_fsdlm.sb_lvbptr = (char *)lksb + lksb->lksb_fsdlm.sb_lvbptr = (char *)lksb +
...@@ -753,7 +742,7 @@ static void *user_dlm_lvb(union ocfs2_dlm_lksb *lksb) ...@@ -753,7 +742,7 @@ static void *user_dlm_lvb(union ocfs2_dlm_lksb *lksb)
return (void *)(lksb->lksb_fsdlm.sb_lvbptr); return (void *)(lksb->lksb_fsdlm.sb_lvbptr);
} }
static void user_dlm_dump_lksb(union ocfs2_dlm_lksb *lksb) static void user_dlm_dump_lksb(struct ocfs2_dlm_lksb *lksb)
{ {
} }
......
...@@ -36,7 +36,7 @@ ...@@ -36,7 +36,7 @@
#define OCFS2_STACK_PLUGIN_USER "user" #define OCFS2_STACK_PLUGIN_USER "user"
#define OCFS2_MAX_HB_CTL_PATH 256 #define OCFS2_MAX_HB_CTL_PATH 256
static struct ocfs2_locking_protocol *lproto; static struct ocfs2_protocol_version locking_max_version;
static DEFINE_SPINLOCK(ocfs2_stack_lock); static DEFINE_SPINLOCK(ocfs2_stack_lock);
static LIST_HEAD(ocfs2_stack_list); static LIST_HEAD(ocfs2_stack_list);
static char cluster_stack_name[OCFS2_STACK_LABEL_LEN + 1]; static char cluster_stack_name[OCFS2_STACK_LABEL_LEN + 1];
...@@ -176,7 +176,7 @@ int ocfs2_stack_glue_register(struct ocfs2_stack_plugin *plugin) ...@@ -176,7 +176,7 @@ int ocfs2_stack_glue_register(struct ocfs2_stack_plugin *plugin)
spin_lock(&ocfs2_stack_lock); spin_lock(&ocfs2_stack_lock);
if (!ocfs2_stack_lookup(plugin->sp_name)) { if (!ocfs2_stack_lookup(plugin->sp_name)) {
plugin->sp_count = 0; plugin->sp_count = 0;
plugin->sp_proto = lproto; plugin->sp_max_proto = locking_max_version;
list_add(&plugin->sp_list, &ocfs2_stack_list); list_add(&plugin->sp_list, &ocfs2_stack_list);
printk(KERN_INFO "ocfs2: Registered cluster interface %s\n", printk(KERN_INFO "ocfs2: Registered cluster interface %s\n",
plugin->sp_name); plugin->sp_name);
...@@ -213,77 +213,76 @@ void ocfs2_stack_glue_unregister(struct ocfs2_stack_plugin *plugin) ...@@ -213,77 +213,76 @@ void ocfs2_stack_glue_unregister(struct ocfs2_stack_plugin *plugin)
} }
EXPORT_SYMBOL_GPL(ocfs2_stack_glue_unregister); EXPORT_SYMBOL_GPL(ocfs2_stack_glue_unregister);
void ocfs2_stack_glue_set_locking_protocol(struct ocfs2_locking_protocol *proto) void ocfs2_stack_glue_set_max_proto_version(struct ocfs2_protocol_version *max_proto)
{ {
struct ocfs2_stack_plugin *p; struct ocfs2_stack_plugin *p;
BUG_ON(proto == NULL);
spin_lock(&ocfs2_stack_lock); spin_lock(&ocfs2_stack_lock);
BUG_ON(active_stack != NULL); if (memcmp(max_proto, &locking_max_version,
sizeof(struct ocfs2_protocol_version))) {
BUG_ON(locking_max_version.pv_major != 0);
lproto = proto; locking_max_version = *max_proto;
list_for_each_entry(p, &ocfs2_stack_list, sp_list) { list_for_each_entry(p, &ocfs2_stack_list, sp_list) {
p->sp_proto = lproto; p->sp_max_proto = locking_max_version;
}
} }
spin_unlock(&ocfs2_stack_lock); spin_unlock(&ocfs2_stack_lock);
} }
EXPORT_SYMBOL_GPL(ocfs2_stack_glue_set_locking_protocol); EXPORT_SYMBOL_GPL(ocfs2_stack_glue_set_max_proto_version);
/* /*
* The ocfs2_dlm_lock() and ocfs2_dlm_unlock() functions take * The ocfs2_dlm_lock() and ocfs2_dlm_unlock() functions take no argument
* "struct ocfs2_lock_res *astarg" instead of "void *astarg" because the * for the ast and bast functions. They will pass the lksb to the ast
* underlying stack plugins need to pilfer the lksb off of the lock_res. * and bast. The caller can wrap the lksb with their own structure to
* If some other structure needs to be passed as an astarg, the plugins * get more information.
* will need to be given a different avenue to the lksb.
*/ */
int ocfs2_dlm_lock(struct ocfs2_cluster_connection *conn, int ocfs2_dlm_lock(struct ocfs2_cluster_connection *conn,
int mode, int mode,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags,
void *name, void *name,
unsigned int namelen, unsigned int namelen)
struct ocfs2_lock_res *astarg)
{ {
BUG_ON(lproto == NULL); if (!lksb->lksb_conn)
lksb->lksb_conn = conn;
else
BUG_ON(lksb->lksb_conn != conn);
return active_stack->sp_ops->dlm_lock(conn, mode, lksb, flags, return active_stack->sp_ops->dlm_lock(conn, mode, lksb, flags,
name, namelen, astarg); name, namelen);
} }
EXPORT_SYMBOL_GPL(ocfs2_dlm_lock); EXPORT_SYMBOL_GPL(ocfs2_dlm_lock);
int ocfs2_dlm_unlock(struct ocfs2_cluster_connection *conn, int ocfs2_dlm_unlock(struct ocfs2_cluster_connection *conn,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags)
struct ocfs2_lock_res *astarg)
{ {
BUG_ON(lproto == NULL); BUG_ON(lksb->lksb_conn == NULL);
return active_stack->sp_ops->dlm_unlock(conn, lksb, flags, astarg); return active_stack->sp_ops->dlm_unlock(conn, lksb, flags);
} }
EXPORT_SYMBOL_GPL(ocfs2_dlm_unlock); EXPORT_SYMBOL_GPL(ocfs2_dlm_unlock);
int ocfs2_dlm_lock_status(union ocfs2_dlm_lksb *lksb) int ocfs2_dlm_lock_status(struct ocfs2_dlm_lksb *lksb)
{ {
return active_stack->sp_ops->lock_status(lksb); return active_stack->sp_ops->lock_status(lksb);
} }
EXPORT_SYMBOL_GPL(ocfs2_dlm_lock_status); EXPORT_SYMBOL_GPL(ocfs2_dlm_lock_status);
int ocfs2_dlm_lvb_valid(union ocfs2_dlm_lksb *lksb) int ocfs2_dlm_lvb_valid(struct ocfs2_dlm_lksb *lksb)
{ {
return active_stack->sp_ops->lvb_valid(lksb); return active_stack->sp_ops->lvb_valid(lksb);
} }
EXPORT_SYMBOL_GPL(ocfs2_dlm_lvb_valid); EXPORT_SYMBOL_GPL(ocfs2_dlm_lvb_valid);
void *ocfs2_dlm_lvb(union ocfs2_dlm_lksb *lksb) void *ocfs2_dlm_lvb(struct ocfs2_dlm_lksb *lksb)
{ {
return active_stack->sp_ops->lock_lvb(lksb); return active_stack->sp_ops->lock_lvb(lksb);
} }
EXPORT_SYMBOL_GPL(ocfs2_dlm_lvb); EXPORT_SYMBOL_GPL(ocfs2_dlm_lvb);
void ocfs2_dlm_dump_lksb(union ocfs2_dlm_lksb *lksb) void ocfs2_dlm_dump_lksb(struct ocfs2_dlm_lksb *lksb)
{ {
active_stack->sp_ops->dump_lksb(lksb); active_stack->sp_ops->dump_lksb(lksb);
} }
...@@ -312,6 +311,7 @@ EXPORT_SYMBOL_GPL(ocfs2_plock); ...@@ -312,6 +311,7 @@ EXPORT_SYMBOL_GPL(ocfs2_plock);
int ocfs2_cluster_connect(const char *stack_name, int ocfs2_cluster_connect(const char *stack_name,
const char *group, const char *group,
int grouplen, int grouplen,
struct ocfs2_locking_protocol *lproto,
void (*recovery_handler)(int node_num, void (*recovery_handler)(int node_num,
void *recovery_data), void *recovery_data),
void *recovery_data, void *recovery_data,
...@@ -329,6 +329,12 @@ int ocfs2_cluster_connect(const char *stack_name, ...@@ -329,6 +329,12 @@ int ocfs2_cluster_connect(const char *stack_name,
goto out; goto out;
} }
if (memcmp(&lproto->lp_max_version, &locking_max_version,
sizeof(struct ocfs2_protocol_version))) {
rc = -EINVAL;
goto out;
}
new_conn = kzalloc(sizeof(struct ocfs2_cluster_connection), new_conn = kzalloc(sizeof(struct ocfs2_cluster_connection),
GFP_KERNEL); GFP_KERNEL);
if (!new_conn) { if (!new_conn) {
...@@ -341,6 +347,7 @@ int ocfs2_cluster_connect(const char *stack_name, ...@@ -341,6 +347,7 @@ int ocfs2_cluster_connect(const char *stack_name,
new_conn->cc_recovery_handler = recovery_handler; new_conn->cc_recovery_handler = recovery_handler;
new_conn->cc_recovery_data = recovery_data; new_conn->cc_recovery_data = recovery_data;
new_conn->cc_proto = lproto;
/* Start the new connection at our maximum compatibility level */ /* Start the new connection at our maximum compatibility level */
new_conn->cc_version = lproto->lp_max_version; new_conn->cc_version = lproto->lp_max_version;
...@@ -366,6 +373,24 @@ int ocfs2_cluster_connect(const char *stack_name, ...@@ -366,6 +373,24 @@ int ocfs2_cluster_connect(const char *stack_name,
} }
EXPORT_SYMBOL_GPL(ocfs2_cluster_connect); EXPORT_SYMBOL_GPL(ocfs2_cluster_connect);
/* The caller will ensure all nodes have the same cluster stack */
int ocfs2_cluster_connect_agnostic(const char *group,
int grouplen,
struct ocfs2_locking_protocol *lproto,
void (*recovery_handler)(int node_num,
void *recovery_data),
void *recovery_data,
struct ocfs2_cluster_connection **conn)
{
char *stack_name = NULL;
if (cluster_stack_name[0])
stack_name = cluster_stack_name;
return ocfs2_cluster_connect(stack_name, group, grouplen, lproto,
recovery_handler, recovery_data, conn);
}
EXPORT_SYMBOL_GPL(ocfs2_cluster_connect_agnostic);
/* If hangup_pending is 0, the stack driver will be dropped */ /* If hangup_pending is 0, the stack driver will be dropped */
int ocfs2_cluster_disconnect(struct ocfs2_cluster_connection *conn, int ocfs2_cluster_disconnect(struct ocfs2_cluster_connection *conn,
int hangup_pending) int hangup_pending)
...@@ -453,10 +478,10 @@ static ssize_t ocfs2_max_locking_protocol_show(struct kobject *kobj, ...@@ -453,10 +478,10 @@ static ssize_t ocfs2_max_locking_protocol_show(struct kobject *kobj,
ssize_t ret = 0; ssize_t ret = 0;
spin_lock(&ocfs2_stack_lock); spin_lock(&ocfs2_stack_lock);
if (lproto) if (locking_max_version.pv_major)
ret = snprintf(buf, PAGE_SIZE, "%u.%u\n", ret = snprintf(buf, PAGE_SIZE, "%u.%u\n",
lproto->lp_max_version.pv_major, locking_max_version.pv_major,
lproto->lp_max_version.pv_minor); locking_max_version.pv_minor);
spin_unlock(&ocfs2_stack_lock); spin_unlock(&ocfs2_stack_lock);
return ret; return ret;
...@@ -685,7 +710,10 @@ static int __init ocfs2_stack_glue_init(void) ...@@ -685,7 +710,10 @@ static int __init ocfs2_stack_glue_init(void)
static void __exit ocfs2_stack_glue_exit(void) static void __exit ocfs2_stack_glue_exit(void)
{ {
lproto = NULL; memset(&locking_max_version, 0,
sizeof(struct ocfs2_protocol_version));
locking_max_version.pv_major = 0;
locking_max_version.pv_minor = 0;
ocfs2_sysfs_exit(); ocfs2_sysfs_exit();
if (ocfs2_table_header) if (ocfs2_table_header)
unregister_sysctl_table(ocfs2_table_header); unregister_sysctl_table(ocfs2_table_header);
......
...@@ -55,17 +55,6 @@ struct ocfs2_protocol_version { ...@@ -55,17 +55,6 @@ struct ocfs2_protocol_version {
u8 pv_minor; u8 pv_minor;
}; };
/*
* The ocfs2_locking_protocol defines the handlers called on ocfs2's behalf.
*/
struct ocfs2_locking_protocol {
struct ocfs2_protocol_version lp_max_version;
void (*lp_lock_ast)(void *astarg);
void (*lp_blocking_ast)(void *astarg, int level);
void (*lp_unlock_ast)(void *astarg, int error);
};
/* /*
* The dlm_lockstatus struct includes lvb space, but the dlm_lksb struct only * The dlm_lockstatus struct includes lvb space, but the dlm_lksb struct only
* has a pointer to separately allocated lvb space. This struct exists only to * has a pointer to separately allocated lvb space. This struct exists only to
...@@ -81,12 +70,27 @@ struct fsdlm_lksb_plus_lvb { ...@@ -81,12 +70,27 @@ struct fsdlm_lksb_plus_lvb {
* size of the union is known. Lock status structures are embedded in * size of the union is known. Lock status structures are embedded in
* ocfs2 inodes. * ocfs2 inodes.
*/ */
union ocfs2_dlm_lksb { struct ocfs2_cluster_connection;
struct dlm_lockstatus lksb_o2dlm; struct ocfs2_dlm_lksb {
struct dlm_lksb lksb_fsdlm; union {
struct fsdlm_lksb_plus_lvb padding; struct dlm_lockstatus lksb_o2dlm;
struct dlm_lksb lksb_fsdlm;
struct fsdlm_lksb_plus_lvb padding;
};
struct ocfs2_cluster_connection *lksb_conn;
};
/*
* The ocfs2_locking_protocol defines the handlers called on ocfs2's behalf.
*/
struct ocfs2_locking_protocol {
struct ocfs2_protocol_version lp_max_version;
void (*lp_lock_ast)(struct ocfs2_dlm_lksb *lksb);
void (*lp_blocking_ast)(struct ocfs2_dlm_lksb *lksb, int level);
void (*lp_unlock_ast)(struct ocfs2_dlm_lksb *lksb, int error);
}; };
/* /*
* A cluster connection. Mostly opaque to ocfs2, the connection holds * A cluster connection. Mostly opaque to ocfs2, the connection holds
* state for the underlying stack. ocfs2 does use cc_version to determine * state for the underlying stack. ocfs2 does use cc_version to determine
...@@ -96,6 +100,7 @@ struct ocfs2_cluster_connection { ...@@ -96,6 +100,7 @@ struct ocfs2_cluster_connection {
char cc_name[GROUP_NAME_MAX]; char cc_name[GROUP_NAME_MAX];
int cc_namelen; int cc_namelen;
struct ocfs2_protocol_version cc_version; struct ocfs2_protocol_version cc_version;
struct ocfs2_locking_protocol *cc_proto;
void (*cc_recovery_handler)(int node_num, void *recovery_data); void (*cc_recovery_handler)(int node_num, void *recovery_data);
void *cc_recovery_data; void *cc_recovery_data;
void *cc_lockspace; void *cc_lockspace;
...@@ -155,27 +160,29 @@ struct ocfs2_stack_operations { ...@@ -155,27 +160,29 @@ struct ocfs2_stack_operations {
* *
* ast and bast functions are not part of the call because the * ast and bast functions are not part of the call because the
* stack will likely want to wrap ast and bast calls before passing * stack will likely want to wrap ast and bast calls before passing
* them to stack->sp_proto. * them to stack->sp_proto. There is no astarg. The lksb will
* be passed back to the ast and bast functions. The caller can
* use this to find their object.
*/ */
int (*dlm_lock)(struct ocfs2_cluster_connection *conn, int (*dlm_lock)(struct ocfs2_cluster_connection *conn,
int mode, int mode,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags,
void *name, void *name,
unsigned int namelen, unsigned int namelen);
void *astarg);
/* /*
* Call the underlying dlm unlock function. The ->dlm_unlock() * Call the underlying dlm unlock function. The ->dlm_unlock()
* function should convert the flags as appropriate. * function should convert the flags as appropriate.
* *
* The unlock ast is not passed, as the stack will want to wrap * The unlock ast is not passed, as the stack will want to wrap
* it before calling stack->sp_proto->lp_unlock_ast(). * it before calling stack->sp_proto->lp_unlock_ast(). There is
* no astarg. The lksb will be passed back to the unlock ast
* function. The caller can use this to find their object.
*/ */
int (*dlm_unlock)(struct ocfs2_cluster_connection *conn, int (*dlm_unlock)(struct ocfs2_cluster_connection *conn,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags);
void *astarg);
/* /*
* Return the status of the current lock status block. The fs * Return the status of the current lock status block. The fs
...@@ -183,17 +190,17 @@ struct ocfs2_stack_operations { ...@@ -183,17 +190,17 @@ struct ocfs2_stack_operations {
* callback pulls out the stack-specific lksb, converts the status * callback pulls out the stack-specific lksb, converts the status
* to a proper errno, and returns it. * to a proper errno, and returns it.
*/ */
int (*lock_status)(union ocfs2_dlm_lksb *lksb); int (*lock_status)(struct ocfs2_dlm_lksb *lksb);
/* /*
* Return non-zero if the LVB is valid. * Return non-zero if the LVB is valid.
*/ */
int (*lvb_valid)(union ocfs2_dlm_lksb *lksb); int (*lvb_valid)(struct ocfs2_dlm_lksb *lksb);
/* /*
* Pull the lvb pointer off of the stack-specific lksb. * Pull the lvb pointer off of the stack-specific lksb.
*/ */
void *(*lock_lvb)(union ocfs2_dlm_lksb *lksb); void *(*lock_lvb)(struct ocfs2_dlm_lksb *lksb);
/* /*
* Cluster-aware posix locks * Cluster-aware posix locks
...@@ -210,7 +217,7 @@ struct ocfs2_stack_operations { ...@@ -210,7 +217,7 @@ struct ocfs2_stack_operations {
* This is an optoinal debugging hook. If provided, the * This is an optoinal debugging hook. If provided, the
* stack can dump debugging information about this lock. * stack can dump debugging information about this lock.
*/ */
void (*dump_lksb)(union ocfs2_dlm_lksb *lksb); void (*dump_lksb)(struct ocfs2_dlm_lksb *lksb);
}; };
/* /*
...@@ -226,7 +233,7 @@ struct ocfs2_stack_plugin { ...@@ -226,7 +233,7 @@ struct ocfs2_stack_plugin {
/* These are managed by the stackglue code. */ /* These are managed by the stackglue code. */
struct list_head sp_list; struct list_head sp_list;
unsigned int sp_count; unsigned int sp_count;
struct ocfs2_locking_protocol *sp_proto; struct ocfs2_protocol_version sp_max_proto;
}; };
...@@ -234,10 +241,22 @@ struct ocfs2_stack_plugin { ...@@ -234,10 +241,22 @@ struct ocfs2_stack_plugin {
int ocfs2_cluster_connect(const char *stack_name, int ocfs2_cluster_connect(const char *stack_name,
const char *group, const char *group,
int grouplen, int grouplen,
struct ocfs2_locking_protocol *lproto,
void (*recovery_handler)(int node_num, void (*recovery_handler)(int node_num,
void *recovery_data), void *recovery_data),
void *recovery_data, void *recovery_data,
struct ocfs2_cluster_connection **conn); struct ocfs2_cluster_connection **conn);
/*
* Used by callers that don't store their stack name. They must ensure
* all nodes have the same stack.
*/
int ocfs2_cluster_connect_agnostic(const char *group,
int grouplen,
struct ocfs2_locking_protocol *lproto,
void (*recovery_handler)(int node_num,
void *recovery_data),
void *recovery_data,
struct ocfs2_cluster_connection **conn);
int ocfs2_cluster_disconnect(struct ocfs2_cluster_connection *conn, int ocfs2_cluster_disconnect(struct ocfs2_cluster_connection *conn,
int hangup_pending); int hangup_pending);
void ocfs2_cluster_hangup(const char *group, int grouplen); void ocfs2_cluster_hangup(const char *group, int grouplen);
...@@ -246,26 +265,24 @@ int ocfs2_cluster_this_node(unsigned int *node); ...@@ -246,26 +265,24 @@ int ocfs2_cluster_this_node(unsigned int *node);
struct ocfs2_lock_res; struct ocfs2_lock_res;
int ocfs2_dlm_lock(struct ocfs2_cluster_connection *conn, int ocfs2_dlm_lock(struct ocfs2_cluster_connection *conn,
int mode, int mode,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags,
void *name, void *name,
unsigned int namelen, unsigned int namelen);
struct ocfs2_lock_res *astarg);
int ocfs2_dlm_unlock(struct ocfs2_cluster_connection *conn, int ocfs2_dlm_unlock(struct ocfs2_cluster_connection *conn,
union ocfs2_dlm_lksb *lksb, struct ocfs2_dlm_lksb *lksb,
u32 flags, u32 flags);
struct ocfs2_lock_res *astarg);
int ocfs2_dlm_lock_status(union ocfs2_dlm_lksb *lksb); int ocfs2_dlm_lock_status(struct ocfs2_dlm_lksb *lksb);
int ocfs2_dlm_lvb_valid(union ocfs2_dlm_lksb *lksb); int ocfs2_dlm_lvb_valid(struct ocfs2_dlm_lksb *lksb);
void *ocfs2_dlm_lvb(union ocfs2_dlm_lksb *lksb); void *ocfs2_dlm_lvb(struct ocfs2_dlm_lksb *lksb);
void ocfs2_dlm_dump_lksb(union ocfs2_dlm_lksb *lksb); void ocfs2_dlm_dump_lksb(struct ocfs2_dlm_lksb *lksb);
int ocfs2_stack_supports_plocks(void); int ocfs2_stack_supports_plocks(void);
int ocfs2_plock(struct ocfs2_cluster_connection *conn, u64 ino, int ocfs2_plock(struct ocfs2_cluster_connection *conn, u64 ino,
struct file *file, int cmd, struct file_lock *fl); struct file *file, int cmd, struct file_lock *fl);
void ocfs2_stack_glue_set_locking_protocol(struct ocfs2_locking_protocol *proto); void ocfs2_stack_glue_set_max_proto_version(struct ocfs2_protocol_version *max_proto);
/* Used by stack plugins */ /* Used by stack plugins */
......
...@@ -51,7 +51,7 @@ ...@@ -51,7 +51,7 @@
#define ALLOC_NEW_GROUP 0x1 #define ALLOC_NEW_GROUP 0x1
#define ALLOC_GROUPS_FROM_GLOBAL 0x2 #define ALLOC_GROUPS_FROM_GLOBAL 0x2
#define OCFS2_MAX_INODES_TO_STEAL 1024 #define OCFS2_MAX_TO_STEAL 1024
static inline void ocfs2_debug_bg(struct ocfs2_group_desc *bg); static inline void ocfs2_debug_bg(struct ocfs2_group_desc *bg);
static inline void ocfs2_debug_suballoc_inode(struct ocfs2_dinode *fe); static inline void ocfs2_debug_suballoc_inode(struct ocfs2_dinode *fe);
...@@ -637,12 +637,113 @@ static int ocfs2_reserve_suballoc_bits(struct ocfs2_super *osb, ...@@ -637,12 +637,113 @@ static int ocfs2_reserve_suballoc_bits(struct ocfs2_super *osb,
return status; return status;
} }
static void ocfs2_init_inode_steal_slot(struct ocfs2_super *osb)
{
spin_lock(&osb->osb_lock);
osb->s_inode_steal_slot = OCFS2_INVALID_SLOT;
spin_unlock(&osb->osb_lock);
atomic_set(&osb->s_num_inodes_stolen, 0);
}
static void ocfs2_init_meta_steal_slot(struct ocfs2_super *osb)
{
spin_lock(&osb->osb_lock);
osb->s_meta_steal_slot = OCFS2_INVALID_SLOT;
spin_unlock(&osb->osb_lock);
atomic_set(&osb->s_num_meta_stolen, 0);
}
void ocfs2_init_steal_slots(struct ocfs2_super *osb)
{
ocfs2_init_inode_steal_slot(osb);
ocfs2_init_meta_steal_slot(osb);
}
static void __ocfs2_set_steal_slot(struct ocfs2_super *osb, int slot, int type)
{
spin_lock(&osb->osb_lock);
if (type == INODE_ALLOC_SYSTEM_INODE)
osb->s_inode_steal_slot = slot;
else if (type == EXTENT_ALLOC_SYSTEM_INODE)
osb->s_meta_steal_slot = slot;
spin_unlock(&osb->osb_lock);
}
static int __ocfs2_get_steal_slot(struct ocfs2_super *osb, int type)
{
int slot = OCFS2_INVALID_SLOT;
spin_lock(&osb->osb_lock);
if (type == INODE_ALLOC_SYSTEM_INODE)
slot = osb->s_inode_steal_slot;
else if (type == EXTENT_ALLOC_SYSTEM_INODE)
slot = osb->s_meta_steal_slot;
spin_unlock(&osb->osb_lock);
return slot;
}
static int ocfs2_get_inode_steal_slot(struct ocfs2_super *osb)
{
return __ocfs2_get_steal_slot(osb, INODE_ALLOC_SYSTEM_INODE);
}
static int ocfs2_get_meta_steal_slot(struct ocfs2_super *osb)
{
return __ocfs2_get_steal_slot(osb, EXTENT_ALLOC_SYSTEM_INODE);
}
static int ocfs2_steal_resource(struct ocfs2_super *osb,
struct ocfs2_alloc_context *ac,
int type)
{
int i, status = -ENOSPC;
int slot = __ocfs2_get_steal_slot(osb, type);
/* Start to steal resource from the first slot after ours. */
if (slot == OCFS2_INVALID_SLOT)
slot = osb->slot_num + 1;
for (i = 0; i < osb->max_slots; i++, slot++) {
if (slot == osb->max_slots)
slot = 0;
if (slot == osb->slot_num)
continue;
status = ocfs2_reserve_suballoc_bits(osb, ac,
type,
(u32)slot, NULL,
NOT_ALLOC_NEW_GROUP);
if (status >= 0) {
__ocfs2_set_steal_slot(osb, slot, type);
break;
}
ocfs2_free_ac_resource(ac);
}
return status;
}
static int ocfs2_steal_inode(struct ocfs2_super *osb,
struct ocfs2_alloc_context *ac)
{
return ocfs2_steal_resource(osb, ac, INODE_ALLOC_SYSTEM_INODE);
}
static int ocfs2_steal_meta(struct ocfs2_super *osb,
struct ocfs2_alloc_context *ac)
{
return ocfs2_steal_resource(osb, ac, EXTENT_ALLOC_SYSTEM_INODE);
}
int ocfs2_reserve_new_metadata_blocks(struct ocfs2_super *osb, int ocfs2_reserve_new_metadata_blocks(struct ocfs2_super *osb,
int blocks, int blocks,
struct ocfs2_alloc_context **ac) struct ocfs2_alloc_context **ac)
{ {
int status; int status;
u32 slot; int slot = ocfs2_get_meta_steal_slot(osb);
*ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL); *ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL);
if (!(*ac)) { if (!(*ac)) {
...@@ -653,12 +754,34 @@ int ocfs2_reserve_new_metadata_blocks(struct ocfs2_super *osb, ...@@ -653,12 +754,34 @@ int ocfs2_reserve_new_metadata_blocks(struct ocfs2_super *osb,
(*ac)->ac_bits_wanted = blocks; (*ac)->ac_bits_wanted = blocks;
(*ac)->ac_which = OCFS2_AC_USE_META; (*ac)->ac_which = OCFS2_AC_USE_META;
slot = osb->slot_num;
(*ac)->ac_group_search = ocfs2_block_group_search; (*ac)->ac_group_search = ocfs2_block_group_search;
if (slot != OCFS2_INVALID_SLOT &&
atomic_read(&osb->s_num_meta_stolen) < OCFS2_MAX_TO_STEAL)
goto extent_steal;
atomic_set(&osb->s_num_meta_stolen, 0);
status = ocfs2_reserve_suballoc_bits(osb, (*ac), status = ocfs2_reserve_suballoc_bits(osb, (*ac),
EXTENT_ALLOC_SYSTEM_INODE, EXTENT_ALLOC_SYSTEM_INODE,
slot, NULL, ALLOC_NEW_GROUP); (u32)osb->slot_num, NULL,
ALLOC_NEW_GROUP);
if (status >= 0) {
status = 0;
if (slot != OCFS2_INVALID_SLOT)
ocfs2_init_meta_steal_slot(osb);
goto bail;
} else if (status < 0 && status != -ENOSPC) {
mlog_errno(status);
goto bail;
}
ocfs2_free_ac_resource(*ac);
extent_steal:
status = ocfs2_steal_meta(osb, *ac);
atomic_inc(&osb->s_num_meta_stolen);
if (status < 0) { if (status < 0) {
if (status != -ENOSPC) if (status != -ENOSPC)
mlog_errno(status); mlog_errno(status);
...@@ -685,43 +808,11 @@ int ocfs2_reserve_new_metadata(struct ocfs2_super *osb, ...@@ -685,43 +808,11 @@ int ocfs2_reserve_new_metadata(struct ocfs2_super *osb,
ac); ac);
} }
static int ocfs2_steal_inode_from_other_nodes(struct ocfs2_super *osb,
struct ocfs2_alloc_context *ac)
{
int i, status = -ENOSPC;
s16 slot = ocfs2_get_inode_steal_slot(osb);
/* Start to steal inodes from the first slot after ours. */
if (slot == OCFS2_INVALID_SLOT)
slot = osb->slot_num + 1;
for (i = 0; i < osb->max_slots; i++, slot++) {
if (slot == osb->max_slots)
slot = 0;
if (slot == osb->slot_num)
continue;
status = ocfs2_reserve_suballoc_bits(osb, ac,
INODE_ALLOC_SYSTEM_INODE,
slot, NULL,
NOT_ALLOC_NEW_GROUP);
if (status >= 0) {
ocfs2_set_inode_steal_slot(osb, slot);
break;
}
ocfs2_free_ac_resource(ac);
}
return status;
}
int ocfs2_reserve_new_inode(struct ocfs2_super *osb, int ocfs2_reserve_new_inode(struct ocfs2_super *osb,
struct ocfs2_alloc_context **ac) struct ocfs2_alloc_context **ac)
{ {
int status; int status;
s16 slot = ocfs2_get_inode_steal_slot(osb); int slot = ocfs2_get_inode_steal_slot(osb);
u64 alloc_group; u64 alloc_group;
*ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL); *ac = kzalloc(sizeof(struct ocfs2_alloc_context), GFP_KERNEL);
...@@ -754,14 +845,14 @@ int ocfs2_reserve_new_inode(struct ocfs2_super *osb, ...@@ -754,14 +845,14 @@ int ocfs2_reserve_new_inode(struct ocfs2_super *osb,
* need to check our slots to see whether there is some space for us. * need to check our slots to see whether there is some space for us.
*/ */
if (slot != OCFS2_INVALID_SLOT && if (slot != OCFS2_INVALID_SLOT &&
atomic_read(&osb->s_num_inodes_stolen) < OCFS2_MAX_INODES_TO_STEAL) atomic_read(&osb->s_num_inodes_stolen) < OCFS2_MAX_TO_STEAL)
goto inode_steal; goto inode_steal;
atomic_set(&osb->s_num_inodes_stolen, 0); atomic_set(&osb->s_num_inodes_stolen, 0);
alloc_group = osb->osb_inode_alloc_group; alloc_group = osb->osb_inode_alloc_group;
status = ocfs2_reserve_suballoc_bits(osb, *ac, status = ocfs2_reserve_suballoc_bits(osb, *ac,
INODE_ALLOC_SYSTEM_INODE, INODE_ALLOC_SYSTEM_INODE,
osb->slot_num, (u32)osb->slot_num,
&alloc_group, &alloc_group,
ALLOC_NEW_GROUP | ALLOC_NEW_GROUP |
ALLOC_GROUPS_FROM_GLOBAL); ALLOC_GROUPS_FROM_GLOBAL);
...@@ -789,7 +880,7 @@ int ocfs2_reserve_new_inode(struct ocfs2_super *osb, ...@@ -789,7 +880,7 @@ int ocfs2_reserve_new_inode(struct ocfs2_super *osb,
ocfs2_free_ac_resource(*ac); ocfs2_free_ac_resource(*ac);
inode_steal: inode_steal:
status = ocfs2_steal_inode_from_other_nodes(osb, *ac); status = ocfs2_steal_inode(osb, *ac);
atomic_inc(&osb->s_num_inodes_stolen); atomic_inc(&osb->s_num_inodes_stolen);
if (status < 0) { if (status < 0) {
if (status != -ENOSPC) if (status != -ENOSPC)
......
...@@ -56,6 +56,7 @@ struct ocfs2_alloc_context { ...@@ -56,6 +56,7 @@ struct ocfs2_alloc_context {
is the same as ~0 - unlimited */ is the same as ~0 - unlimited */
}; };
void ocfs2_init_steal_slots(struct ocfs2_super *osb);
void ocfs2_free_alloc_context(struct ocfs2_alloc_context *ac); void ocfs2_free_alloc_context(struct ocfs2_alloc_context *ac);
static inline int ocfs2_alloc_context_bits_left(struct ocfs2_alloc_context *ac) static inline int ocfs2_alloc_context_bits_left(struct ocfs2_alloc_context *ac)
{ {
......
...@@ -69,6 +69,7 @@ ...@@ -69,6 +69,7 @@
#include "xattr.h" #include "xattr.h"
#include "quota.h" #include "quota.h"
#include "refcounttree.h" #include "refcounttree.h"
#include "suballoc.h"
#include "buffer_head_io.h" #include "buffer_head_io.h"
...@@ -301,9 +302,12 @@ static int ocfs2_osb_dump(struct ocfs2_super *osb, char *buf, int len) ...@@ -301,9 +302,12 @@ static int ocfs2_osb_dump(struct ocfs2_super *osb, char *buf, int len)
spin_lock(&osb->osb_lock); spin_lock(&osb->osb_lock);
out += snprintf(buf + out, len - out, out += snprintf(buf + out, len - out,
"%10s => Slot: %d NumStolen: %d\n", "Steal", "%10s => InodeSlot: %d StolenInodes: %d, "
"MetaSlot: %d StolenMeta: %d\n", "Steal",
osb->s_inode_steal_slot, osb->s_inode_steal_slot,
atomic_read(&osb->s_num_inodes_stolen)); atomic_read(&osb->s_num_inodes_stolen),
osb->s_meta_steal_slot,
atomic_read(&osb->s_num_meta_stolen));
spin_unlock(&osb->osb_lock); spin_unlock(&osb->osb_lock);
out += snprintf(buf + out, len - out, "OrphanScan => "); out += snprintf(buf + out, len - out, "OrphanScan => ");
...@@ -1997,7 +2001,7 @@ static int ocfs2_initialize_super(struct super_block *sb, ...@@ -1997,7 +2001,7 @@ static int ocfs2_initialize_super(struct super_block *sb,
osb->blocked_lock_count = 0; osb->blocked_lock_count = 0;
spin_lock_init(&osb->osb_lock); spin_lock_init(&osb->osb_lock);
spin_lock_init(&osb->osb_xattr_lock); spin_lock_init(&osb->osb_xattr_lock);
ocfs2_init_inode_steal_slot(osb); ocfs2_init_steal_slots(osb);
atomic_set(&osb->alloc_stats.moves, 0); atomic_set(&osb->alloc_stats.moves, 0);
atomic_set(&osb->alloc_stats.local_data, 0); atomic_set(&osb->alloc_stats.local_data, 0);
......
This diff is collapsed.
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment