Commit 682c30ed authored by Linus Torvalds's avatar Linus Torvalds

Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/sage/ceph-client

* 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/sage/ceph-client: (39 commits)
  ceph: generalize mon requests, add pool op support
  ceph: only queue async writeback on cap revocation if there is dirty data
  ceph: do not ignore osd_idle_ttl mount option
  ceph: constify dentry_operations
  ceph: whitespace cleanup
  ceph: add flock/fcntl lock support
  ceph: define on-wire types, constants for file locking support
  ceph: add CEPH_FEATURE_FLOCK to the supported feature bits
  ceph: support v2 reconnect encoding
  ceph: support v2 client_caps encoding
  ceph: move AES iv definition to shared header
  ceph: fix decoding of pool snap info
  ceph: make ->sync_fs not wait if wait==0
  ceph: warn on missing snap realm
  ceph: print useful error message when crush rule not found
  ceph: use %pU to print uuid (fsid)
  ceph: sync header defs with server code
  ceph: clean up header guards
  ceph: strip misleading/obsolete version, feature info
  ceph: specify supported features in super.h
  ...
parents 84479f3c e56fa10e
...@@ -6,7 +6,7 @@ ifneq ($(KERNELRELEASE),) ...@@ -6,7 +6,7 @@ ifneq ($(KERNELRELEASE),)
obj-$(CONFIG_CEPH_FS) += ceph.o obj-$(CONFIG_CEPH_FS) += ceph.o
ceph-objs := super.o inode.o dir.o file.o addr.o ioctl.o \ ceph-objs := super.o inode.o dir.o file.o locks.o addr.o ioctl.o \
export.o caps.o snap.o xattr.o \ export.o caps.o snap.o xattr.o \
messenger.o msgpool.o buffer.o pagelist.o \ messenger.o msgpool.o buffer.o pagelist.o \
mds_client.o mdsmap.o \ mds_client.o mdsmap.o \
......
...@@ -309,7 +309,8 @@ static int ceph_readpages(struct file *file, struct address_space *mapping, ...@@ -309,7 +309,8 @@ static int ceph_readpages(struct file *file, struct address_space *mapping,
zero_user_segment(page, s, PAGE_CACHE_SIZE); zero_user_segment(page, s, PAGE_CACHE_SIZE);
} }
if (add_to_page_cache_lru(page, mapping, page->index, GFP_NOFS)) { if (add_to_page_cache_lru(page, mapping, page->index,
GFP_NOFS)) {
page_cache_release(page); page_cache_release(page);
dout("readpages %p add_to_page_cache failed %p\n", dout("readpages %p add_to_page_cache failed %p\n",
inode, page); inode, page);
...@@ -552,7 +553,7 @@ static void writepages_finish(struct ceph_osd_request *req, ...@@ -552,7 +553,7 @@ static void writepages_finish(struct ceph_osd_request *req,
* page truncation thread, possibly losing some data that * page truncation thread, possibly losing some data that
* raced its way in * raced its way in
*/ */
if ((issued & CEPH_CAP_FILE_CACHE) == 0) if ((issued & (CEPH_CAP_FILE_CACHE|CEPH_CAP_FILE_LAZYIO)) == 0)
generic_error_remove_page(inode->i_mapping, page); generic_error_remove_page(inode->i_mapping, page);
unlock_page(page); unlock_page(page);
...@@ -797,9 +798,12 @@ static int ceph_writepages_start(struct address_space *mapping, ...@@ -797,9 +798,12 @@ static int ceph_writepages_start(struct address_space *mapping,
dout("%p will write page %p idx %lu\n", dout("%p will write page %p idx %lu\n",
inode, page, page->index); inode, page, page->index);
writeback_stat = atomic_long_inc_return(&client->writeback_count); writeback_stat =
if (writeback_stat > CONGESTION_ON_THRESH(client->mount_args->congestion_kb)) { atomic_long_inc_return(&client->writeback_count);
set_bdi_congested(&client->backing_dev_info, BLK_RW_ASYNC); if (writeback_stat > CONGESTION_ON_THRESH(
client->mount_args->congestion_kb)) {
set_bdi_congested(&client->backing_dev_info,
BLK_RW_ASYNC);
} }
set_page_writeback(page); set_page_writeback(page);
...@@ -1036,7 +1040,7 @@ static int ceph_write_begin(struct file *file, struct address_space *mapping, ...@@ -1036,7 +1040,7 @@ static int ceph_write_begin(struct file *file, struct address_space *mapping,
*pagep = page; *pagep = page;
dout("write_begin file %p inode %p page %p %d~%d\n", file, dout("write_begin file %p inode %p page %p %d~%d\n", file,
inode, page, (int)pos, (int)len); inode, page, (int)pos, (int)len);
r = ceph_update_writeable_page(file, pos, len, page); r = ceph_update_writeable_page(file, pos, len, page);
} while (r == -EAGAIN); } while (r == -EAGAIN);
......
#include <linux/errno.h> #include <linux/errno.h>
int ceph_armor(char *dst, const char *src, const char *end);
int ceph_unarmor(char *dst, const char *src, const char *end);
/* /*
* base64 encode/decode. * base64 encode/decode.
*/ */
const char *pem_key = "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/"; static const char *pem_key =
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789+/";
static int encode_bits(int c) static int encode_bits(int c)
{ {
......
...@@ -20,7 +20,7 @@ static u32 supported_protocols[] = { ...@@ -20,7 +20,7 @@ static u32 supported_protocols[] = {
CEPH_AUTH_CEPHX CEPH_AUTH_CEPHX
}; };
int ceph_auth_init_protocol(struct ceph_auth_client *ac, int protocol) static int ceph_auth_init_protocol(struct ceph_auth_client *ac, int protocol)
{ {
switch (protocol) { switch (protocol) {
case CEPH_AUTH_NONE: case CEPH_AUTH_NONE:
...@@ -133,8 +133,8 @@ int ceph_auth_build_hello(struct ceph_auth_client *ac, void *buf, size_t len) ...@@ -133,8 +133,8 @@ int ceph_auth_build_hello(struct ceph_auth_client *ac, void *buf, size_t len)
return -ERANGE; return -ERANGE;
} }
int ceph_build_auth_request(struct ceph_auth_client *ac, static int ceph_build_auth_request(struct ceph_auth_client *ac,
void *msg_buf, size_t msg_len) void *msg_buf, size_t msg_len)
{ {
struct ceph_mon_request_header *monhdr = msg_buf; struct ceph_mon_request_header *monhdr = msg_buf;
void *p = monhdr + 1; void *p = monhdr + 1;
......
...@@ -87,8 +87,8 @@ static int ceph_x_decrypt(struct ceph_crypto_key *secret, ...@@ -87,8 +87,8 @@ static int ceph_x_decrypt(struct ceph_crypto_key *secret,
/* /*
* get existing (or insert new) ticket handler * get existing (or insert new) ticket handler
*/ */
struct ceph_x_ticket_handler *get_ticket_handler(struct ceph_auth_client *ac, static struct ceph_x_ticket_handler *
int service) get_ticket_handler(struct ceph_auth_client *ac, int service)
{ {
struct ceph_x_ticket_handler *th; struct ceph_x_ticket_handler *th;
struct ceph_x_info *xi = ac->private; struct ceph_x_info *xi = ac->private;
...@@ -429,7 +429,7 @@ static int ceph_x_build_request(struct ceph_auth_client *ac, ...@@ -429,7 +429,7 @@ static int ceph_x_build_request(struct ceph_auth_client *ac,
auth->struct_v = 1; auth->struct_v = 1;
auth->key = 0; auth->key = 0;
for (u = (u64 *)tmp_enc; u + 1 <= (u64 *)(tmp_enc + ret); u++) for (u = (u64 *)tmp_enc; u + 1 <= (u64 *)(tmp_enc + ret); u++)
auth->key ^= *u; auth->key ^= *(__le64 *)u;
dout(" server_challenge %llx client_challenge %llx key %llx\n", dout(" server_challenge %llx client_challenge %llx key %llx\n",
xi->server_challenge, le64_to_cpu(auth->client_challenge), xi->server_challenge, le64_to_cpu(auth->client_challenge),
le64_to_cpu(auth->key)); le64_to_cpu(auth->key));
......
...@@ -47,22 +47,6 @@ void ceph_buffer_release(struct kref *kref) ...@@ -47,22 +47,6 @@ void ceph_buffer_release(struct kref *kref)
kfree(b); kfree(b);
} }
int ceph_buffer_alloc(struct ceph_buffer *b, int len, gfp_t gfp)
{
b->vec.iov_base = kmalloc(len, gfp | __GFP_NOWARN);
if (b->vec.iov_base) {
b->is_vmalloc = false;
} else {
b->vec.iov_base = __vmalloc(len, gfp, PAGE_KERNEL);
b->is_vmalloc = true;
}
if (!b->vec.iov_base)
return -ENOMEM;
b->alloc_len = len;
b->vec.iov_len = len;
return 0;
}
int ceph_decode_buffer(struct ceph_buffer **b, void **p, void *end) int ceph_decode_buffer(struct ceph_buffer **b, void **p, void *end)
{ {
size_t len; size_t len;
......
This diff is collapsed.
#ifndef _FS_CEPH_FRAG_H #ifndef FS_CEPH_FRAG_H
#define _FS_CEPH_FRAG_H #define FS_CEPH_FRAG_H
/* /*
* "Frags" are a way to describe a subset of a 32-bit number space, * "Frags" are a way to describe a subset of a 32-bit number space,
......
...@@ -29,46 +29,44 @@ int ceph_file_layout_is_valid(const struct ceph_file_layout *layout) ...@@ -29,46 +29,44 @@ int ceph_file_layout_is_valid(const struct ceph_file_layout *layout)
int ceph_flags_to_mode(int flags) int ceph_flags_to_mode(int flags)
{ {
int mode;
#ifdef O_DIRECTORY /* fixme */ #ifdef O_DIRECTORY /* fixme */
if ((flags & O_DIRECTORY) == O_DIRECTORY) if ((flags & O_DIRECTORY) == O_DIRECTORY)
return CEPH_FILE_MODE_PIN; return CEPH_FILE_MODE_PIN;
#endif #endif
if ((flags & O_APPEND) == O_APPEND)
flags |= O_WRONLY;
if ((flags & O_ACCMODE) == O_RDWR)
mode = CEPH_FILE_MODE_RDWR;
else if ((flags & O_ACCMODE) == O_WRONLY)
mode = CEPH_FILE_MODE_WR;
else
mode = CEPH_FILE_MODE_RD;
#ifdef O_LAZY #ifdef O_LAZY
if (flags & O_LAZY) if (flags & O_LAZY)
return CEPH_FILE_MODE_LAZY; mode |= CEPH_FILE_MODE_LAZY;
#endif #endif
if ((flags & O_APPEND) == O_APPEND)
flags |= O_WRONLY;
flags &= O_ACCMODE; return mode;
if ((flags & O_RDWR) == O_RDWR)
return CEPH_FILE_MODE_RDWR;
if ((flags & O_WRONLY) == O_WRONLY)
return CEPH_FILE_MODE_WR;
return CEPH_FILE_MODE_RD;
} }
int ceph_caps_for_mode(int mode) int ceph_caps_for_mode(int mode)
{ {
switch (mode) { int caps = CEPH_CAP_PIN;
case CEPH_FILE_MODE_PIN:
return CEPH_CAP_PIN; if (mode & CEPH_FILE_MODE_RD)
case CEPH_FILE_MODE_RD: caps |= CEPH_CAP_FILE_SHARED |
return CEPH_CAP_PIN | CEPH_CAP_FILE_SHARED |
CEPH_CAP_FILE_RD | CEPH_CAP_FILE_CACHE; CEPH_CAP_FILE_RD | CEPH_CAP_FILE_CACHE;
case CEPH_FILE_MODE_RDWR: if (mode & CEPH_FILE_MODE_WR)
return CEPH_CAP_PIN | CEPH_CAP_FILE_SHARED | caps |= CEPH_CAP_FILE_EXCL |
CEPH_CAP_FILE_EXCL |
CEPH_CAP_FILE_RD | CEPH_CAP_FILE_CACHE |
CEPH_CAP_FILE_WR | CEPH_CAP_FILE_BUFFER |
CEPH_CAP_AUTH_SHARED | CEPH_CAP_AUTH_EXCL |
CEPH_CAP_XATTR_SHARED | CEPH_CAP_XATTR_EXCL;
case CEPH_FILE_MODE_WR:
return CEPH_CAP_PIN | CEPH_CAP_FILE_SHARED |
CEPH_CAP_FILE_EXCL |
CEPH_CAP_FILE_WR | CEPH_CAP_FILE_BUFFER | CEPH_CAP_FILE_WR | CEPH_CAP_FILE_BUFFER |
CEPH_CAP_AUTH_SHARED | CEPH_CAP_AUTH_EXCL | CEPH_CAP_AUTH_SHARED | CEPH_CAP_AUTH_EXCL |
CEPH_CAP_XATTR_SHARED | CEPH_CAP_XATTR_EXCL; CEPH_CAP_XATTR_SHARED | CEPH_CAP_XATTR_EXCL;
} if (mode & CEPH_FILE_MODE_LAZY)
return 0; caps |= CEPH_CAP_FILE_LAZYIO;
return caps;
} }
...@@ -9,26 +9,12 @@ ...@@ -9,26 +9,12 @@
* LGPL2 * LGPL2
*/ */
#ifndef _FS_CEPH_CEPH_FS_H #ifndef CEPH_FS_H
#define _FS_CEPH_CEPH_FS_H #define CEPH_FS_H
#include "msgr.h" #include "msgr.h"
#include "rados.h" #include "rados.h"
/*
* Ceph release version
*/
#define CEPH_VERSION_MAJOR 0
#define CEPH_VERSION_MINOR 20
#define CEPH_VERSION_PATCH 0
#define _CEPH_STRINGIFY(x) #x
#define CEPH_STRINGIFY(x) _CEPH_STRINGIFY(x)
#define CEPH_MAKE_VERSION(x, y, z) CEPH_STRINGIFY(x) "." CEPH_STRINGIFY(y) \
"." CEPH_STRINGIFY(z)
#define CEPH_VERSION CEPH_MAKE_VERSION(CEPH_VERSION_MAJOR, \
CEPH_VERSION_MINOR, CEPH_VERSION_PATCH)
/* /*
* subprotocol versions. when specific messages types or high-level * subprotocol versions. when specific messages types or high-level
* protocols change, bump the affected components. we keep rev * protocols change, bump the affected components. we keep rev
...@@ -53,18 +39,10 @@ ...@@ -53,18 +39,10 @@
/* /*
* feature bits * feature bits
*/ */
#define CEPH_FEATURE_UID 1 #define CEPH_FEATURE_UID (1<<0)
#define CEPH_FEATURE_NOSRCADDR 2 #define CEPH_FEATURE_NOSRCADDR (1<<1)
#define CEPH_FEATURE_FLOCK 4 #define CEPH_FEATURE_MONCLOCKCHECK (1<<2)
#define CEPH_FEATURE_FLOCK (1<<3)
#define CEPH_FEATURE_SUPPORTED_MON CEPH_FEATURE_UID|CEPH_FEATURE_NOSRCADDR
#define CEPH_FEATURE_REQUIRED_MON CEPH_FEATURE_UID
#define CEPH_FEATURE_SUPPORTED_MDS CEPH_FEATURE_UID|CEPH_FEATURE_NOSRCADDR|CEPH_FEATURE_FLOCK
#define CEPH_FEATURE_REQUIRED_MDS CEPH_FEATURE_UID
#define CEPH_FEATURE_SUPPORTED_OSD CEPH_FEATURE_UID|CEPH_FEATURE_NOSRCADDR
#define CEPH_FEATURE_REQUIRED_OSD CEPH_FEATURE_UID
#define CEPH_FEATURE_SUPPORTED_CLIENT CEPH_FEATURE_NOSRCADDR
#define CEPH_FEATURE_REQUIRED_CLIENT CEPH_FEATURE_NOSRCADDR
/* /*
...@@ -96,6 +74,8 @@ int ceph_file_layout_is_valid(const struct ceph_file_layout *layout); ...@@ -96,6 +74,8 @@ int ceph_file_layout_is_valid(const struct ceph_file_layout *layout);
#define CEPH_CRYPTO_NONE 0x0 #define CEPH_CRYPTO_NONE 0x0
#define CEPH_CRYPTO_AES 0x1 #define CEPH_CRYPTO_AES 0x1
#define CEPH_AES_IV "cephsageyudagreg"
/* security/authentication protocols */ /* security/authentication protocols */
#define CEPH_AUTH_UNKNOWN 0x0 #define CEPH_AUTH_UNKNOWN 0x0
#define CEPH_AUTH_NONE 0x1 #define CEPH_AUTH_NONE 0x1
...@@ -275,6 +255,7 @@ extern const char *ceph_mds_state_name(int s); ...@@ -275,6 +255,7 @@ extern const char *ceph_mds_state_name(int s);
#define CEPH_LOCK_IDFT 512 /* dir frag tree */ #define CEPH_LOCK_IDFT 512 /* dir frag tree */
#define CEPH_LOCK_INEST 1024 /* mds internal */ #define CEPH_LOCK_INEST 1024 /* mds internal */
#define CEPH_LOCK_IXATTR 2048 #define CEPH_LOCK_IXATTR 2048
#define CEPH_LOCK_IFLOCK 4096 /* advisory file locks */
#define CEPH_LOCK_INO 8192 /* immutable inode bits; not a lock */ #define CEPH_LOCK_INO 8192 /* immutable inode bits; not a lock */
/* client_session ops */ /* client_session ops */
...@@ -316,6 +297,8 @@ enum { ...@@ -316,6 +297,8 @@ enum {
CEPH_MDS_OP_RMXATTR = 0x01106, CEPH_MDS_OP_RMXATTR = 0x01106,
CEPH_MDS_OP_SETLAYOUT = 0x01107, CEPH_MDS_OP_SETLAYOUT = 0x01107,
CEPH_MDS_OP_SETATTR = 0x01108, CEPH_MDS_OP_SETATTR = 0x01108,
CEPH_MDS_OP_SETFILELOCK= 0x01109,
CEPH_MDS_OP_GETFILELOCK= 0x00110,
CEPH_MDS_OP_MKNOD = 0x01201, CEPH_MDS_OP_MKNOD = 0x01201,
CEPH_MDS_OP_LINK = 0x01202, CEPH_MDS_OP_LINK = 0x01202,
...@@ -386,6 +369,15 @@ union ceph_mds_request_args { ...@@ -386,6 +369,15 @@ union ceph_mds_request_args {
struct { struct {
struct ceph_file_layout layout; struct ceph_file_layout layout;
} __attribute__ ((packed)) setlayout; } __attribute__ ((packed)) setlayout;
struct {
__u8 rule; /* currently fcntl or flock */
__u8 type; /* shared, exclusive, remove*/
__le64 pid; /* process id requesting the lock */
__le64 pid_namespace;
__le64 start; /* initial location to lock */
__le64 length; /* num bytes to lock from start */
__u8 wait; /* will caller wait for lock to become available? */
} __attribute__ ((packed)) filelock_change;
} __attribute__ ((packed)); } __attribute__ ((packed));
#define CEPH_MDS_FLAG_REPLAY 1 /* this is a replayed op */ #define CEPH_MDS_FLAG_REPLAY 1 /* this is a replayed op */
...@@ -480,6 +472,23 @@ struct ceph_mds_reply_dirfrag { ...@@ -480,6 +472,23 @@ struct ceph_mds_reply_dirfrag {
__le32 dist[]; __le32 dist[];
} __attribute__ ((packed)); } __attribute__ ((packed));
#define CEPH_LOCK_FCNTL 1
#define CEPH_LOCK_FLOCK 2
#define CEPH_LOCK_SHARED 1
#define CEPH_LOCK_EXCL 2
#define CEPH_LOCK_UNLOCK 4
struct ceph_filelock {
__le64 start;/* file offset to start lock at */
__le64 length; /* num bytes to lock; 0 for all following start */
__le64 client; /* which client holds the lock */
__le64 pid; /* process id holding the lock on the client */
__le64 pid_namespace;
__u8 type; /* shared lock, exclusive lock, or unlock */
} __attribute__ ((packed));
/* file access modes */ /* file access modes */
#define CEPH_FILE_MODE_PIN 0 #define CEPH_FILE_MODE_PIN 0
#define CEPH_FILE_MODE_RD 1 #define CEPH_FILE_MODE_RD 1
...@@ -508,9 +517,10 @@ int ceph_flags_to_mode(int flags); ...@@ -508,9 +517,10 @@ int ceph_flags_to_mode(int flags);
#define CEPH_CAP_SAUTH 2 #define CEPH_CAP_SAUTH 2
#define CEPH_CAP_SLINK 4 #define CEPH_CAP_SLINK 4
#define CEPH_CAP_SXATTR 6 #define CEPH_CAP_SXATTR 6
#define CEPH_CAP_SFILE 8 /* goes at the end (uses >2 cap bits) */ #define CEPH_CAP_SFILE 8
#define CEPH_CAP_SFLOCK 20
#define CEPH_CAP_BITS 16 #define CEPH_CAP_BITS 22
/* composed values */ /* composed values */
#define CEPH_CAP_AUTH_SHARED (CEPH_CAP_GSHARED << CEPH_CAP_SAUTH) #define CEPH_CAP_AUTH_SHARED (CEPH_CAP_GSHARED << CEPH_CAP_SAUTH)
...@@ -528,6 +538,9 @@ int ceph_flags_to_mode(int flags); ...@@ -528,6 +538,9 @@ int ceph_flags_to_mode(int flags);
#define CEPH_CAP_FILE_BUFFER (CEPH_CAP_GBUFFER << CEPH_CAP_SFILE) #define CEPH_CAP_FILE_BUFFER (CEPH_CAP_GBUFFER << CEPH_CAP_SFILE)
#define CEPH_CAP_FILE_WREXTEND (CEPH_CAP_GWREXTEND << CEPH_CAP_SFILE) #define CEPH_CAP_FILE_WREXTEND (CEPH_CAP_GWREXTEND << CEPH_CAP_SFILE)
#define CEPH_CAP_FILE_LAZYIO (CEPH_CAP_GLAZYIO << CEPH_CAP_SFILE) #define CEPH_CAP_FILE_LAZYIO (CEPH_CAP_GLAZYIO << CEPH_CAP_SFILE)
#define CEPH_CAP_FLOCK_SHARED (CEPH_CAP_GSHARED << CEPH_CAP_SFLOCK)
#define CEPH_CAP_FLOCK_EXCL (CEPH_CAP_GEXCL << CEPH_CAP_SFLOCK)
/* cap masks (for getattr) */ /* cap masks (for getattr) */
#define CEPH_STAT_CAP_INODE CEPH_CAP_PIN #define CEPH_STAT_CAP_INODE CEPH_CAP_PIN
...@@ -563,7 +576,8 @@ int ceph_flags_to_mode(int flags); ...@@ -563,7 +576,8 @@ int ceph_flags_to_mode(int flags);
CEPH_CAP_FILE_EXCL) CEPH_CAP_FILE_EXCL)
#define CEPH_CAP_ANY_WR (CEPH_CAP_ANY_EXCL | CEPH_CAP_ANY_FILE_WR) #define CEPH_CAP_ANY_WR (CEPH_CAP_ANY_EXCL | CEPH_CAP_ANY_FILE_WR)
#define CEPH_CAP_ANY (CEPH_CAP_ANY_RD | CEPH_CAP_ANY_EXCL | \ #define CEPH_CAP_ANY (CEPH_CAP_ANY_RD | CEPH_CAP_ANY_EXCL | \
CEPH_CAP_ANY_FILE_WR | CEPH_CAP_PIN) CEPH_CAP_ANY_FILE_WR | CEPH_CAP_FILE_LAZYIO | \
CEPH_CAP_PIN)
#define CEPH_CAP_LOCKS (CEPH_LOCK_IFILE | CEPH_LOCK_IAUTH | CEPH_LOCK_ILINK | \ #define CEPH_CAP_LOCKS (CEPH_LOCK_IFILE | CEPH_LOCK_IAUTH | CEPH_LOCK_ILINK | \
CEPH_LOCK_IXATTR) CEPH_LOCK_IXATTR)
...@@ -650,6 +664,16 @@ struct ceph_mds_lease { ...@@ -650,6 +664,16 @@ struct ceph_mds_lease {
/* client reconnect */ /* client reconnect */
struct ceph_mds_cap_reconnect { struct ceph_mds_cap_reconnect {
__le64 cap_id;
__le32 wanted;
__le32 issued;
__le64 snaprealm;
__le64 pathbase; /* base ino for our path to this ino */
__le32 flock_len; /* size of flock state blob, if any */
} __attribute__ ((packed));
/* followed by flock blob */
struct ceph_mds_cap_reconnect_v1 {
__le64 cap_id; __le64 cap_id;
__le32 wanted; __le32 wanted;
__le32 issued; __le32 issued;
...@@ -658,7 +682,6 @@ struct ceph_mds_cap_reconnect { ...@@ -658,7 +682,6 @@ struct ceph_mds_cap_reconnect {
__le64 snaprealm; __le64 snaprealm;
__le64 pathbase; /* base ino for our path to this ino */ __le64 pathbase; /* base ino for our path to this ino */
} __attribute__ ((packed)); } __attribute__ ((packed));
/* followed by encoded string */
struct ceph_mds_snaprealm_reconnect { struct ceph_mds_snaprealm_reconnect {
__le64 ino; /* snap realm base */ __le64 ino; /* snap realm base */
......
#ifndef _FS_CEPH_HASH_H #ifndef FS_CEPH_HASH_H
#define _FS_CEPH_HASH_H #define FS_CEPH_HASH_H
#define CEPH_STR_HASH_LINUX 0x1 /* linux dcache hash */ #define CEPH_STR_HASH_LINUX 0x1 /* linux dcache hash */
#define CEPH_STR_HASH_RJENKINS 0x2 /* robert jenkins' */ #define CEPH_STR_HASH_RJENKINS 0x2 /* robert jenkins' */
......
...@@ -28,6 +28,7 @@ const char *ceph_osd_op_name(int op) ...@@ -28,6 +28,7 @@ const char *ceph_osd_op_name(int op)
case CEPH_OSD_OP_TRUNCATE: return "truncate"; case CEPH_OSD_OP_TRUNCATE: return "truncate";
case CEPH_OSD_OP_ZERO: return "zero"; case CEPH_OSD_OP_ZERO: return "zero";
case CEPH_OSD_OP_WRITEFULL: return "writefull"; case CEPH_OSD_OP_WRITEFULL: return "writefull";
case CEPH_OSD_OP_ROLLBACK: return "rollback";
case CEPH_OSD_OP_APPEND: return "append"; case CEPH_OSD_OP_APPEND: return "append";
case CEPH_OSD_OP_STARTSYNC: return "startsync"; case CEPH_OSD_OP_STARTSYNC: return "startsync";
...@@ -129,6 +130,8 @@ const char *ceph_mds_op_name(int op) ...@@ -129,6 +130,8 @@ const char *ceph_mds_op_name(int op)
case CEPH_MDS_OP_LSSNAP: return "lssnap"; case CEPH_MDS_OP_LSSNAP: return "lssnap";
case CEPH_MDS_OP_MKSNAP: return "mksnap"; case CEPH_MDS_OP_MKSNAP: return "mksnap";
case CEPH_MDS_OP_RMSNAP: return "rmsnap"; case CEPH_MDS_OP_RMSNAP: return "rmsnap";
case CEPH_MDS_OP_SETFILELOCK: return "setfilelock";
case CEPH_MDS_OP_GETFILELOCK: return "getfilelock";
} }
return "???"; return "???";
} }
......
#ifndef _CRUSH_CRUSH_H #ifndef CEPH_CRUSH_CRUSH_H
#define _CRUSH_CRUSH_H #define CEPH_CRUSH_CRUSH_H
#include <linux/types.h> #include <linux/types.h>
......
#ifndef _CRUSH_HASH_H #ifndef CEPH_CRUSH_HASH_H
#define _CRUSH_HASH_H #define CEPH_CRUSH_HASH_H
#define CRUSH_HASH_RJENKINS1 0 #define CRUSH_HASH_RJENKINS1 0
......
#ifndef _CRUSH_MAPPER_H #ifndef CEPH_CRUSH_MAPPER_H
#define _CRUSH_MAPPER_H #define CEPH_CRUSH_MAPPER_H
/* /*
* CRUSH functions for find rules and then mapping an input to an * CRUSH functions for find rules and then mapping an input to an
......
...@@ -75,10 +75,11 @@ static struct crypto_blkcipher *ceph_crypto_alloc_cipher(void) ...@@ -75,10 +75,11 @@ static struct crypto_blkcipher *ceph_crypto_alloc_cipher(void)
return crypto_alloc_blkcipher("cbc(aes)", 0, CRYPTO_ALG_ASYNC); return crypto_alloc_blkcipher("cbc(aes)", 0, CRYPTO_ALG_ASYNC);
} }
const u8 *aes_iv = "cephsageyudagreg"; static const u8 *aes_iv = (u8 *)CEPH_AES_IV;
int ceph_aes_encrypt(const void *key, int key_len, void *dst, size_t *dst_len, static int ceph_aes_encrypt(const void *key, int key_len,
const void *src, size_t src_len) void *dst, size_t *dst_len,
const void *src, size_t src_len)
{ {
struct scatterlist sg_in[2], sg_out[1]; struct scatterlist sg_in[2], sg_out[1];
struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher(); struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher();
...@@ -126,9 +127,10 @@ int ceph_aes_encrypt(const void *key, int key_len, void *dst, size_t *dst_len, ...@@ -126,9 +127,10 @@ int ceph_aes_encrypt(const void *key, int key_len, void *dst, size_t *dst_len,
return 0; return 0;
} }
int ceph_aes_encrypt2(const void *key, int key_len, void *dst, size_t *dst_len, static int ceph_aes_encrypt2(const void *key, int key_len, void *dst,
const void *src1, size_t src1_len, size_t *dst_len,
const void *src2, size_t src2_len) const void *src1, size_t src1_len,
const void *src2, size_t src2_len)
{ {
struct scatterlist sg_in[3], sg_out[1]; struct scatterlist sg_in[3], sg_out[1];
struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher(); struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher();
...@@ -179,8 +181,9 @@ int ceph_aes_encrypt2(const void *key, int key_len, void *dst, size_t *dst_len, ...@@ -179,8 +181,9 @@ int ceph_aes_encrypt2(const void *key, int key_len, void *dst, size_t *dst_len,
return 0; return 0;
} }
int ceph_aes_decrypt(const void *key, int key_len, void *dst, size_t *dst_len, static int ceph_aes_decrypt(const void *key, int key_len,
const void *src, size_t src_len) void *dst, size_t *dst_len,
const void *src, size_t src_len)
{ {
struct scatterlist sg_in[1], sg_out[2]; struct scatterlist sg_in[1], sg_out[2];
struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher(); struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher();
...@@ -238,10 +241,10 @@ int ceph_aes_decrypt(const void *key, int key_len, void *dst, size_t *dst_len, ...@@ -238,10 +241,10 @@ int ceph_aes_decrypt(const void *key, int key_len, void *dst, size_t *dst_len,
return 0; return 0;
} }
int ceph_aes_decrypt2(const void *key, int key_len, static int ceph_aes_decrypt2(const void *key, int key_len,
void *dst1, size_t *dst1_len, void *dst1, size_t *dst1_len,
void *dst2, size_t *dst2_len, void *dst2, size_t *dst2_len,
const void *src, size_t src_len) const void *src, size_t src_len)
{ {
struct scatterlist sg_in[1], sg_out[3]; struct scatterlist sg_in[1], sg_out[3];
struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher(); struct crypto_blkcipher *tfm = ceph_crypto_alloc_cipher();
......
...@@ -42,7 +42,7 @@ extern int ceph_encrypt2(struct ceph_crypto_key *secret, ...@@ -42,7 +42,7 @@ extern int ceph_encrypt2(struct ceph_crypto_key *secret,
const void *src2, size_t src2_len); const void *src2, size_t src2_len);
/* armor.c */ /* armor.c */
extern int ceph_armor(char *dst, const void *src, const void *end); extern int ceph_armor(char *dst, const char *src, const char *end);
extern int ceph_unarmor(void *dst, const char *src, const char *end); extern int ceph_unarmor(char *dst, const char *src, const char *end);
#endif #endif
...@@ -291,7 +291,7 @@ static int dentry_lru_show(struct seq_file *s, void *ptr) ...@@ -291,7 +291,7 @@ static int dentry_lru_show(struct seq_file *s, void *ptr)
return 0; return 0;
} }
#define DEFINE_SHOW_FUNC(name) \ #define DEFINE_SHOW_FUNC(name) \
static int name##_open(struct inode *inode, struct file *file) \ static int name##_open(struct inode *inode, struct file *file) \
{ \ { \
struct seq_file *sf; \ struct seq_file *sf; \
...@@ -361,8 +361,8 @@ int ceph_debugfs_client_init(struct ceph_client *client) ...@@ -361,8 +361,8 @@ int ceph_debugfs_client_init(struct ceph_client *client)
int ret = 0; int ret = 0;
char name[80]; char name[80];
snprintf(name, sizeof(name), FSID_FORMAT ".client%lld", snprintf(name, sizeof(name), "%pU.client%lld", &client->fsid,
PR_FSID(&client->fsid), client->monc.auth->global_id); client->monc.auth->global_id);
client->debugfs_dir = debugfs_create_dir(name, ceph_debugfs_dir); client->debugfs_dir = debugfs_create_dir(name, ceph_debugfs_dir);
if (!client->debugfs_dir) if (!client->debugfs_dir)
...@@ -432,11 +432,12 @@ int ceph_debugfs_client_init(struct ceph_client *client) ...@@ -432,11 +432,12 @@ int ceph_debugfs_client_init(struct ceph_client *client)
if (!client->debugfs_caps) if (!client->debugfs_caps)
goto out; goto out;
client->debugfs_congestion_kb = debugfs_create_file("writeback_congestion_kb", client->debugfs_congestion_kb =
0600, debugfs_create_file("writeback_congestion_kb",
client->debugfs_dir, 0600,
client, client->debugfs_dir,
&congestion_kb_fops); client,
&congestion_kb_fops);
if (!client->debugfs_congestion_kb) if (!client->debugfs_congestion_kb)
goto out; goto out;
...@@ -466,7 +467,7 @@ void ceph_debugfs_client_cleanup(struct ceph_client *client) ...@@ -466,7 +467,7 @@ void ceph_debugfs_client_cleanup(struct ceph_client *client)
debugfs_remove(client->debugfs_dir); debugfs_remove(client->debugfs_dir);
} }
#else // CONFIG_DEBUG_FS #else /* CONFIG_DEBUG_FS */
int __init ceph_debugfs_init(void) int __init ceph_debugfs_init(void)
{ {
...@@ -486,4 +487,4 @@ void ceph_debugfs_client_cleanup(struct ceph_client *client) ...@@ -486,4 +487,4 @@ void ceph_debugfs_client_cleanup(struct ceph_client *client)
{ {
} }
#endif // CONFIG_DEBUG_FS #endif /* CONFIG_DEBUG_FS */
...@@ -99,11 +99,13 @@ static inline void ceph_encode_timespec(struct ceph_timespec *tv, ...@@ -99,11 +99,13 @@ static inline void ceph_encode_timespec(struct ceph_timespec *tv,
*/ */
static inline void ceph_encode_addr(struct ceph_entity_addr *a) static inline void ceph_encode_addr(struct ceph_entity_addr *a)
{ {
a->in_addr.ss_family = htons(a->in_addr.ss_family); __be16 ss_family = htons(a->in_addr.ss_family);
a->in_addr.ss_family = *(__u16 *)&ss_family;
} }
static inline void ceph_decode_addr(struct ceph_entity_addr *a) static inline void ceph_decode_addr(struct ceph_entity_addr *a)
{ {
a->in_addr.ss_family = ntohs(a->in_addr.ss_family); __be16 ss_family = *(__be16 *)&a->in_addr.ss_family;
a->in_addr.ss_family = ntohs(ss_family);
WARN_ON(a->in_addr.ss_family == 512); WARN_ON(a->in_addr.ss_family == 512);
} }
......
...@@ -27,7 +27,7 @@ ...@@ -27,7 +27,7 @@
const struct inode_operations ceph_dir_iops; const struct inode_operations ceph_dir_iops;
const struct file_operations ceph_dir_fops; const struct file_operations ceph_dir_fops;
struct dentry_operations ceph_dentry_ops; const struct dentry_operations ceph_dentry_ops;
/* /*
* Initialize ceph dentry state. * Initialize ceph dentry state.
...@@ -94,6 +94,8 @@ static unsigned fpos_off(loff_t p) ...@@ -94,6 +94,8 @@ static unsigned fpos_off(loff_t p)
*/ */
static int __dcache_readdir(struct file *filp, static int __dcache_readdir(struct file *filp,
void *dirent, filldir_t filldir) void *dirent, filldir_t filldir)
__releases(inode->i_lock)
__acquires(inode->i_lock)
{ {
struct inode *inode = filp->f_dentry->d_inode; struct inode *inode = filp->f_dentry->d_inode;
struct ceph_file_info *fi = filp->private_data; struct ceph_file_info *fi = filp->private_data;
...@@ -1239,16 +1241,16 @@ const struct inode_operations ceph_dir_iops = { ...@@ -1239,16 +1241,16 @@ const struct inode_operations ceph_dir_iops = {
.create = ceph_create, .create = ceph_create,
}; };
struct dentry_operations ceph_dentry_ops = { const struct dentry_operations ceph_dentry_ops = {
.d_revalidate = ceph_d_revalidate, .d_revalidate = ceph_d_revalidate,
.d_release = ceph_dentry_release, .d_release = ceph_dentry_release,
}; };
struct dentry_operations ceph_snapdir_dentry_ops = { const struct dentry_operations ceph_snapdir_dentry_ops = {
.d_revalidate = ceph_snapdir_d_revalidate, .d_revalidate = ceph_snapdir_d_revalidate,
.d_release = ceph_dentry_release, .d_release = ceph_dentry_release,
}; };
struct dentry_operations ceph_snap_dentry_ops = { const struct dentry_operations ceph_snap_dentry_ops = {
.d_release = ceph_dentry_release, .d_release = ceph_dentry_release,
}; };
...@@ -317,7 +317,7 @@ void ceph_release_page_vector(struct page **pages, int num_pages) ...@@ -317,7 +317,7 @@ void ceph_release_page_vector(struct page **pages, int num_pages)
/* /*
* allocate a vector new pages * allocate a vector new pages
*/ */
struct page **ceph_alloc_page_vector(int num_pages, gfp_t flags) static struct page **ceph_alloc_page_vector(int num_pages, gfp_t flags)
{ {
struct page **pages; struct page **pages;
int i; int i;
...@@ -665,7 +665,7 @@ static ssize_t ceph_sync_write(struct file *file, const char __user *data, ...@@ -665,7 +665,7 @@ static ssize_t ceph_sync_write(struct file *file, const char __user *data,
* throw out any page cache pages in this range. this * throw out any page cache pages in this range. this
* may block. * may block.
*/ */
truncate_inode_pages_range(inode->i_mapping, pos, truncate_inode_pages_range(inode->i_mapping, pos,
(pos+len) | (PAGE_CACHE_SIZE-1)); (pos+len) | (PAGE_CACHE_SIZE-1));
} else { } else {
pages = ceph_alloc_page_vector(num_pages, GFP_NOFS); pages = ceph_alloc_page_vector(num_pages, GFP_NOFS);
...@@ -740,28 +740,32 @@ static ssize_t ceph_aio_read(struct kiocb *iocb, const struct iovec *iov, ...@@ -740,28 +740,32 @@ static ssize_t ceph_aio_read(struct kiocb *iocb, const struct iovec *iov,
unsigned long nr_segs, loff_t pos) unsigned long nr_segs, loff_t pos)
{ {
struct file *filp = iocb->ki_filp; struct file *filp = iocb->ki_filp;
struct ceph_file_info *fi = filp->private_data;
loff_t *ppos = &iocb->ki_pos; loff_t *ppos = &iocb->ki_pos;
size_t len = iov->iov_len; size_t len = iov->iov_len;
struct inode *inode = filp->f_dentry->d_inode; struct inode *inode = filp->f_dentry->d_inode;
struct ceph_inode_info *ci = ceph_inode(inode); struct ceph_inode_info *ci = ceph_inode(inode);
void *base = iov->iov_base; void __user *base = iov->iov_base;
ssize_t ret; ssize_t ret;
int got = 0; int want, got = 0;
int checkeof = 0, read = 0; int checkeof = 0, read = 0;
dout("aio_read %p %llx.%llx %llu~%u trying to get caps on %p\n", dout("aio_read %p %llx.%llx %llu~%u trying to get caps on %p\n",
inode, ceph_vinop(inode), pos, (unsigned)len, inode); inode, ceph_vinop(inode), pos, (unsigned)len, inode);
again: again:
__ceph_do_pending_vmtruncate(inode); __ceph_do_pending_vmtruncate(inode);
ret = ceph_get_caps(ci, CEPH_CAP_FILE_RD, CEPH_CAP_FILE_CACHE, if (fi->fmode & CEPH_FILE_MODE_LAZY)
&got, -1); want = CEPH_CAP_FILE_CACHE | CEPH_CAP_FILE_LAZYIO;
else
want = CEPH_CAP_FILE_CACHE;
ret = ceph_get_caps(ci, CEPH_CAP_FILE_RD, want, &got, -1);
if (ret < 0) if (ret < 0)
goto out; goto out;
dout("aio_read %p %llx.%llx %llu~%u got cap refs on %s\n", dout("aio_read %p %llx.%llx %llu~%u got cap refs on %s\n",
inode, ceph_vinop(inode), pos, (unsigned)len, inode, ceph_vinop(inode), pos, (unsigned)len,
ceph_cap_string(got)); ceph_cap_string(got));
if ((got & CEPH_CAP_FILE_CACHE) == 0 || if ((got & (CEPH_CAP_FILE_CACHE|CEPH_CAP_FILE_LAZYIO)) == 0 ||
(iocb->ki_filp->f_flags & O_DIRECT) || (iocb->ki_filp->f_flags & O_DIRECT) ||
(inode->i_sb->s_flags & MS_SYNCHRONOUS)) (inode->i_sb->s_flags & MS_SYNCHRONOUS))
/* hmm, this isn't really async... */ /* hmm, this isn't really async... */
...@@ -807,11 +811,12 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov, ...@@ -807,11 +811,12 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov,
unsigned long nr_segs, loff_t pos) unsigned long nr_segs, loff_t pos)
{ {
struct file *file = iocb->ki_filp; struct file *file = iocb->ki_filp;
struct ceph_file_info *fi = file->private_data;
struct inode *inode = file->f_dentry->d_inode; struct inode *inode = file->f_dentry->d_inode;
struct ceph_inode_info *ci = ceph_inode(inode); struct ceph_inode_info *ci = ceph_inode(inode);
struct ceph_osd_client *osdc = &ceph_sb_to_client(inode->i_sb)->osdc; struct ceph_osd_client *osdc = &ceph_sb_to_client(inode->i_sb)->osdc;
loff_t endoff = pos + iov->iov_len; loff_t endoff = pos + iov->iov_len;
int got = 0; int want, got = 0;
int ret, err; int ret, err;
if (ceph_snap(inode) != CEPH_NOSNAP) if (ceph_snap(inode) != CEPH_NOSNAP)
...@@ -824,8 +829,11 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov, ...@@ -824,8 +829,11 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov,
dout("aio_write %p %llx.%llx %llu~%u getting caps. i_size %llu\n", dout("aio_write %p %llx.%llx %llu~%u getting caps. i_size %llu\n",
inode, ceph_vinop(inode), pos, (unsigned)iov->iov_len, inode, ceph_vinop(inode), pos, (unsigned)iov->iov_len,
inode->i_size); inode->i_size);
ret = ceph_get_caps(ci, CEPH_CAP_FILE_WR, CEPH_CAP_FILE_BUFFER, if (fi->fmode & CEPH_FILE_MODE_LAZY)
&got, endoff); want = CEPH_CAP_FILE_BUFFER | CEPH_CAP_FILE_LAZYIO;
else
want = CEPH_CAP_FILE_BUFFER;
ret = ceph_get_caps(ci, CEPH_CAP_FILE_WR, want, &got, endoff);
if (ret < 0) if (ret < 0)
goto out; goto out;
...@@ -833,7 +841,7 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov, ...@@ -833,7 +841,7 @@ static ssize_t ceph_aio_write(struct kiocb *iocb, const struct iovec *iov,
inode, ceph_vinop(inode), pos, (unsigned)iov->iov_len, inode, ceph_vinop(inode), pos, (unsigned)iov->iov_len,
ceph_cap_string(got)); ceph_cap_string(got));
if ((got & CEPH_CAP_FILE_BUFFER) == 0 || if ((got & (CEPH_CAP_FILE_BUFFER|CEPH_CAP_FILE_LAZYIO)) == 0 ||
(iocb->ki_filp->f_flags & O_DIRECT) || (iocb->ki_filp->f_flags & O_DIRECT) ||
(inode->i_sb->s_flags & MS_SYNCHRONOUS)) { (inode->i_sb->s_flags & MS_SYNCHRONOUS)) {
ret = ceph_sync_write(file, iov->iov_base, iov->iov_len, ret = ceph_sync_write(file, iov->iov_base, iov->iov_len,
...@@ -930,6 +938,8 @@ const struct file_operations ceph_file_fops = { ...@@ -930,6 +938,8 @@ const struct file_operations ceph_file_fops = {
.aio_write = ceph_aio_write, .aio_write = ceph_aio_write,
.mmap = ceph_mmap, .mmap = ceph_mmap,
.fsync = ceph_fsync, .fsync = ceph_fsync,
.lock = ceph_lock,
.flock = ceph_flock,
.splice_read = generic_file_splice_read, .splice_read = generic_file_splice_read,
.splice_write = generic_file_splice_write, .splice_write = generic_file_splice_write,
.unlocked_ioctl = ceph_ioctl, .unlocked_ioctl = ceph_ioctl,
......
...@@ -442,8 +442,9 @@ int ceph_fill_file_size(struct inode *inode, int issued, ...@@ -442,8 +442,9 @@ int ceph_fill_file_size(struct inode *inode, int issued,
* the file is either opened or mmaped * the file is either opened or mmaped
*/ */
if ((issued & (CEPH_CAP_FILE_CACHE|CEPH_CAP_FILE_RD| if ((issued & (CEPH_CAP_FILE_CACHE|CEPH_CAP_FILE_RD|
CEPH_CAP_FILE_WR|CEPH_CAP_FILE_BUFFER| CEPH_CAP_FILE_WR|CEPH_CAP_FILE_BUFFER|
CEPH_CAP_FILE_EXCL)) || CEPH_CAP_FILE_EXCL|
CEPH_CAP_FILE_LAZYIO)) ||
mapping_mapped(inode->i_mapping) || mapping_mapped(inode->i_mapping) ||
__ceph_caps_file_wanted(ci)) { __ceph_caps_file_wanted(ci)) {
ci->i_truncate_pending++; ci->i_truncate_pending++;
......
...@@ -143,6 +143,27 @@ static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg) ...@@ -143,6 +143,27 @@ static long ceph_ioctl_get_dataloc(struct file *file, void __user *arg)
return 0; return 0;
} }
static long ceph_ioctl_lazyio(struct file *file)
{
struct ceph_file_info *fi = file->private_data;
struct inode *inode = file->f_dentry->d_inode;
struct ceph_inode_info *ci = ceph_inode(inode);
if ((fi->fmode & CEPH_FILE_MODE_LAZY) == 0) {
spin_lock(&inode->i_lock);
ci->i_nr_by_mode[fi->fmode]--;
fi->fmode |= CEPH_FILE_MODE_LAZY;
ci->i_nr_by_mode[fi->fmode]++;
spin_unlock(&inode->i_lock);
dout("ioctl_layzio: file %p marked lazy\n", file);
ceph_check_caps(ci, 0, NULL);
} else {
dout("ioctl_layzio: file %p already lazy\n", file);
}
return 0;
}
long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg) long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
{ {
dout("ioctl file %p cmd %u arg %lu\n", file, cmd, arg); dout("ioctl file %p cmd %u arg %lu\n", file, cmd, arg);
...@@ -155,6 +176,9 @@ long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg) ...@@ -155,6 +176,9 @@ long ceph_ioctl(struct file *file, unsigned int cmd, unsigned long arg)
case CEPH_IOC_GET_DATALOC: case CEPH_IOC_GET_DATALOC:
return ceph_ioctl_get_dataloc(file, (void __user *)arg); return ceph_ioctl_get_dataloc(file, (void __user *)arg);
case CEPH_IOC_LAZYIO:
return ceph_ioctl_lazyio(file);
} }
return -ENOTTY; return -ENOTTY;
} }
...@@ -37,4 +37,6 @@ struct ceph_ioctl_dataloc { ...@@ -37,4 +37,6 @@ struct ceph_ioctl_dataloc {
#define CEPH_IOC_GET_DATALOC _IOWR(CEPH_IOCTL_MAGIC, 3, \ #define CEPH_IOC_GET_DATALOC _IOWR(CEPH_IOCTL_MAGIC, 3, \
struct ceph_ioctl_dataloc) struct ceph_ioctl_dataloc)
#define CEPH_IOC_LAZYIO _IO(CEPH_IOCTL_MAGIC, 4)
#endif #endif
#include "ceph_debug.h"
#include <linux/file.h>
#include <linux/namei.h>
#include "super.h"
#include "mds_client.h"
#include "pagelist.h"
/**
* Implement fcntl and flock locking functions.
*/
static int ceph_lock_message(u8 lock_type, u16 operation, struct file *file,
u64 pid, u64 pid_ns,
int cmd, u64 start, u64 length, u8 wait)
{
struct inode *inode = file->f_dentry->d_inode;
struct ceph_mds_client *mdsc =
&ceph_sb_to_client(inode->i_sb)->mdsc;
struct ceph_mds_request *req;
int err;
req = ceph_mdsc_create_request(mdsc, operation, USE_AUTH_MDS);
if (IS_ERR(req))
return PTR_ERR(req);
req->r_inode = igrab(inode);
dout("ceph_lock_message: rule: %d, op: %d, pid: %llu, start: %llu, "
"length: %llu, wait: %d, type`: %d", (int)lock_type,
(int)operation, pid, start, length, wait, cmd);
req->r_args.filelock_change.rule = lock_type;
req->r_args.filelock_change.type = cmd;
req->r_args.filelock_change.pid = cpu_to_le64(pid);
/* This should be adjusted, but I'm not sure if
namespaces actually get id numbers*/
req->r_args.filelock_change.pid_namespace =
cpu_to_le64((u64)pid_ns);
req->r_args.filelock_change.start = cpu_to_le64(start);
req->r_args.filelock_change.length = cpu_to_le64(length);
req->r_args.filelock_change.wait = wait;
err = ceph_mdsc_do_request(mdsc, inode, req);
ceph_mdsc_put_request(req);
dout("ceph_lock_message: rule: %d, op: %d, pid: %llu, start: %llu, "
"length: %llu, wait: %d, type`: %d err code %d", (int)lock_type,
(int)operation, pid, start, length, wait, cmd, err);
return err;
}
/**
* Attempt to set an fcntl lock.
* For now, this just goes away to the server. Later it may be more awesome.
*/
int ceph_lock(struct file *file, int cmd, struct file_lock *fl)
{
u64 length;
u8 lock_cmd;
int err;
u8 wait = 0;
u16 op = CEPH_MDS_OP_SETFILELOCK;
fl->fl_nspid = get_pid(task_tgid(current));
dout("ceph_lock, fl_pid:%d", fl->fl_pid);
/* set wait bit as appropriate, then make command as Ceph expects it*/
if (F_SETLKW == cmd)
wait = 1;
if (F_GETLK == cmd)
op = CEPH_MDS_OP_GETFILELOCK;
if (F_RDLCK == fl->fl_type)
lock_cmd = CEPH_LOCK_SHARED;
else if (F_WRLCK == fl->fl_type)
lock_cmd = CEPH_LOCK_EXCL;
else
lock_cmd = CEPH_LOCK_UNLOCK;
if (LLONG_MAX == fl->fl_end)
length = 0;
else
length = fl->fl_end - fl->fl_start + 1;
err = ceph_lock_message(CEPH_LOCK_FCNTL, op, file,
(u64)fl->fl_pid, (u64)fl->fl_nspid,
lock_cmd, fl->fl_start,
length, wait);
if (!err) {
dout("mds locked, locking locally");
err = posix_lock_file(file, fl, NULL);
if (err && (CEPH_MDS_OP_SETFILELOCK == op)) {
/* undo! This should only happen if the kernel detects
* local deadlock. */
ceph_lock_message(CEPH_LOCK_FCNTL, op, file,
(u64)fl->fl_pid, (u64)fl->fl_nspid,
CEPH_LOCK_UNLOCK, fl->fl_start,
length, 0);
dout("got %d on posix_lock_file, undid lock", err);
}
} else {
dout("mds returned error code %d", err);
}
return err;
}
int ceph_flock(struct file *file, int cmd, struct file_lock *fl)
{
u64 length;
u8 lock_cmd;
int err;
u8 wait = 1;
fl->fl_nspid = get_pid(task_tgid(current));
dout("ceph_flock, fl_pid:%d", fl->fl_pid);
/* set wait bit, then clear it out of cmd*/
if (cmd & LOCK_NB)
wait = 0;
cmd = cmd & (LOCK_SH | LOCK_EX | LOCK_UN);
/* set command sequence that Ceph wants to see:
shared lock, exclusive lock, or unlock */
if (LOCK_SH == cmd)
lock_cmd = CEPH_LOCK_SHARED;
else if (LOCK_EX == cmd)
lock_cmd = CEPH_LOCK_EXCL;
else
lock_cmd = CEPH_LOCK_UNLOCK;
/* mds requires start and length rather than start and end */
if (LLONG_MAX == fl->fl_end)
length = 0;
else
length = fl->fl_end - fl->fl_start + 1;
err = ceph_lock_message(CEPH_LOCK_FLOCK, CEPH_MDS_OP_SETFILELOCK,
file, (u64)fl->fl_pid, (u64)fl->fl_nspid,
lock_cmd, fl->fl_start,
length, wait);
if (!err) {
err = flock_lock_file_wait(file, fl);
if (err) {
ceph_lock_message(CEPH_LOCK_FLOCK,
CEPH_MDS_OP_SETFILELOCK,
file, (u64)fl->fl_pid,
(u64)fl->fl_nspid,
CEPH_LOCK_UNLOCK, fl->fl_start,
length, 0);
dout("got %d on flock_lock_file_wait, undid lock", err);
}
} else {
dout("mds error code %d", err);
}
return err;
}
/**
* Must be called with BKL already held. Fills in the passed
* counter variables, so you can prepare pagelist metadata before calling
* ceph_encode_locks.
*/
void ceph_count_locks(struct inode *inode, int *fcntl_count, int *flock_count)
{
struct file_lock *lock;
*fcntl_count = 0;
*flock_count = 0;
for (lock = inode->i_flock; lock != NULL; lock = lock->fl_next) {
if (lock->fl_flags & FL_POSIX)
++(*fcntl_count);
else if (lock->fl_flags & FL_FLOCK)
++(*flock_count);
}
dout("counted %d flock locks and %d fcntl locks",
*flock_count, *fcntl_count);
}
/**
* Encode the flock and fcntl locks for the given inode into the pagelist.
* Format is: #fcntl locks, sequential fcntl locks, #flock locks,
* sequential flock locks.
* Must be called with BLK already held, and the lock numbers should have
* been gathered under the same lock holding window.
*/
int ceph_encode_locks(struct inode *inode, struct ceph_pagelist *pagelist,
int num_fcntl_locks, int num_flock_locks)
{
struct file_lock *lock;
struct ceph_filelock cephlock;
int err = 0;
dout("encoding %d flock and %d fcntl locks", num_flock_locks,
num_fcntl_locks);
err = ceph_pagelist_append(pagelist, &num_fcntl_locks, sizeof(u32));
if (err)
goto fail;
for (lock = inode->i_flock; lock != NULL; lock = lock->fl_next) {
if (lock->fl_flags & FL_POSIX) {
err = lock_to_ceph_filelock(lock, &cephlock);
if (err)
goto fail;
err = ceph_pagelist_append(pagelist, &cephlock,
sizeof(struct ceph_filelock));
}
if (err)
goto fail;
}
err = ceph_pagelist_append(pagelist, &num_flock_locks, sizeof(u32));
if (err)
goto fail;
for (lock = inode->i_flock; lock != NULL; lock = lock->fl_next) {
if (lock->fl_flags & FL_FLOCK) {
err = lock_to_ceph_filelock(lock, &cephlock);
if (err)
goto fail;
err = ceph_pagelist_append(pagelist, &cephlock,
sizeof(struct ceph_filelock));
}
if (err)
goto fail;
}
fail:
return err;
}
/*
* Given a pointer to a lock, convert it to a ceph filelock
*/
int lock_to_ceph_filelock(struct file_lock *lock,
struct ceph_filelock *cephlock)
{
int err = 0;
cephlock->start = cpu_to_le64(lock->fl_start);
cephlock->length = cpu_to_le64(lock->fl_end - lock->fl_start + 1);
cephlock->client = cpu_to_le64(0);
cephlock->pid = cpu_to_le64(lock->fl_pid);
cephlock->pid_namespace = cpu_to_le64((u64)lock->fl_nspid);
switch (lock->fl_type) {
case F_RDLCK:
cephlock->type = CEPH_LOCK_SHARED;
break;
case F_WRLCK:
cephlock->type = CEPH_LOCK_EXCL;
break;
case F_UNLCK:
cephlock->type = CEPH_LOCK_UNLOCK;
break;
default:
dout("Have unknown lock type %d", lock->fl_type);
err = -EINVAL;
}
return err;
}
This diff is collapsed.
...@@ -151,6 +151,7 @@ typedef void (*ceph_mds_request_callback_t) (struct ceph_mds_client *mdsc, ...@@ -151,6 +151,7 @@ typedef void (*ceph_mds_request_callback_t) (struct ceph_mds_client *mdsc,
struct ceph_mds_request { struct ceph_mds_request {
u64 r_tid; /* transaction id */ u64 r_tid; /* transaction id */
struct rb_node r_node; struct rb_node r_node;
struct ceph_mds_client *r_mdsc;
int r_op; /* mds op code */ int r_op; /* mds op code */
int r_mds; int r_mds;
...@@ -207,8 +208,8 @@ struct ceph_mds_request { ...@@ -207,8 +208,8 @@ struct ceph_mds_request {
int r_attempts; /* resend attempts */ int r_attempts; /* resend attempts */
int r_num_fwd; /* number of forward attempts */ int r_num_fwd; /* number of forward attempts */
int r_num_stale;
int r_resend_mds; /* mds to resend to next, if any*/ int r_resend_mds; /* mds to resend to next, if any*/
u32 r_sent_on_mseq; /* cap mseq request was sent at*/
struct kref r_kref; struct kref r_kref;
struct list_head r_wait; struct list_head r_wait;
...@@ -267,6 +268,27 @@ struct ceph_mds_client { ...@@ -267,6 +268,27 @@ struct ceph_mds_client {
spinlock_t cap_dirty_lock; /* protects above items */ spinlock_t cap_dirty_lock; /* protects above items */
wait_queue_head_t cap_flushing_wq; wait_queue_head_t cap_flushing_wq;
/*
* Cap reservations
*
* Maintain a global pool of preallocated struct ceph_caps, referenced
* by struct ceph_caps_reservations. This ensures that we preallocate
* memory needed to successfully process an MDS response. (If an MDS
* sends us cap information and we fail to process it, we will have
* problems due to the client and MDS being out of sync.)
*
* Reservations are 'owned' by a ceph_cap_reservation context.
*/
spinlock_t caps_list_lock;
struct list_head caps_list; /* unused (reserved or
unreserved) */
int caps_total_count; /* total caps allocated */
int caps_use_count; /* in use */
int caps_reserve_count; /* unused, reserved */
int caps_avail_count; /* unused, unreserved */
int caps_min_count; /* keep at least this many
(unreserved) */
#ifdef CONFIG_DEBUG_FS #ifdef CONFIG_DEBUG_FS
struct dentry *debugfs_file; struct dentry *debugfs_file;
#endif #endif
...@@ -324,8 +346,7 @@ static inline void ceph_mdsc_put_request(struct ceph_mds_request *req) ...@@ -324,8 +346,7 @@ static inline void ceph_mdsc_put_request(struct ceph_mds_request *req)
} }
extern int ceph_add_cap_releases(struct ceph_mds_client *mdsc, extern int ceph_add_cap_releases(struct ceph_mds_client *mdsc,
struct ceph_mds_session *session, struct ceph_mds_session *session);
int extra);
extern void ceph_send_cap_releases(struct ceph_mds_client *mdsc, extern void ceph_send_cap_releases(struct ceph_mds_client *mdsc,
struct ceph_mds_session *session); struct ceph_mds_session *session);
...@@ -343,4 +364,7 @@ extern void ceph_mdsc_lease_send_msg(struct ceph_mds_session *session, ...@@ -343,4 +364,7 @@ extern void ceph_mdsc_lease_send_msg(struct ceph_mds_session *session,
extern void ceph_mdsc_handle_map(struct ceph_mds_client *mdsc, extern void ceph_mdsc_handle_map(struct ceph_mds_client *mdsc,
struct ceph_msg *msg); struct ceph_msg *msg);
extern void ceph_mdsc_open_export_target_sessions(struct ceph_mds_client *mdsc,
struct ceph_mds_session *session);
#endif #endif
...@@ -85,6 +85,7 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end) ...@@ -85,6 +85,7 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end)
struct ceph_entity_addr addr; struct ceph_entity_addr addr;
u32 num_export_targets; u32 num_export_targets;
void *pexport_targets = NULL; void *pexport_targets = NULL;
struct ceph_timespec laggy_since;
ceph_decode_need(p, end, sizeof(u64)*2 + 1 + sizeof(u32), bad); ceph_decode_need(p, end, sizeof(u64)*2 + 1 + sizeof(u32), bad);
global_id = ceph_decode_64(p); global_id = ceph_decode_64(p);
...@@ -103,7 +104,7 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end) ...@@ -103,7 +104,7 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end)
state_seq = ceph_decode_64(p); state_seq = ceph_decode_64(p);
ceph_decode_copy(p, &addr, sizeof(addr)); ceph_decode_copy(p, &addr, sizeof(addr));
ceph_decode_addr(&addr); ceph_decode_addr(&addr);
*p += sizeof(struct ceph_timespec); ceph_decode_copy(p, &laggy_since, sizeof(laggy_since));
*p += sizeof(u32); *p += sizeof(u32);
ceph_decode_32_safe(p, end, namelen, bad); ceph_decode_32_safe(p, end, namelen, bad);
*p += namelen; *p += namelen;
...@@ -122,6 +123,9 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end) ...@@ -122,6 +123,9 @@ struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end)
m->m_info[mds].global_id = global_id; m->m_info[mds].global_id = global_id;
m->m_info[mds].state = state; m->m_info[mds].state = state;
m->m_info[mds].addr = addr; m->m_info[mds].addr = addr;
m->m_info[mds].laggy =
(laggy_since.tv_sec != 0 ||
laggy_since.tv_nsec != 0);
m->m_info[mds].num_export_targets = num_export_targets; m->m_info[mds].num_export_targets = num_export_targets;
if (num_export_targets) { if (num_export_targets) {
m->m_info[mds].export_targets = m->m_info[mds].export_targets =
......
...@@ -13,6 +13,7 @@ struct ceph_mds_info { ...@@ -13,6 +13,7 @@ struct ceph_mds_info {
struct ceph_entity_addr addr; struct ceph_entity_addr addr;
s32 state; s32 state;
int num_export_targets; int num_export_targets;
bool laggy;
u32 *export_targets; u32 *export_targets;
}; };
...@@ -47,6 +48,13 @@ static inline int ceph_mdsmap_get_state(struct ceph_mdsmap *m, int w) ...@@ -47,6 +48,13 @@ static inline int ceph_mdsmap_get_state(struct ceph_mdsmap *m, int w)
return m->m_info[w].state; return m->m_info[w].state;
} }
static inline bool ceph_mdsmap_is_laggy(struct ceph_mdsmap *m, int w)
{
if (w >= 0 && w < m->m_max_mds)
return m->m_info[w].laggy;
return false;
}
extern int ceph_mdsmap_get_random_mds(struct ceph_mdsmap *m); extern int ceph_mdsmap_get_random_mds(struct ceph_mdsmap *m);
extern struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end); extern struct ceph_mdsmap *ceph_mdsmap_decode(void **p, void *end);
extern void ceph_mdsmap_destroy(struct ceph_mdsmap *m); extern void ceph_mdsmap_destroy(struct ceph_mdsmap *m);
......
...@@ -108,7 +108,7 @@ void ceph_msgr_exit(void) ...@@ -108,7 +108,7 @@ void ceph_msgr_exit(void)
destroy_workqueue(ceph_msgr_wq); destroy_workqueue(ceph_msgr_wq);
} }
void ceph_msgr_flush() void ceph_msgr_flush(void)
{ {
flush_workqueue(ceph_msgr_wq); flush_workqueue(ceph_msgr_wq);
} }
...@@ -647,7 +647,7 @@ static void prepare_write_connect(struct ceph_messenger *msgr, ...@@ -647,7 +647,7 @@ static void prepare_write_connect(struct ceph_messenger *msgr,
dout("prepare_write_connect %p cseq=%d gseq=%d proto=%d\n", con, dout("prepare_write_connect %p cseq=%d gseq=%d proto=%d\n", con,
con->connect_seq, global_seq, proto); con->connect_seq, global_seq, proto);
con->out_connect.features = cpu_to_le64(CEPH_FEATURE_SUPPORTED_CLIENT); con->out_connect.features = cpu_to_le64(CEPH_FEATURE_SUPPORTED);
con->out_connect.host_type = cpu_to_le32(CEPH_ENTITY_TYPE_CLIENT); con->out_connect.host_type = cpu_to_le32(CEPH_ENTITY_TYPE_CLIENT);
con->out_connect.connect_seq = cpu_to_le32(con->connect_seq); con->out_connect.connect_seq = cpu_to_le32(con->connect_seq);
con->out_connect.global_seq = cpu_to_le32(global_seq); con->out_connect.global_seq = cpu_to_le32(global_seq);
...@@ -1081,11 +1081,11 @@ static int process_banner(struct ceph_connection *con) ...@@ -1081,11 +1081,11 @@ static int process_banner(struct ceph_connection *con)
sizeof(con->peer_addr)) != 0 && sizeof(con->peer_addr)) != 0 &&
!(addr_is_blank(&con->actual_peer_addr.in_addr) && !(addr_is_blank(&con->actual_peer_addr.in_addr) &&
con->actual_peer_addr.nonce == con->peer_addr.nonce)) { con->actual_peer_addr.nonce == con->peer_addr.nonce)) {
pr_warning("wrong peer, want %s/%lld, got %s/%lld\n", pr_warning("wrong peer, want %s/%d, got %s/%d\n",
pr_addr(&con->peer_addr.in_addr), pr_addr(&con->peer_addr.in_addr),
le64_to_cpu(con->peer_addr.nonce), (int)le32_to_cpu(con->peer_addr.nonce),
pr_addr(&con->actual_peer_addr.in_addr), pr_addr(&con->actual_peer_addr.in_addr),
le64_to_cpu(con->actual_peer_addr.nonce)); (int)le32_to_cpu(con->actual_peer_addr.nonce));
con->error_msg = "wrong peer at address"; con->error_msg = "wrong peer at address";
return -1; return -1;
} }
...@@ -1123,8 +1123,8 @@ static void fail_protocol(struct ceph_connection *con) ...@@ -1123,8 +1123,8 @@ static void fail_protocol(struct ceph_connection *con)
static int process_connect(struct ceph_connection *con) static int process_connect(struct ceph_connection *con)
{ {
u64 sup_feat = CEPH_FEATURE_SUPPORTED_CLIENT; u64 sup_feat = CEPH_FEATURE_SUPPORTED;
u64 req_feat = CEPH_FEATURE_REQUIRED_CLIENT; u64 req_feat = CEPH_FEATURE_REQUIRED;
u64 server_feat = le64_to_cpu(con->in_reply.features); u64 server_feat = le64_to_cpu(con->in_reply.features);
dout("process_connect on %p tag %d\n", con, (int)con->in_tag); dout("process_connect on %p tag %d\n", con, (int)con->in_tag);
...@@ -1302,8 +1302,8 @@ static void process_ack(struct ceph_connection *con) ...@@ -1302,8 +1302,8 @@ static void process_ack(struct ceph_connection *con)
static int read_partial_message_section(struct ceph_connection *con, static int read_partial_message_section(struct ceph_connection *con,
struct kvec *section, unsigned int sec_len, struct kvec *section,
u32 *crc) unsigned int sec_len, u32 *crc)
{ {
int left; int left;
int ret; int ret;
...@@ -1434,7 +1434,8 @@ static int read_partial_message(struct ceph_connection *con) ...@@ -1434,7 +1434,8 @@ static int read_partial_message(struct ceph_connection *con)
/* middle */ /* middle */
if (m->middle) { if (m->middle) {
ret = read_partial_message_section(con, &m->middle->vec, middle_len, ret = read_partial_message_section(con, &m->middle->vec,
middle_len,
&con->in_middle_crc); &con->in_middle_crc);
if (ret <= 0) if (ret <= 0)
return ret; return ret;
...@@ -1920,7 +1921,7 @@ static void ceph_fault(struct ceph_connection *con) ...@@ -1920,7 +1921,7 @@ static void ceph_fault(struct ceph_connection *con)
/* /*
* in case we faulted due to authentication, invalidate our * in case we faulted due to authentication, invalidate our
* current tickets so that we can get new ones. * current tickets so that we can get new ones.
*/ */
if (con->auth_retry && con->ops->invalidate_authorizer) { if (con->auth_retry && con->ops->invalidate_authorizer) {
dout("calling invalidate_authorizer()\n"); dout("calling invalidate_authorizer()\n");
con->ops->invalidate_authorizer(con); con->ops->invalidate_authorizer(con);
......
...@@ -349,7 +349,7 @@ static void ceph_monc_handle_map(struct ceph_mon_client *monc, ...@@ -349,7 +349,7 @@ static void ceph_monc_handle_map(struct ceph_mon_client *monc,
} }
/* /*
* statfs * generic requests (e.g., statfs, poolop)
*/ */
static struct ceph_mon_generic_request *__lookup_generic_req( static struct ceph_mon_generic_request *__lookup_generic_req(
struct ceph_mon_client *monc, u64 tid) struct ceph_mon_client *monc, u64 tid)
...@@ -442,6 +442,35 @@ static struct ceph_msg *get_generic_reply(struct ceph_connection *con, ...@@ -442,6 +442,35 @@ static struct ceph_msg *get_generic_reply(struct ceph_connection *con,
return m; return m;
} }
static int do_generic_request(struct ceph_mon_client *monc,
struct ceph_mon_generic_request *req)
{
int err;
/* register request */
mutex_lock(&monc->mutex);
req->tid = ++monc->last_tid;
req->request->hdr.tid = cpu_to_le64(req->tid);
__insert_generic_request(monc, req);
monc->num_generic_requests++;
ceph_con_send(monc->con, ceph_msg_get(req->request));
mutex_unlock(&monc->mutex);
err = wait_for_completion_interruptible(&req->completion);
mutex_lock(&monc->mutex);
rb_erase(&req->node, &monc->generic_request_tree);
monc->num_generic_requests--;
mutex_unlock(&monc->mutex);
if (!err)
err = req->result;
return err;
}
/*
* statfs
*/
static void handle_statfs_reply(struct ceph_mon_client *monc, static void handle_statfs_reply(struct ceph_mon_client *monc,
struct ceph_msg *msg) struct ceph_msg *msg)
{ {
...@@ -468,7 +497,7 @@ static void handle_statfs_reply(struct ceph_mon_client *monc, ...@@ -468,7 +497,7 @@ static void handle_statfs_reply(struct ceph_mon_client *monc,
return; return;
bad: bad:
pr_err("corrupt generic reply, no tid\n"); pr_err("corrupt generic reply, tid %llu\n", tid);
ceph_msg_dump(msg); ceph_msg_dump(msg);
} }
...@@ -487,6 +516,7 @@ int ceph_monc_do_statfs(struct ceph_mon_client *monc, struct ceph_statfs *buf) ...@@ -487,6 +516,7 @@ int ceph_monc_do_statfs(struct ceph_mon_client *monc, struct ceph_statfs *buf)
kref_init(&req->kref); kref_init(&req->kref);
req->buf = buf; req->buf = buf;
req->buf_len = sizeof(*buf);
init_completion(&req->completion); init_completion(&req->completion);
err = -ENOMEM; err = -ENOMEM;
...@@ -504,33 +534,134 @@ int ceph_monc_do_statfs(struct ceph_mon_client *monc, struct ceph_statfs *buf) ...@@ -504,33 +534,134 @@ int ceph_monc_do_statfs(struct ceph_mon_client *monc, struct ceph_statfs *buf)
h->monhdr.session_mon_tid = 0; h->monhdr.session_mon_tid = 0;
h->fsid = monc->monmap->fsid; h->fsid = monc->monmap->fsid;
/* register request */ err = do_generic_request(monc, req);
mutex_lock(&monc->mutex);
req->tid = ++monc->last_tid;
req->request->hdr.tid = cpu_to_le64(req->tid);
__insert_generic_request(monc, req);
monc->num_generic_requests++;
mutex_unlock(&monc->mutex);
/* send request and wait */ out:
ceph_con_send(monc->con, ceph_msg_get(req->request)); kref_put(&req->kref, release_generic_request);
err = wait_for_completion_interruptible(&req->completion); return err;
}
/*
* pool ops
*/
static int get_poolop_reply_buf(const char *src, size_t src_len,
char *dst, size_t dst_len)
{
u32 buf_len;
if (src_len != sizeof(u32) + dst_len)
return -EINVAL;
buf_len = le32_to_cpu(*(u32 *)src);
if (buf_len != dst_len)
return -EINVAL;
memcpy(dst, src + sizeof(u32), dst_len);
return 0;
}
static void handle_poolop_reply(struct ceph_mon_client *monc,
struct ceph_msg *msg)
{
struct ceph_mon_generic_request *req;
struct ceph_mon_poolop_reply *reply = msg->front.iov_base;
u64 tid = le64_to_cpu(msg->hdr.tid);
if (msg->front.iov_len < sizeof(*reply))
goto bad;
dout("handle_poolop_reply %p tid %llu\n", msg, tid);
mutex_lock(&monc->mutex); mutex_lock(&monc->mutex);
rb_erase(&req->node, &monc->generic_request_tree); req = __lookup_generic_req(monc, tid);
monc->num_generic_requests--; if (req) {
if (req->buf_len &&
get_poolop_reply_buf(msg->front.iov_base + sizeof(*reply),
msg->front.iov_len - sizeof(*reply),
req->buf, req->buf_len) < 0) {
mutex_unlock(&monc->mutex);
goto bad;
}
req->result = le32_to_cpu(reply->reply_code);
get_generic_request(req);
}
mutex_unlock(&monc->mutex); mutex_unlock(&monc->mutex);
if (req) {
complete(&req->completion);
put_generic_request(req);
}
return;
if (!err) bad:
err = req->result; pr_err("corrupt generic reply, tid %llu\n", tid);
ceph_msg_dump(msg);
}
/*
* Do a synchronous pool op.
*/
int ceph_monc_do_poolop(struct ceph_mon_client *monc, u32 op,
u32 pool, u64 snapid,
char *buf, int len)
{
struct ceph_mon_generic_request *req;
struct ceph_mon_poolop *h;
int err;
req = kzalloc(sizeof(*req), GFP_NOFS);
if (!req)
return -ENOMEM;
kref_init(&req->kref);
req->buf = buf;
req->buf_len = len;
init_completion(&req->completion);
err = -ENOMEM;
req->request = ceph_msg_new(CEPH_MSG_POOLOP, sizeof(*h), GFP_NOFS);
if (!req->request)
goto out;
req->reply = ceph_msg_new(CEPH_MSG_POOLOP_REPLY, 1024, GFP_NOFS);
if (!req->reply)
goto out;
/* fill out request */
req->request->hdr.version = cpu_to_le16(2);
h = req->request->front.iov_base;
h->monhdr.have_version = 0;
h->monhdr.session_mon = cpu_to_le16(-1);
h->monhdr.session_mon_tid = 0;
h->fsid = monc->monmap->fsid;
h->pool = cpu_to_le32(pool);
h->op = cpu_to_le32(op);
h->auid = 0;
h->snapid = cpu_to_le64(snapid);
h->name_len = 0;
err = do_generic_request(monc, req);
out: out:
kref_put(&req->kref, release_generic_request); kref_put(&req->kref, release_generic_request);
return err; return err;
} }
int ceph_monc_create_snapid(struct ceph_mon_client *monc,
u32 pool, u64 *snapid)
{
return ceph_monc_do_poolop(monc, POOL_OP_CREATE_UNMANAGED_SNAP,
pool, 0, (char *)snapid, sizeof(*snapid));
}
int ceph_monc_delete_snapid(struct ceph_mon_client *monc,
u32 pool, u64 snapid)
{
return ceph_monc_do_poolop(monc, POOL_OP_CREATE_UNMANAGED_SNAP,
pool, snapid, 0, 0);
}
/* /*
* Resend pending statfs requests. * Resend pending generic requests.
*/ */
static void __resend_generic_request(struct ceph_mon_client *monc) static void __resend_generic_request(struct ceph_mon_client *monc)
{ {
...@@ -783,6 +914,10 @@ static void dispatch(struct ceph_connection *con, struct ceph_msg *msg) ...@@ -783,6 +914,10 @@ static void dispatch(struct ceph_connection *con, struct ceph_msg *msg)
handle_statfs_reply(monc, msg); handle_statfs_reply(monc, msg);
break; break;
case CEPH_MSG_POOLOP_REPLY:
handle_poolop_reply(monc, msg);
break;
case CEPH_MSG_MON_MAP: case CEPH_MSG_MON_MAP:
ceph_monc_handle_map(monc, msg); ceph_monc_handle_map(monc, msg);
break; break;
...@@ -820,6 +955,7 @@ static struct ceph_msg *mon_alloc_msg(struct ceph_connection *con, ...@@ -820,6 +955,7 @@ static struct ceph_msg *mon_alloc_msg(struct ceph_connection *con,
case CEPH_MSG_MON_SUBSCRIBE_ACK: case CEPH_MSG_MON_SUBSCRIBE_ACK:
m = ceph_msg_get(monc->m_subscribe_ack); m = ceph_msg_get(monc->m_subscribe_ack);
break; break;
case CEPH_MSG_POOLOP_REPLY:
case CEPH_MSG_STATFS_REPLY: case CEPH_MSG_STATFS_REPLY:
return get_generic_reply(con, hdr, skip); return get_generic_reply(con, hdr, skip);
case CEPH_MSG_AUTH_REPLY: case CEPH_MSG_AUTH_REPLY:
......
...@@ -50,6 +50,7 @@ struct ceph_mon_generic_request { ...@@ -50,6 +50,7 @@ struct ceph_mon_generic_request {
struct rb_node node; struct rb_node node;
int result; int result;
void *buf; void *buf;
int buf_len;
struct completion completion; struct completion completion;
struct ceph_msg *request; /* original request */ struct ceph_msg *request; /* original request */
struct ceph_msg *reply; /* and reply */ struct ceph_msg *reply; /* and reply */
...@@ -111,6 +112,10 @@ extern int ceph_monc_open_session(struct ceph_mon_client *monc); ...@@ -111,6 +112,10 @@ extern int ceph_monc_open_session(struct ceph_mon_client *monc);
extern int ceph_monc_validate_auth(struct ceph_mon_client *monc); extern int ceph_monc_validate_auth(struct ceph_mon_client *monc);
extern int ceph_monc_create_snapid(struct ceph_mon_client *monc,
u32 pool, u64 *snapid);
extern int ceph_monc_delete_snapid(struct ceph_mon_client *monc,
u32 pool, u64 snapid);
#endif #endif
#ifndef __MSGR_H #ifndef CEPH_MSGR_H
#define __MSGR_H #define CEPH_MSGR_H
/* /*
* Data types for message passing layer used by Ceph. * Data types for message passing layer used by Ceph.
......
...@@ -1276,8 +1276,6 @@ int ceph_osdc_readpages(struct ceph_osd_client *osdc, ...@@ -1276,8 +1276,6 @@ int ceph_osdc_readpages(struct ceph_osd_client *osdc,
/* it may be a short read due to an object boundary */ /* it may be a short read due to an object boundary */
req->r_pages = pages; req->r_pages = pages;
num_pages = calc_pages_for(off, *plen);
req->r_num_pages = num_pages;
dout("readpages final extent is %llu~%llu (%d pages)\n", dout("readpages final extent is %llu~%llu (%d pages)\n",
off, *plen, req->r_num_pages); off, *plen, req->r_num_pages);
...@@ -1319,7 +1317,6 @@ int ceph_osdc_writepages(struct ceph_osd_client *osdc, struct ceph_vino vino, ...@@ -1319,7 +1317,6 @@ int ceph_osdc_writepages(struct ceph_osd_client *osdc, struct ceph_vino vino,
/* it may be a short write due to an object boundary */ /* it may be a short write due to an object boundary */
req->r_pages = pages; req->r_pages = pages;
req->r_num_pages = calc_pages_for(off, len);
dout("writepages %llu~%llu (%d pages)\n", off, len, dout("writepages %llu~%llu (%d pages)\n", off, len,
req->r_num_pages); req->r_num_pages);
...@@ -1476,8 +1473,8 @@ static void put_osd_con(struct ceph_connection *con) ...@@ -1476,8 +1473,8 @@ static void put_osd_con(struct ceph_connection *con)
* authentication * authentication
*/ */
static int get_authorizer(struct ceph_connection *con, static int get_authorizer(struct ceph_connection *con,
void **buf, int *len, int *proto, void **buf, int *len, int *proto,
void **reply_buf, int *reply_len, int force_new) void **reply_buf, int *reply_len, int force_new)
{ {
struct ceph_osd *o = con->private; struct ceph_osd *o = con->private;
struct ceph_osd_client *osdc = o->o_osdc; struct ceph_osd_client *osdc = o->o_osdc;
...@@ -1497,7 +1494,7 @@ static int get_authorizer(struct ceph_connection *con, ...@@ -1497,7 +1494,7 @@ static int get_authorizer(struct ceph_connection *con,
&o->o_authorizer_reply_buf, &o->o_authorizer_reply_buf,
&o->o_authorizer_reply_buf_len); &o->o_authorizer_reply_buf_len);
if (ret) if (ret)
return ret; return ret;
} }
*proto = ac->protocol; *proto = ac->protocol;
......
...@@ -424,12 +424,30 @@ static void __remove_pg_pool(struct rb_root *root, struct ceph_pg_pool_info *pi) ...@@ -424,12 +424,30 @@ static void __remove_pg_pool(struct rb_root *root, struct ceph_pg_pool_info *pi)
kfree(pi); kfree(pi);
} }
void __decode_pool(void **p, struct ceph_pg_pool_info *pi) static int __decode_pool(void **p, void *end, struct ceph_pg_pool_info *pi)
{ {
unsigned n, m;
ceph_decode_copy(p, &pi->v, sizeof(pi->v)); ceph_decode_copy(p, &pi->v, sizeof(pi->v));
calc_pg_masks(pi); calc_pg_masks(pi);
*p += le32_to_cpu(pi->v.num_snaps) * sizeof(u64);
/* num_snaps * snap_info_t */
n = le32_to_cpu(pi->v.num_snaps);
while (n--) {
ceph_decode_need(p, end, sizeof(u64) + 1 + sizeof(u64) +
sizeof(struct ceph_timespec), bad);
*p += sizeof(u64) + /* key */
1 + sizeof(u64) + /* u8, snapid */
sizeof(struct ceph_timespec);
m = ceph_decode_32(p); /* snap name */
*p += m;
}
*p += le32_to_cpu(pi->v.num_removed_snap_intervals) * sizeof(u64) * 2; *p += le32_to_cpu(pi->v.num_removed_snap_intervals) * sizeof(u64) * 2;
return 0;
bad:
return -EINVAL;
} }
static int __decode_pool_names(void **p, void *end, struct ceph_osdmap *map) static int __decode_pool_names(void **p, void *end, struct ceph_osdmap *map)
...@@ -571,7 +589,9 @@ struct ceph_osdmap *osdmap_decode(void **p, void *end) ...@@ -571,7 +589,9 @@ struct ceph_osdmap *osdmap_decode(void **p, void *end)
kfree(pi); kfree(pi);
goto bad; goto bad;
} }
__decode_pool(p, pi); err = __decode_pool(p, end, pi);
if (err < 0)
goto bad;
__insert_pg_pool(&map->pg_pools, pi); __insert_pg_pool(&map->pg_pools, pi);
} }
...@@ -760,7 +780,9 @@ struct ceph_osdmap *osdmap_apply_incremental(void **p, void *end, ...@@ -760,7 +780,9 @@ struct ceph_osdmap *osdmap_apply_incremental(void **p, void *end,
pi->id = pool; pi->id = pool;
__insert_pg_pool(&map->pg_pools, pi); __insert_pg_pool(&map->pg_pools, pi);
} }
__decode_pool(p, pi); err = __decode_pool(p, end, pi);
if (err < 0)
goto bad;
} }
if (version >= 5 && __decode_pool_names(p, end, map) < 0) if (version >= 5 && __decode_pool_names(p, end, map) < 0)
goto bad; goto bad;
...@@ -833,7 +855,7 @@ struct ceph_osdmap *osdmap_apply_incremental(void **p, void *end, ...@@ -833,7 +855,7 @@ struct ceph_osdmap *osdmap_apply_incremental(void **p, void *end,
node)->pgid, pgid) <= 0) { node)->pgid, pgid) <= 0) {
struct ceph_pg_mapping *cur = struct ceph_pg_mapping *cur =
rb_entry(rbp, struct ceph_pg_mapping, node); rb_entry(rbp, struct ceph_pg_mapping, node);
rbp = rb_next(rbp); rbp = rb_next(rbp);
dout(" removed pg_temp %llx\n", *(u64 *)&cur->pgid); dout(" removed pg_temp %llx\n", *(u64 *)&cur->pgid);
rb_erase(&cur->node, &map->pg_temp); rb_erase(&cur->node, &map->pg_temp);
...@@ -1026,8 +1048,9 @@ static int *calc_pg_raw(struct ceph_osdmap *osdmap, struct ceph_pg pgid, ...@@ -1026,8 +1048,9 @@ static int *calc_pg_raw(struct ceph_osdmap *osdmap, struct ceph_pg pgid,
ruleno = crush_find_rule(osdmap->crush, pool->v.crush_ruleset, ruleno = crush_find_rule(osdmap->crush, pool->v.crush_ruleset,
pool->v.type, pool->v.size); pool->v.type, pool->v.size);
if (ruleno < 0) { if (ruleno < 0) {
pr_err("no crush rule pool %d type %d size %d\n", pr_err("no crush rule pool %d ruleset %d type %d size %d\n",
poolid, pool->v.type, pool->v.size); poolid, pool->v.crush_ruleset, pool->v.type,
pool->v.size);
return NULL; return NULL;
} }
......
#ifndef __RADOS_H #ifndef CEPH_RADOS_H
#define __RADOS_H #define CEPH_RADOS_H
/* /*
* Data types for the Ceph distributed object storage layer RADOS * Data types for the Ceph distributed object storage layer RADOS
...@@ -203,6 +203,7 @@ enum { ...@@ -203,6 +203,7 @@ enum {
CEPH_OSD_OP_TMAPGET = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 12, CEPH_OSD_OP_TMAPGET = CEPH_OSD_OP_MODE_RD | CEPH_OSD_OP_TYPE_DATA | 12,
CEPH_OSD_OP_CREATE = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 13, CEPH_OSD_OP_CREATE = CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 13,
CEPH_OSD_OP_ROLLBACK= CEPH_OSD_OP_MODE_WR | CEPH_OSD_OP_TYPE_DATA | 14,
/** attrs **/ /** attrs **/
/* read */ /* read */
...@@ -272,6 +273,10 @@ static inline int ceph_osd_op_mode_modify(int op) ...@@ -272,6 +273,10 @@ static inline int ceph_osd_op_mode_modify(int op)
return (op & CEPH_OSD_OP_MODE) == CEPH_OSD_OP_MODE_WR; return (op & CEPH_OSD_OP_MODE) == CEPH_OSD_OP_MODE_WR;
} }
/*
* note that the following tmap stuff is also defined in the ceph librados.h
* any modification here needs to be updated there
*/
#define CEPH_OSD_TMAP_HDR 'h' #define CEPH_OSD_TMAP_HDR 'h'
#define CEPH_OSD_TMAP_SET 's' #define CEPH_OSD_TMAP_SET 's'
#define CEPH_OSD_TMAP_RM 'r' #define CEPH_OSD_TMAP_RM 'r'
...@@ -297,6 +302,7 @@ enum { ...@@ -297,6 +302,7 @@ enum {
CEPH_OSD_FLAG_PARALLELEXEC = 512, /* execute op in parallel */ CEPH_OSD_FLAG_PARALLELEXEC = 512, /* execute op in parallel */
CEPH_OSD_FLAG_PGOP = 1024, /* pg op, no object */ CEPH_OSD_FLAG_PGOP = 1024, /* pg op, no object */
CEPH_OSD_FLAG_EXEC = 2048, /* op may exec */ CEPH_OSD_FLAG_EXEC = 2048, /* op may exec */
CEPH_OSD_FLAG_EXEC_PUBLIC = 4096, /* op may exec (public) */
}; };
enum { enum {
...@@ -350,6 +356,9 @@ struct ceph_osd_op { ...@@ -350,6 +356,9 @@ struct ceph_osd_op {
struct { struct {
__le64 cookie, count; __le64 cookie, count;
} __attribute__ ((packed)) pgls; } __attribute__ ((packed)) pgls;
struct {
__le64 snapid;
} __attribute__ ((packed)) snap;
}; };
__le32 payload_len; __le32 payload_len;
} __attribute__ ((packed)); } __attribute__ ((packed));
......
...@@ -2,6 +2,7 @@ ...@@ -2,6 +2,7 @@
#include "ceph_debug.h" #include "ceph_debug.h"
#include <linux/backing-dev.h> #include <linux/backing-dev.h>
#include <linux/ctype.h>
#include <linux/fs.h> #include <linux/fs.h>
#include <linux/inet.h> #include <linux/inet.h>
#include <linux/in6.h> #include <linux/in6.h>
...@@ -101,12 +102,21 @@ static int ceph_statfs(struct dentry *dentry, struct kstatfs *buf) ...@@ -101,12 +102,21 @@ static int ceph_statfs(struct dentry *dentry, struct kstatfs *buf)
} }
static int ceph_syncfs(struct super_block *sb, int wait) static int ceph_sync_fs(struct super_block *sb, int wait)
{ {
dout("sync_fs %d\n", wait); struct ceph_client *client = ceph_sb_to_client(sb);
if (!wait) {
dout("sync_fs (non-blocking)\n");
ceph_flush_dirty_caps(&client->mdsc);
dout("sync_fs (non-blocking) done\n");
return 0;
}
dout("sync_fs (blocking)\n");
ceph_osdc_sync(&ceph_sb_to_client(sb)->osdc); ceph_osdc_sync(&ceph_sb_to_client(sb)->osdc);
ceph_mdsc_sync(&ceph_sb_to_client(sb)->mdsc); ceph_mdsc_sync(&ceph_sb_to_client(sb)->mdsc);
dout("sync_fs %d done\n", wait); dout("sync_fs (blocking) done\n");
return 0; return 0;
} }
...@@ -150,9 +160,7 @@ static int ceph_show_options(struct seq_file *m, struct vfsmount *mnt) ...@@ -150,9 +160,7 @@ static int ceph_show_options(struct seq_file *m, struct vfsmount *mnt)
struct ceph_mount_args *args = client->mount_args; struct ceph_mount_args *args = client->mount_args;
if (args->flags & CEPH_OPT_FSID) if (args->flags & CEPH_OPT_FSID)
seq_printf(m, ",fsidmajor=%llu,fsidminor%llu", seq_printf(m, ",fsid=%pU", &args->fsid);
le64_to_cpu(*(__le64 *)&args->fsid.fsid[0]),
le64_to_cpu(*(__le64 *)&args->fsid.fsid[8]));
if (args->flags & CEPH_OPT_NOSHARE) if (args->flags & CEPH_OPT_NOSHARE)
seq_puts(m, ",noshare"); seq_puts(m, ",noshare");
if (args->flags & CEPH_OPT_DIRSTAT) if (args->flags & CEPH_OPT_DIRSTAT)
...@@ -279,7 +287,7 @@ static const struct super_operations ceph_super_ops = { ...@@ -279,7 +287,7 @@ static const struct super_operations ceph_super_ops = {
.alloc_inode = ceph_alloc_inode, .alloc_inode = ceph_alloc_inode,
.destroy_inode = ceph_destroy_inode, .destroy_inode = ceph_destroy_inode,
.write_inode = ceph_write_inode, .write_inode = ceph_write_inode,
.sync_fs = ceph_syncfs, .sync_fs = ceph_sync_fs,
.put_super = ceph_put_super, .put_super = ceph_put_super,
.show_options = ceph_show_options, .show_options = ceph_show_options,
.statfs = ceph_statfs, .statfs = ceph_statfs,
...@@ -322,9 +330,6 @@ const char *ceph_msg_type_name(int type) ...@@ -322,9 +330,6 @@ const char *ceph_msg_type_name(int type)
* mount options * mount options
*/ */
enum { enum {
Opt_fsidmajor,
Opt_fsidminor,
Opt_monport,
Opt_wsize, Opt_wsize,
Opt_rsize, Opt_rsize,
Opt_osdtimeout, Opt_osdtimeout,
...@@ -339,6 +344,7 @@ enum { ...@@ -339,6 +344,7 @@ enum {
Opt_congestion_kb, Opt_congestion_kb,
Opt_last_int, Opt_last_int,
/* int args above */ /* int args above */
Opt_fsid,
Opt_snapdirname, Opt_snapdirname,
Opt_name, Opt_name,
Opt_secret, Opt_secret,
...@@ -355,9 +361,6 @@ enum { ...@@ -355,9 +361,6 @@ enum {
}; };
static match_table_t arg_tokens = { static match_table_t arg_tokens = {
{Opt_fsidmajor, "fsidmajor=%ld"},
{Opt_fsidminor, "fsidminor=%ld"},
{Opt_monport, "monport=%d"},
{Opt_wsize, "wsize=%d"}, {Opt_wsize, "wsize=%d"},
{Opt_rsize, "rsize=%d"}, {Opt_rsize, "rsize=%d"},
{Opt_osdtimeout, "osdtimeout=%d"}, {Opt_osdtimeout, "osdtimeout=%d"},
...@@ -371,6 +374,7 @@ static match_table_t arg_tokens = { ...@@ -371,6 +374,7 @@ static match_table_t arg_tokens = {
{Opt_readdir_max_bytes, "readdir_max_bytes=%d"}, {Opt_readdir_max_bytes, "readdir_max_bytes=%d"},
{Opt_congestion_kb, "write_congestion_kb=%d"}, {Opt_congestion_kb, "write_congestion_kb=%d"},
/* int args above */ /* int args above */
{Opt_fsid, "fsid=%s"},
{Opt_snapdirname, "snapdirname=%s"}, {Opt_snapdirname, "snapdirname=%s"},
{Opt_name, "name=%s"}, {Opt_name, "name=%s"},
{Opt_secret, "secret=%s"}, {Opt_secret, "secret=%s"},
...@@ -386,6 +390,36 @@ static match_table_t arg_tokens = { ...@@ -386,6 +390,36 @@ static match_table_t arg_tokens = {
{-1, NULL} {-1, NULL}
}; };
static int parse_fsid(const char *str, struct ceph_fsid *fsid)
{
int i = 0;
char tmp[3];
int err = -EINVAL;
int d;
dout("parse_fsid '%s'\n", str);
tmp[2] = 0;
while (*str && i < 16) {
if (ispunct(*str)) {
str++;
continue;
}
if (!isxdigit(str[0]) || !isxdigit(str[1]))
break;
tmp[0] = str[0];
tmp[1] = str[1];
if (sscanf(tmp, "%x", &d) < 1)
break;
fsid->fsid[i] = d & 0xff;
i++;
str += 2;
}
if (i == 16)
err = 0;
dout("parse_fsid ret %d got fsid %pU", err, fsid);
return err;
}
static struct ceph_mount_args *parse_mount_args(int flags, char *options, static struct ceph_mount_args *parse_mount_args(int flags, char *options,
const char *dev_name, const char *dev_name,
...@@ -469,12 +503,6 @@ static struct ceph_mount_args *parse_mount_args(int flags, char *options, ...@@ -469,12 +503,6 @@ static struct ceph_mount_args *parse_mount_args(int flags, char *options,
dout("got token %d\n", token); dout("got token %d\n", token);
} }
switch (token) { switch (token) {
case Opt_fsidmajor:
*(__le64 *)&args->fsid.fsid[0] = cpu_to_le64(intval);
break;
case Opt_fsidminor:
*(__le64 *)&args->fsid.fsid[8] = cpu_to_le64(intval);
break;
case Opt_ip: case Opt_ip:
err = ceph_parse_ips(argstr[0].from, err = ceph_parse_ips(argstr[0].from,
argstr[0].to, argstr[0].to,
...@@ -485,6 +513,11 @@ static struct ceph_mount_args *parse_mount_args(int flags, char *options, ...@@ -485,6 +513,11 @@ static struct ceph_mount_args *parse_mount_args(int flags, char *options,
args->flags |= CEPH_OPT_MYIP; args->flags |= CEPH_OPT_MYIP;
break; break;
case Opt_fsid:
err = parse_fsid(argstr[0].from, &args->fsid);
if (err == 0)
args->flags |= CEPH_OPT_FSID;
break;
case Opt_snapdirname: case Opt_snapdirname:
kfree(args->snapdir_name); kfree(args->snapdir_name);
args->snapdir_name = kstrndup(argstr[0].from, args->snapdir_name = kstrndup(argstr[0].from,
...@@ -515,6 +548,9 @@ static struct ceph_mount_args *parse_mount_args(int flags, char *options, ...@@ -515,6 +548,9 @@ static struct ceph_mount_args *parse_mount_args(int flags, char *options,
case Opt_osdkeepalivetimeout: case Opt_osdkeepalivetimeout:
args->osd_keepalive_timeout = intval; args->osd_keepalive_timeout = intval;
break; break;
case Opt_osd_idle_ttl:
args->osd_idle_ttl = intval;
break;
case Opt_mount_timeout: case Opt_mount_timeout:
args->mount_timeout = intval; args->mount_timeout = intval;
break; break;
...@@ -630,7 +666,6 @@ static struct ceph_client *ceph_create_client(struct ceph_mount_args *args) ...@@ -630,7 +666,6 @@ static struct ceph_client *ceph_create_client(struct ceph_mount_args *args)
/* caps */ /* caps */
client->min_caps = args->max_readdir; client->min_caps = args->max_readdir;
ceph_adjust_min_caps(client->min_caps);
/* subsystems */ /* subsystems */
err = ceph_monc_init(&client->monc, client); err = ceph_monc_init(&client->monc, client);
...@@ -680,8 +715,6 @@ static void ceph_destroy_client(struct ceph_client *client) ...@@ -680,8 +715,6 @@ static void ceph_destroy_client(struct ceph_client *client)
ceph_monc_stop(&client->monc); ceph_monc_stop(&client->monc);
ceph_adjust_min_caps(-client->min_caps);
ceph_debugfs_client_cleanup(client); ceph_debugfs_client_cleanup(client);
destroy_workqueue(client->wb_wq); destroy_workqueue(client->wb_wq);
destroy_workqueue(client->pg_inv_wq); destroy_workqueue(client->pg_inv_wq);
...@@ -706,13 +739,13 @@ int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid) ...@@ -706,13 +739,13 @@ int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid)
{ {
if (client->have_fsid) { if (client->have_fsid) {
if (ceph_fsid_compare(&client->fsid, fsid)) { if (ceph_fsid_compare(&client->fsid, fsid)) {
pr_err("bad fsid, had " FSID_FORMAT " got " FSID_FORMAT, pr_err("bad fsid, had %pU got %pU",
PR_FSID(&client->fsid), PR_FSID(fsid)); &client->fsid, fsid);
return -1; return -1;
} }
} else { } else {
pr_info("client%lld fsid " FSID_FORMAT "\n", pr_info("client%lld fsid %pU\n", client->monc.auth->global_id,
client->monc.auth->global_id, PR_FSID(fsid)); fsid);
memcpy(&client->fsid, fsid, sizeof(*fsid)); memcpy(&client->fsid, fsid, sizeof(*fsid));
ceph_debugfs_client_init(client); ceph_debugfs_client_init(client);
client->have_fsid = true; client->have_fsid = true;
...@@ -1043,8 +1076,6 @@ static int __init init_ceph(void) ...@@ -1043,8 +1076,6 @@ static int __init init_ceph(void)
if (ret) if (ret)
goto out_msgr; goto out_msgr;
ceph_caps_init();
ret = register_filesystem(&ceph_fs_type); ret = register_filesystem(&ceph_fs_type);
if (ret) if (ret)
goto out_icache; goto out_icache;
...@@ -1069,7 +1100,6 @@ static void __exit exit_ceph(void) ...@@ -1069,7 +1100,6 @@ static void __exit exit_ceph(void)
{ {
dout("exit_ceph\n"); dout("exit_ceph\n");
unregister_filesystem(&ceph_fs_type); unregister_filesystem(&ceph_fs_type);
ceph_caps_finalize();
destroy_caches(); destroy_caches();
ceph_msgr_exit(); ceph_msgr_exit();
ceph_debugfs_cleanup(); ceph_debugfs_cleanup();
......
...@@ -30,6 +30,12 @@ ...@@ -30,6 +30,12 @@
#define CEPH_BLOCK_SHIFT 20 /* 1 MB */ #define CEPH_BLOCK_SHIFT 20 /* 1 MB */
#define CEPH_BLOCK (1 << CEPH_BLOCK_SHIFT) #define CEPH_BLOCK (1 << CEPH_BLOCK_SHIFT)
/*
* Supported features
*/
#define CEPH_FEATURE_SUPPORTED CEPH_FEATURE_NOSRCADDR | CEPH_FEATURE_FLOCK
#define CEPH_FEATURE_REQUIRED CEPH_FEATURE_NOSRCADDR
/* /*
* mount options * mount options
*/ */
...@@ -560,11 +566,13 @@ static inline int __ceph_caps_wanted(struct ceph_inode_info *ci) ...@@ -560,11 +566,13 @@ static inline int __ceph_caps_wanted(struct ceph_inode_info *ci)
/* what the mds thinks we want */ /* what the mds thinks we want */
extern int __ceph_caps_mds_wanted(struct ceph_inode_info *ci); extern int __ceph_caps_mds_wanted(struct ceph_inode_info *ci);
extern void ceph_caps_init(void); extern void ceph_caps_init(struct ceph_mds_client *mdsc);
extern void ceph_caps_finalize(void); extern void ceph_caps_finalize(struct ceph_mds_client *mdsc);
extern void ceph_adjust_min_caps(int delta); extern void ceph_adjust_min_caps(struct ceph_mds_client *mdsc, int delta);
extern int ceph_reserve_caps(struct ceph_cap_reservation *ctx, int need); extern int ceph_reserve_caps(struct ceph_mds_client *mdsc,
extern int ceph_unreserve_caps(struct ceph_cap_reservation *ctx); struct ceph_cap_reservation *ctx, int need);
extern int ceph_unreserve_caps(struct ceph_mds_client *mdsc,
struct ceph_cap_reservation *ctx);
extern void ceph_reservation_status(struct ceph_client *client, extern void ceph_reservation_status(struct ceph_client *client,
int *total, int *avail, int *used, int *total, int *avail, int *used,
int *reserved, int *min); int *reserved, int *min);
...@@ -738,13 +746,6 @@ extern struct kmem_cache *ceph_file_cachep; ...@@ -738,13 +746,6 @@ extern struct kmem_cache *ceph_file_cachep;
extern const char *ceph_msg_type_name(int type); extern const char *ceph_msg_type_name(int type);
extern int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid); extern int ceph_check_fsid(struct ceph_client *client, struct ceph_fsid *fsid);
#define FSID_FORMAT "%02x%02x%02x%02x-%02x%02x-%02x%02x-%02x%02x-" \
"%02x%02x%02x%02x%02x%02x"
#define PR_FSID(f) (f)->fsid[0], (f)->fsid[1], (f)->fsid[2], (f)->fsid[3], \
(f)->fsid[4], (f)->fsid[5], (f)->fsid[6], (f)->fsid[7], \
(f)->fsid[8], (f)->fsid[9], (f)->fsid[10], (f)->fsid[11], \
(f)->fsid[12], (f)->fsid[13], (f)->fsid[14], (f)->fsid[15]
/* inode.c */ /* inode.c */
extern const struct inode_operations ceph_file_iops; extern const struct inode_operations ceph_file_iops;
...@@ -806,13 +807,16 @@ static inline void ceph_remove_cap(struct ceph_cap *cap) ...@@ -806,13 +807,16 @@ static inline void ceph_remove_cap(struct ceph_cap *cap)
__ceph_remove_cap(cap); __ceph_remove_cap(cap);
spin_unlock(&inode->i_lock); spin_unlock(&inode->i_lock);
} }
extern void ceph_put_cap(struct ceph_cap *cap); extern void ceph_put_cap(struct ceph_mds_client *mdsc,
struct ceph_cap *cap);
extern void ceph_queue_caps_release(struct inode *inode); extern void ceph_queue_caps_release(struct inode *inode);
extern int ceph_write_inode(struct inode *inode, struct writeback_control *wbc); extern int ceph_write_inode(struct inode *inode, struct writeback_control *wbc);
extern int ceph_fsync(struct file *file, int datasync); extern int ceph_fsync(struct file *file, int datasync);
extern void ceph_kick_flushing_caps(struct ceph_mds_client *mdsc, extern void ceph_kick_flushing_caps(struct ceph_mds_client *mdsc,
struct ceph_mds_session *session); struct ceph_mds_session *session);
extern struct ceph_cap *ceph_get_cap_for_mds(struct ceph_inode_info *ci,
int mds);
extern int ceph_get_cap_mds(struct inode *inode); extern int ceph_get_cap_mds(struct inode *inode);
extern void ceph_get_cap_refs(struct ceph_inode_info *ci, int caps); extern void ceph_get_cap_refs(struct ceph_inode_info *ci, int caps);
extern void ceph_put_cap_refs(struct ceph_inode_info *ci, int had); extern void ceph_put_cap_refs(struct ceph_inode_info *ci, int had);
...@@ -857,7 +861,7 @@ extern void ceph_release_page_vector(struct page **pages, int num_pages); ...@@ -857,7 +861,7 @@ extern void ceph_release_page_vector(struct page **pages, int num_pages);
/* dir.c */ /* dir.c */
extern const struct file_operations ceph_dir_fops; extern const struct file_operations ceph_dir_fops;
extern const struct inode_operations ceph_dir_iops; extern const struct inode_operations ceph_dir_iops;
extern struct dentry_operations ceph_dentry_ops, ceph_snap_dentry_ops, extern const struct dentry_operations ceph_dentry_ops, ceph_snap_dentry_ops,
ceph_snapdir_dentry_ops; ceph_snapdir_dentry_ops;
extern int ceph_handle_notrace_create(struct inode *dir, struct dentry *dentry); extern int ceph_handle_notrace_create(struct inode *dir, struct dentry *dentry);
...@@ -888,6 +892,14 @@ extern void ceph_debugfs_cleanup(void); ...@@ -888,6 +892,14 @@ extern void ceph_debugfs_cleanup(void);
extern int ceph_debugfs_client_init(struct ceph_client *client); extern int ceph_debugfs_client_init(struct ceph_client *client);
extern void ceph_debugfs_client_cleanup(struct ceph_client *client); extern void ceph_debugfs_client_cleanup(struct ceph_client *client);
/* locks.c */
extern int ceph_lock(struct file *file, int cmd, struct file_lock *fl);
extern int ceph_flock(struct file *file, int cmd, struct file_lock *fl);
extern void ceph_count_locks(struct inode *inode, int *p_num, int *f_num);
extern int ceph_encode_locks(struct inode *i, struct ceph_pagelist *p,
int p_locks, int f_locks);
extern int lock_to_ceph_filelock(struct file_lock *fl, struct ceph_filelock *c);
static inline struct inode *get_dentry_parent_inode(struct dentry *dentry) static inline struct inode *get_dentry_parent_inode(struct dentry *dentry)
{ {
if (dentry && dentry->d_parent) if (dentry && dentry->d_parent)
......
...@@ -337,6 +337,8 @@ void __ceph_destroy_xattrs(struct ceph_inode_info *ci) ...@@ -337,6 +337,8 @@ void __ceph_destroy_xattrs(struct ceph_inode_info *ci)
} }
static int __build_xattrs(struct inode *inode) static int __build_xattrs(struct inode *inode)
__releases(inode->i_lock)
__acquires(inode->i_lock)
{ {
u32 namelen; u32 namelen;
u32 numattr = 0; u32 numattr = 0;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment