Commit abfa034e authored by Aneesh Kumar K.V, committed by Eric Van Hensbergen

fs/9p: Update zero-copy implementation in 9p

* remove a lot of updates to different data structures
* add a separate callback for zero copy requests.
* above makes non zero copy code path simpler
* remove conditionalizing TREAD/TREADDIR/TWRITE in the zero copy path
* Fix the dotu p9_check_errors with zero copy. Add sufficient documentation around it
* Add support for both in and output buffers in zero copy callback
* pin and unpin pages in the same context
* use helpers instead of defining page offset and rest of page ourselves
* Fix memory leak in p9_check_errors
* Remove 'E' and 'F' in p9pdu_vwritef
Signed-off-by: Aneesh Kumar K.V <aneesh.kumar@linux.vnet.ibm.com>
Signed-off-by: Eric Van Hensbergen <ericvh@gmail.com>
parent c3b92c87
...@@ -231,7 +231,7 @@ static int v9fs_dir_readdir_dotl(struct file *filp, void *dirent, ...@@ -231,7 +231,7 @@ static int v9fs_dir_readdir_dotl(struct file *filp, void *dirent,
while (err == 0) { while (err == 0) {
if (rdir->tail == rdir->head) { if (rdir->tail == rdir->head) {
err = p9_client_readdir(fid, rdir->buf, buflen, err = p9_client_readdir(fid, rdir->buf, buflen,
filp->f_pos); filp->f_pos);
if (err <= 0) if (err <= 0)
goto unlock_and_exit; goto unlock_and_exit;
......
...@@ -359,6 +359,9 @@ enum p9_qid_t { ...@@ -359,6 +359,9 @@ enum p9_qid_t {
/* Room for readdir header */ /* Room for readdir header */
#define P9_READDIRHDRSZ 24 #define P9_READDIRHDRSZ 24
/* size of header for zero copy read/write */
#define P9_ZC_HDR_SZ 4096
/** /**
* struct p9_qid - file system entity information * struct p9_qid - file system entity information
* @type: 8-bit type &p9_qid_t * @type: 8-bit type &p9_qid_t
...@@ -555,10 +558,6 @@ struct p9_rstatfs { ...@@ -555,10 +558,6 @@ struct p9_rstatfs {
* @tag: transaction id of the request * @tag: transaction id of the request
* @offset: used by marshalling routines to track current position in buffer * @offset: used by marshalling routines to track current position in buffer
* @capacity: used by marshalling routines to track total malloc'd capacity * @capacity: used by marshalling routines to track total malloc'd capacity
* @pubuf: Payload user buffer given by the caller
* @pkbuf: Payload kernel buffer given by the caller
* @pbuf_size: pubuf/pkbuf(only one will be !NULL) size to be read/write.
* @private: For transport layer's use.
* @sdata: payload * @sdata: payload
* *
* &p9_fcall represents the structure for all 9P RPC * &p9_fcall represents the structure for all 9P RPC
...@@ -575,10 +574,6 @@ struct p9_fcall { ...@@ -575,10 +574,6 @@ struct p9_fcall {
size_t offset; size_t offset;
size_t capacity; size_t capacity;
char __user *pubuf;
char *pkbuf;
size_t pbuf_size;
void *private;
u8 *sdata; u8 *sdata;
}; };
......
...@@ -26,13 +26,6 @@ ...@@ -26,13 +26,6 @@
#ifndef NET_9P_TRANSPORT_H #ifndef NET_9P_TRANSPORT_H
#define NET_9P_TRANSPORT_H #define NET_9P_TRANSPORT_H
#define P9_TRANS_PREF_PAYLOAD_MASK 0x1
/* Default. Add Payload to PDU before sending it down to transport layer */
#define P9_TRANS_PREF_PAYLOAD_DEF 0x0
/* Send pay load separately to transport layer along with PDU.*/
#define P9_TRANS_PREF_PAYLOAD_SEP 0x1
/** /**
* struct p9_trans_module - transport module interface * struct p9_trans_module - transport module interface
* @list: used to maintain a list of currently available transports * @list: used to maintain a list of currently available transports
...@@ -56,13 +49,14 @@ struct p9_trans_module { ...@@ -56,13 +49,14 @@ struct p9_trans_module {
struct list_head list; struct list_head list;
char *name; /* name of transport */ char *name; /* name of transport */
int maxsize; /* max message size of transport */ int maxsize; /* max message size of transport */
int pref; /* Preferences of this transport */
int def; /* this transport should be default */ int def; /* this transport should be default */
struct module *owner; struct module *owner;
int (*create)(struct p9_client *, const char *, char *); int (*create)(struct p9_client *, const char *, char *);
void (*close) (struct p9_client *); void (*close) (struct p9_client *);
int (*request) (struct p9_client *, struct p9_req_t *req); int (*request) (struct p9_client *, struct p9_req_t *req);
int (*cancel) (struct p9_client *, struct p9_req_t *req); int (*cancel) (struct p9_client *, struct p9_req_t *req);
int (*zc_request)(struct p9_client *, struct p9_req_t *,
char *, char *, int , int, int, int);
}; };
void v9fs_register_trans(struct p9_trans_module *m); void v9fs_register_trans(struct p9_trans_module *m);
......
This diff is collapsed.
...@@ -81,7 +81,7 @@ void p9stat_free(struct p9_wstat *stbuf) ...@@ -81,7 +81,7 @@ void p9stat_free(struct p9_wstat *stbuf)
} }
EXPORT_SYMBOL(p9stat_free); EXPORT_SYMBOL(p9stat_free);
static size_t pdu_read(struct p9_fcall *pdu, void *data, size_t size) size_t pdu_read(struct p9_fcall *pdu, void *data, size_t size)
{ {
size_t len = min(pdu->size - pdu->offset, size); size_t len = min(pdu->size - pdu->offset, size);
memcpy(data, &pdu->sdata[pdu->offset], len); memcpy(data, &pdu->sdata[pdu->offset], len);
...@@ -108,26 +108,6 @@ pdu_write_u(struct p9_fcall *pdu, const char __user *udata, size_t size) ...@@ -108,26 +108,6 @@ pdu_write_u(struct p9_fcall *pdu, const char __user *udata, size_t size)
return size - len; return size - len;
} }
static size_t
pdu_write_urw(struct p9_fcall *pdu, const char *kdata, const char __user *udata,
size_t size)
{
BUG_ON(pdu->size > P9_IOHDRSZ);
pdu->pubuf = (char __user *)udata;
pdu->pkbuf = (char *)kdata;
pdu->pbuf_size = size;
return 0;
}
static size_t
pdu_write_readdir(struct p9_fcall *pdu, const char *kdata, size_t size)
{
BUG_ON(pdu->size > P9_READDIRHDRSZ);
pdu->pkbuf = (char *)kdata;
pdu->pbuf_size = size;
return 0;
}
/* /*
b - int8_t b - int8_t
w - int16_t w - int16_t
...@@ -459,26 +439,6 @@ p9pdu_vwritef(struct p9_fcall *pdu, int proto_version, const char *fmt, ...@@ -459,26 +439,6 @@ p9pdu_vwritef(struct p9_fcall *pdu, int proto_version, const char *fmt,
errcode = -EFAULT; errcode = -EFAULT;
} }
break; break;
case 'E':{
int32_t cnt = va_arg(ap, int32_t);
const char *k = va_arg(ap, const void *);
const char __user *u = va_arg(ap,
const void __user *);
errcode = p9pdu_writef(pdu, proto_version, "d",
cnt);
if (!errcode && pdu_write_urw(pdu, k, u, cnt))
errcode = -EFAULT;
}
break;
case 'F':{
int32_t cnt = va_arg(ap, int32_t);
const char *k = va_arg(ap, const void *);
errcode = p9pdu_writef(pdu, proto_version, "d",
cnt);
if (!errcode && pdu_write_readdir(pdu, k, cnt))
errcode = -EFAULT;
}
break;
case 'U':{ case 'U':{
int32_t count = va_arg(ap, int32_t); int32_t count = va_arg(ap, int32_t);
const char __user *udata = const char __user *udata =
...@@ -637,10 +597,6 @@ void p9pdu_reset(struct p9_fcall *pdu) ...@@ -637,10 +597,6 @@ void p9pdu_reset(struct p9_fcall *pdu)
{ {
pdu->offset = 0; pdu->offset = 0;
pdu->size = 0; pdu->size = 0;
pdu->private = NULL;
pdu->pubuf = NULL;
pdu->pkbuf = NULL;
pdu->pbuf_size = 0;
} }
int p9dirent_read(char *buf, int len, struct p9_dirent *dirent, int p9dirent_read(char *buf, int len, struct p9_dirent *dirent,
......
...@@ -32,3 +32,4 @@ int p9pdu_prepare(struct p9_fcall *pdu, int16_t tag, int8_t type); ...@@ -32,3 +32,4 @@ int p9pdu_prepare(struct p9_fcall *pdu, int16_t tag, int8_t type);
int p9pdu_finalize(struct p9_fcall *pdu); int p9pdu_finalize(struct p9_fcall *pdu);
void p9pdu_dump(int, struct p9_fcall *); void p9pdu_dump(int, struct p9_fcall *);
void p9pdu_reset(struct p9_fcall *pdu); void p9pdu_reset(struct p9_fcall *pdu);
size_t pdu_read(struct p9_fcall *pdu, void *data, size_t size);
...@@ -21,30 +21,25 @@ ...@@ -21,30 +21,25 @@
/** /**
* p9_release_req_pages - Release pages after the transaction. * p9_release_req_pages - Release pages after the transaction.
* @*private: PDU's private page of struct trans_rpage_info
*/ */
void void p9_release_pages(struct page **pages, int nr_pages)
p9_release_req_pages(struct trans_rpage_info *rpinfo)
{ {
int i = 0; int i = 0;
while (pages[i] && nr_pages--) {
while (rpinfo->rp_data[i] && rpinfo->rp_nr_pages--) { put_page(pages[i]);
put_page(rpinfo->rp_data[i]);
i++; i++;
} }
} }
EXPORT_SYMBOL(p9_release_req_pages); EXPORT_SYMBOL(p9_release_pages);
/** /**
* p9_nr_pages - Return number of pages needed to accommodate the payload. * p9_nr_pages - Return number of pages needed to accommodate the payload.
*/ */
int int p9_nr_pages(char *data, int len)
p9_nr_pages(struct p9_req_t *req)
{ {
unsigned long start_page, end_page; unsigned long start_page, end_page;
start_page = (unsigned long)req->tc->pubuf >> PAGE_SHIFT; start_page = (unsigned long)data >> PAGE_SHIFT;
end_page = ((unsigned long)req->tc->pubuf + req->tc->pbuf_size + end_page = ((unsigned long)data + len + PAGE_SIZE - 1) >> PAGE_SHIFT;
PAGE_SIZE - 1) >> PAGE_SHIFT;
return end_page - start_page; return end_page - start_page;
} }
EXPORT_SYMBOL(p9_nr_pages); EXPORT_SYMBOL(p9_nr_pages);
...@@ -58,35 +53,17 @@ EXPORT_SYMBOL(p9_nr_pages); ...@@ -58,35 +53,17 @@ EXPORT_SYMBOL(p9_nr_pages);
* @nr_pages: number of pages to accommodate the payload * @nr_pages: number of pages to accommodate the payload
* @rw: Indicates if the pages are for read or write. * @rw: Indicates if the pages are for read or write.
*/ */
int
p9_payload_gup(struct p9_req_t *req, size_t *pdata_off, int *pdata_len,
int nr_pages, u8 rw)
{
uint32_t first_page_bytes = 0;
int32_t pdata_mapped_pages;
struct trans_rpage_info *rpinfo;
*pdata_off = (__force size_t)req->tc->pubuf & (PAGE_SIZE-1);
if (*pdata_off) int p9_payload_gup(char *data, int *nr_pages, struct page **pages, int write)
first_page_bytes = min(((size_t)PAGE_SIZE - *pdata_off), {
req->tc->pbuf_size); int nr_mapped_pages;
rpinfo = req->tc->private; nr_mapped_pages = get_user_pages_fast((unsigned long)data,
pdata_mapped_pages = get_user_pages_fast((unsigned long)req->tc->pubuf, *nr_pages, write, pages);
nr_pages, rw, &rpinfo->rp_data[0]); if (nr_mapped_pages <= 0)
if (pdata_mapped_pages <= 0) return nr_mapped_pages;
return pdata_mapped_pages;
rpinfo->rp_nr_pages = pdata_mapped_pages; *nr_pages = nr_mapped_pages;
if (*pdata_off) {
*pdata_len = first_page_bytes;
*pdata_len += min((req->tc->pbuf_size - *pdata_len),
((size_t)pdata_mapped_pages - 1) << PAGE_SHIFT);
} else {
*pdata_len = min(req->tc->pbuf_size,
(size_t)pdata_mapped_pages << PAGE_SHIFT);
}
return 0; return 0;
} }
EXPORT_SYMBOL(p9_payload_gup); EXPORT_SYMBOL(p9_payload_gup);
...@@ -12,21 +12,6 @@ ...@@ -12,21 +12,6 @@
* *
*/ */
/* TRUE if it is user context */ void p9_release_pages(struct page **, int);
#define P9_IS_USER_CONTEXT (!segment_eq(get_fs(), KERNEL_DS)) int p9_payload_gup(char *, int *, struct page **, int);
int p9_nr_pages(char *, int);
/**
* struct trans_rpage_info - To store mapped page information in PDU.
* @rp_alloc:Set if this structure is allocd, not a reuse unused space in pdu.
* @rp_nr_pages: Number of mapped pages
* @rp_data: Array of page pointers
*/
struct trans_rpage_info {
u8 rp_alloc;
int rp_nr_pages;
struct page *rp_data[0];
};
void p9_release_req_pages(struct trans_rpage_info *);
int p9_payload_gup(struct p9_req_t *, size_t *, int *, int, u8);
int p9_nr_pages(struct p9_req_t *);
This diff is collapsed.
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment