Commit 4420cfd3 authored by James Simmons's avatar James Simmons Committed by Greg Kroah-Hartman

staging: lustre: format properly all comment blocks for LNet core

In several places in the LNet core comment blocks don't follow the
linux kernel style. This patch cleans those problems up.
Signed-off-by: default avatarJames Simmons <jsimmons@infradead.org>
Signed-off-by: default avatarGreg Kroah-Hartman <gregkh@linuxfoundation.org>
parent ddbc66a5
...@@ -48,7 +48,8 @@ ...@@ -48,7 +48,8 @@
/** \defgroup lnet_init_fini Initialization and cleanup /** \defgroup lnet_init_fini Initialization and cleanup
* The LNet must be properly initialized before any LNet calls can be made. * The LNet must be properly initialized before any LNet calls can be made.
* @{ */ * @{
*/
int LNetNIInit(lnet_pid_t requested_pid); int LNetNIInit(lnet_pid_t requested_pid);
int LNetNIFini(void); int LNetNIFini(void);
/** @} lnet_init_fini */ /** @} lnet_init_fini */
...@@ -71,7 +72,8 @@ int LNetNIFini(void); ...@@ -71,7 +72,8 @@ int LNetNIFini(void);
* it's an entry in the portals table of a process. * it's an entry in the portals table of a process.
* *
* \see LNetMEAttach * \see LNetMEAttach
* @{ */ * @{
*/
int LNetGetId(unsigned int index, lnet_process_id_t *id); int LNetGetId(unsigned int index, lnet_process_id_t *id);
int LNetDist(lnet_nid_t nid, lnet_nid_t *srcnid, __u32 *order); int LNetDist(lnet_nid_t nid, lnet_nid_t *srcnid, __u32 *order);
void LNetSnprintHandle(char *str, int str_len, lnet_handle_any_t handle); void LNetSnprintHandle(char *str, int str_len, lnet_handle_any_t handle);
...@@ -89,7 +91,8 @@ void LNetSnprintHandle(char *str, int str_len, lnet_handle_any_t handle); ...@@ -89,7 +91,8 @@ void LNetSnprintHandle(char *str, int str_len, lnet_handle_any_t handle);
* incoming requests based on process ID or the match bits provided in the * incoming requests based on process ID or the match bits provided in the
* request. MEs can be dynamically inserted into a match list by LNetMEAttach() * request. MEs can be dynamically inserted into a match list by LNetMEAttach()
* and LNetMEInsert(), and removed from its list by LNetMEUnlink(). * and LNetMEInsert(), and removed from its list by LNetMEUnlink().
* @{ */ * @{
*/
int LNetMEAttach(unsigned int portal, int LNetMEAttach(unsigned int portal,
lnet_process_id_t match_id_in, lnet_process_id_t match_id_in,
__u64 match_bits_in, __u64 match_bits_in,
...@@ -120,7 +123,8 @@ int LNetMEUnlink(lnet_handle_me_t current_in); ...@@ -120,7 +123,8 @@ int LNetMEUnlink(lnet_handle_me_t current_in);
* The LNet API provides two operations to create MDs: LNetMDAttach() * The LNet API provides two operations to create MDs: LNetMDAttach()
* and LNetMDBind(); one operation to unlink and release the resources * and LNetMDBind(); one operation to unlink and release the resources
* associated with a MD: LNetMDUnlink(). * associated with a MD: LNetMDUnlink().
* @{ */ * @{
*/
int LNetMDAttach(lnet_handle_me_t current_in, int LNetMDAttach(lnet_handle_me_t current_in,
lnet_md_t md_in, lnet_md_t md_in,
lnet_unlink_t unlink_in, lnet_unlink_t unlink_in,
...@@ -154,7 +158,8 @@ int LNetMDUnlink(lnet_handle_md_t md_in); ...@@ -154,7 +158,8 @@ int LNetMDUnlink(lnet_handle_md_t md_in);
* event from an EQ, and LNetEQWait() can be used to block a process until * event from an EQ, and LNetEQWait() can be used to block a process until
* an EQ has at least one event. LNetEQPoll() can be used to test or wait * an EQ has at least one event. LNetEQPoll() can be used to test or wait
* on multiple EQs. * on multiple EQs.
* @{ */ * @{
*/
int LNetEQAlloc(unsigned int count_in, int LNetEQAlloc(unsigned int count_in,
lnet_eq_handler_t handler, lnet_eq_handler_t handler,
lnet_handle_eq_t *handle_out); lnet_handle_eq_t *handle_out);
...@@ -172,7 +177,8 @@ int LNetEQPoll(lnet_handle_eq_t *eventqs_in, ...@@ -172,7 +177,8 @@ int LNetEQPoll(lnet_handle_eq_t *eventqs_in,
* *
* The LNet API provides two data movement operations: LNetPut() * The LNet API provides two data movement operations: LNetPut()
* and LNetGet(). * and LNetGet().
* @{ */ * @{
*/
int LNetPut(lnet_nid_t self, int LNetPut(lnet_nid_t self,
lnet_handle_md_t md_in, lnet_handle_md_t md_in,
lnet_ack_req_t ack_req_in, lnet_ack_req_t ack_req_in,
...@@ -192,8 +198,8 @@ int LNetGet(lnet_nid_t self, ...@@ -192,8 +198,8 @@ int LNetGet(lnet_nid_t self,
/** \defgroup lnet_misc Miscellaneous operations. /** \defgroup lnet_misc Miscellaneous operations.
* Miscellaneous operations. * Miscellaneous operations.
* @{ */ * @{
*/
int LNetSetLazyPortal(int portal); int LNetSetLazyPortal(int portal);
int LNetClearLazyPortal(int portal); int LNetClearLazyPortal(int portal);
int LNetCtl(unsigned int cmd, void *arg); int LNetCtl(unsigned int cmd, void *arg);
......
...@@ -79,7 +79,8 @@ static inline int lnet_md_exhausted(lnet_libmd_t *md) ...@@ -79,7 +79,8 @@ static inline int lnet_md_exhausted(lnet_libmd_t *md)
static inline int lnet_md_unlinkable(lnet_libmd_t *md) static inline int lnet_md_unlinkable(lnet_libmd_t *md)
{ {
/* Should unlink md when its refcount is 0 and either: /*
* Should unlink md when its refcount is 0 and either:
* - md has been flagged for deletion (by auto unlink or * - md has been flagged for deletion (by auto unlink or
* LNetM[DE]Unlink, in the latter case md may not be exhausted). * LNetM[DE]Unlink, in the latter case md may not be exhausted).
* - auto unlink is on and md is exhausted. * - auto unlink is on and md is exhausted.
...@@ -102,8 +103,10 @@ lnet_cpt_of_cookie(__u64 cookie) ...@@ -102,8 +103,10 @@ lnet_cpt_of_cookie(__u64 cookie)
{ {
unsigned int cpt = (cookie >> LNET_COOKIE_TYPE_BITS) & LNET_CPT_MASK; unsigned int cpt = (cookie >> LNET_COOKIE_TYPE_BITS) & LNET_CPT_MASK;
/* LNET_CPT_NUMBER doesn't have to be power2, which means we can /*
* get illegal cpt from it's invalid cookie */ * LNET_CPT_NUMBER doesn't have to be power2, which means we can
* get illegal cpt from it's invalid cookie
*/
return cpt < LNET_CPT_NUMBER ? cpt : cpt % LNET_CPT_NUMBER; return cpt < LNET_CPT_NUMBER ? cpt : cpt % LNET_CPT_NUMBER;
} }
......
...@@ -85,8 +85,7 @@ typedef struct lnet_msg { ...@@ -85,8 +85,7 @@ typedef struct lnet_msg {
unsigned int msg_receiving:1; /* being received */ unsigned int msg_receiving:1; /* being received */
unsigned int msg_txcredit:1; /* taken an NI send credit */ unsigned int msg_txcredit:1; /* taken an NI send credit */
unsigned int msg_peertxcredit:1; /* taken a peer send credit */ unsigned int msg_peertxcredit:1; /* taken a peer send credit */
unsigned int msg_rtrcredit:1; /* taken a global unsigned int msg_rtrcredit:1; /* taken a global router credit */
router credit */
unsigned int msg_peerrtrcredit:1; /* taken a peer router credit */ unsigned int msg_peerrtrcredit:1; /* taken a peer router credit */
unsigned int msg_onactivelist:1; /* on the activelist */ unsigned int msg_onactivelist:1; /* on the activelist */
...@@ -190,7 +189,8 @@ typedef struct lnet_lnd { ...@@ -190,7 +189,8 @@ typedef struct lnet_lnd {
void (*lnd_shutdown)(struct lnet_ni *ni); void (*lnd_shutdown)(struct lnet_ni *ni);
int (*lnd_ctl)(struct lnet_ni *ni, unsigned int cmd, void *arg); int (*lnd_ctl)(struct lnet_ni *ni, unsigned int cmd, void *arg);
/* In data movement APIs below, payload buffers are described as a set /*
* In data movement APIs below, payload buffers are described as a set
* of 'niov' fragments which are... * of 'niov' fragments which are...
* EITHER * EITHER
* in virtual memory (struct iovec *iov != NULL) * in virtual memory (struct iovec *iov != NULL)
...@@ -201,30 +201,36 @@ typedef struct lnet_lnd { ...@@ -201,30 +201,36 @@ typedef struct lnet_lnd {
* fragments to start from * fragments to start from
*/ */
/* Start sending a preformatted message. 'private' is NULL for PUT and /*
* Start sending a preformatted message. 'private' is NULL for PUT and
* GET messages; otherwise this is a response to an incoming message * GET messages; otherwise this is a response to an incoming message
* and 'private' is the 'private' passed to lnet_parse(). Return * and 'private' is the 'private' passed to lnet_parse(). Return
* non-zero for immediate failure, otherwise complete later with * non-zero for immediate failure, otherwise complete later with
* lnet_finalize() */ * lnet_finalize()
*/
int (*lnd_send)(struct lnet_ni *ni, void *private, lnet_msg_t *msg); int (*lnd_send)(struct lnet_ni *ni, void *private, lnet_msg_t *msg);
/* Start receiving 'mlen' bytes of payload data, skipping the following /*
* Start receiving 'mlen' bytes of payload data, skipping the following
* 'rlen' - 'mlen' bytes. 'private' is the 'private' passed to * 'rlen' - 'mlen' bytes. 'private' is the 'private' passed to
* lnet_parse(). Return non-zero for immediate failure, otherwise * lnet_parse(). Return non-zero for immediate failure, otherwise
* complete later with lnet_finalize(). This also gives back a receive * complete later with lnet_finalize(). This also gives back a receive
* credit if the LND does flow control. */ * credit if the LND does flow control.
*/
int (*lnd_recv)(struct lnet_ni *ni, void *private, lnet_msg_t *msg, int (*lnd_recv)(struct lnet_ni *ni, void *private, lnet_msg_t *msg,
int delayed, unsigned int niov, int delayed, unsigned int niov,
struct kvec *iov, lnet_kiov_t *kiov, struct kvec *iov, lnet_kiov_t *kiov,
unsigned int offset, unsigned int mlen, unsigned int offset, unsigned int mlen,
unsigned int rlen); unsigned int rlen);
/* lnet_parse() has had to delay processing of this message /*
* lnet_parse() has had to delay processing of this message
* (e.g. waiting for a forwarding buffer or send credits). Give the * (e.g. waiting for a forwarding buffer or send credits). Give the
* LND a chance to free urgently needed resources. If called, return 0 * LND a chance to free urgently needed resources. If called, return 0
* for success and do NOT give back a receive credit; that has to wait * for success and do NOT give back a receive credit; that has to wait
* until lnd_recv() gets called. On failure return < 0 and * until lnd_recv() gets called. On failure return < 0 and
* release resources; lnd_recv() will not be called. */ * release resources; lnd_recv() will not be called.
*/
int (*lnd_eager_recv)(struct lnet_ni *ni, void *private, int (*lnd_eager_recv)(struct lnet_ni *ni, void *private,
lnet_msg_t *msg, void **new_privatep); lnet_msg_t *msg, void **new_privatep);
...@@ -272,8 +278,10 @@ typedef struct lnet_ni { ...@@ -272,8 +278,10 @@ typedef struct lnet_ni {
#define LNET_PROTO_PING_MATCHBITS 0x8000000000000000LL #define LNET_PROTO_PING_MATCHBITS 0x8000000000000000LL
/* NB: value of these features equal to LNET_PROTO_PING_VERSION_x /*
* of old LNet, so there shouldn't be any compatibility issue */ * NB: value of these features equal to LNET_PROTO_PING_VERSION_x
* of old LNet, so there shouldn't be any compatibility issue
*/
#define LNET_PING_FEAT_INVAL (0) /* no feature */ #define LNET_PING_FEAT_INVAL (0) /* no feature */
#define LNET_PING_FEAT_BASE (1 << 0) /* just a ping */ #define LNET_PING_FEAT_BASE (1 << 0) /* just a ping */
#define LNET_PING_FEAT_NI_STATUS (1 << 1) /* return NI status */ #define LNET_PING_FEAT_NI_STATUS (1 << 1) /* return NI status */
...@@ -347,8 +355,10 @@ struct lnet_peer_table { ...@@ -347,8 +355,10 @@ struct lnet_peer_table {
struct list_head *pt_hash; /* NID->peer hash */ struct list_head *pt_hash; /* NID->peer hash */
}; };
/* peer aliveness is enabled only on routers for peers in a network where the /*
* lnet_ni_t::ni_peertimeout has been set to a positive value */ * peer aliveness is enabled only on routers for peers in a network where the
* lnet_ni_t::ni_peertimeout has been set to a positive value
*/
#define lnet_peer_aliveness_enabled(lp) (the_lnet.ln_routing != 0 && \ #define lnet_peer_aliveness_enabled(lp) (the_lnet.ln_routing != 0 && \
(lp)->lp_ni->ni_peertimeout > 0) (lp)->lp_ni->ni_peertimeout > 0)
...@@ -433,12 +443,16 @@ struct lnet_match_info { ...@@ -433,12 +443,16 @@ struct lnet_match_info {
#define LNET_MT_HASH_BITS 8 #define LNET_MT_HASH_BITS 8
#define LNET_MT_HASH_SIZE (1 << LNET_MT_HASH_BITS) #define LNET_MT_HASH_SIZE (1 << LNET_MT_HASH_BITS)
#define LNET_MT_HASH_MASK (LNET_MT_HASH_SIZE - 1) #define LNET_MT_HASH_MASK (LNET_MT_HASH_SIZE - 1)
/* we allocate (LNET_MT_HASH_SIZE + 1) entries for lnet_match_table::mt_hash, /*
* the last entry is reserved for MEs with ignore-bits */ * we allocate (LNET_MT_HASH_SIZE + 1) entries for lnet_match_table::mt_hash,
* the last entry is reserved for MEs with ignore-bits
*/
#define LNET_MT_HASH_IGNORE LNET_MT_HASH_SIZE #define LNET_MT_HASH_IGNORE LNET_MT_HASH_SIZE
/* __u64 has 2^6 bits, so need 2^(LNET_MT_HASH_BITS - LNET_MT_BITS_U64) which /*
* __u64 has 2^6 bits, so need 2^(LNET_MT_HASH_BITS - LNET_MT_BITS_U64) which
* is 4 __u64s as bit-map, and add an extra __u64 (only use one bit) for the * is 4 __u64s as bit-map, and add an extra __u64 (only use one bit) for the
* ME-list with ignore-bits, which is mtable::mt_hash[LNET_MT_HASH_IGNORE] */ * ME-list with ignore-bits, which is mtable::mt_hash[LNET_MT_HASH_IGNORE]
*/
#define LNET_MT_BITS_U64 6 /* 2^6 bits */ #define LNET_MT_BITS_U64 6 /* 2^6 bits */
#define LNET_MT_EXHAUSTED_BITS (LNET_MT_HASH_BITS - LNET_MT_BITS_U64) #define LNET_MT_EXHAUSTED_BITS (LNET_MT_HASH_BITS - LNET_MT_BITS_U64)
#define LNET_MT_EXHAUSTED_BMAP ((1 << LNET_MT_EXHAUSTED_BITS) + 1) #define LNET_MT_EXHAUSTED_BMAP ((1 << LNET_MT_EXHAUSTED_BITS) + 1)
...@@ -448,8 +462,10 @@ struct lnet_match_table { ...@@ -448,8 +462,10 @@ struct lnet_match_table {
/* reserved for upcoming patches, CPU partition ID */ /* reserved for upcoming patches, CPU partition ID */
unsigned int mt_cpt; unsigned int mt_cpt;
unsigned int mt_portal; /* portal index */ unsigned int mt_portal; /* portal index */
/* match table is set as "enabled" if there's non-exhausted MD /*
* attached on mt_mhash, it's only valid for wildcard portal */ * match table is set as "enabled" if there's non-exhausted MD
* attached on mt_mhash, it's only valid for wildcard portal
*/
unsigned int mt_enabled; unsigned int mt_enabled;
/* bitmap to flag whether MEs on mt_hash are exhausted or not */ /* bitmap to flag whether MEs on mt_hash are exhausted or not */
__u64 mt_exhausted[LNET_MT_EXHAUSTED_BMAP]; __u64 mt_exhausted[LNET_MT_EXHAUSTED_BMAP];
......
...@@ -34,8 +34,10 @@ ...@@ -34,8 +34,10 @@
* Lustre Network Driver types. * Lustre Network Driver types.
*/ */
enum { enum {
/* Only add to these values (i.e. don't ever change or redefine them): /*
* network addresses depend on them... */ * Only add to these values (i.e. don't ever change or redefine them):
* network addresses depend on them...
*/
QSWLND = 1, QSWLND = 1,
SOCKLND = 2, SOCKLND = 2,
GMLND = 3, GMLND = 3,
......
...@@ -91,8 +91,10 @@ socklnd_init_msg(ksock_msg_t *msg, int type) ...@@ -91,8 +91,10 @@ socklnd_init_msg(ksock_msg_t *msg, int type)
#define KSOCK_MSG_NOOP 0xC0 /* ksm_u empty */ #define KSOCK_MSG_NOOP 0xC0 /* ksm_u empty */
#define KSOCK_MSG_LNET 0xC1 /* lnet msg */ #define KSOCK_MSG_LNET 0xC1 /* lnet msg */
/* We need to know this number to parse hello msg from ksocklnd in /*
* other LND (usocklnd, for example) */ * We need to know this number to parse hello msg from ksocklnd in
* other LND (usocklnd, for example)
*/
#define KSOCK_PROTO_V2 2 #define KSOCK_PROTO_V2 2
#define KSOCK_PROTO_V3 3 #define KSOCK_PROTO_V3 3
......
...@@ -36,10 +36,12 @@ ...@@ -36,10 +36,12 @@
#include <linux/types.h> #include <linux/types.h>
/** \addtogroup lnet /** \addtogroup lnet
* @{ */ * @{
*/
/** \addtogroup lnet_addr /** \addtogroup lnet_addr
* @{ */ * @{
*/
/** Portal reserved for LNet's own use. /** Portal reserved for LNet's own use.
* \see lustre/include/lustre/lustre_idl.h for Lustre portal assignments. * \see lustre/include/lustre/lustre_idl.h for Lustre portal assignments.
...@@ -116,10 +118,12 @@ typedef struct { ...@@ -116,10 +118,12 @@ typedef struct {
lnet_pid_t pid; lnet_pid_t pid;
} WIRE_ATTR lnet_process_id_packed_t; } WIRE_ATTR lnet_process_id_packed_t;
/* The wire handle's interface cookie only matches one network interface in /*
* The wire handle's interface cookie only matches one network interface in
* one epoch (i.e. new cookie when the interface restarts or the node * one epoch (i.e. new cookie when the interface restarts or the node
* reboots). The object cookie only matches one object on that interface * reboots). The object cookie only matches one object on that interface
* during that object's lifetime (i.e. no cookie re-use). */ * during that object's lifetime (i.e. no cookie re-use).
*/
typedef struct { typedef struct {
__u64 wh_interface_cookie; __u64 wh_interface_cookie;
__u64 wh_object_cookie; __u64 wh_object_cookie;
...@@ -133,10 +137,12 @@ typedef enum { ...@@ -133,10 +137,12 @@ typedef enum {
LNET_MSG_HELLO, LNET_MSG_HELLO,
} lnet_msg_type_t; } lnet_msg_type_t;
/* The variant fields of the portals message header are aligned on an 8 /*
* The variant fields of the portals message header are aligned on an 8
* byte boundary in the message header. Note that all types used in these * byte boundary in the message header. Note that all types used in these
* wire structs MUST be fixed size and the smaller types are placed at the * wire structs MUST be fixed size and the smaller types are placed at the
* end. */ * end.
*/
typedef struct lnet_ack { typedef struct lnet_ack {
lnet_handle_wire_t dst_wmd; lnet_handle_wire_t dst_wmd;
__u64 match_bits; __u64 match_bits;
...@@ -185,7 +191,8 @@ typedef struct { ...@@ -185,7 +191,8 @@ typedef struct {
} msg; } msg;
} WIRE_ATTR lnet_hdr_t; } WIRE_ATTR lnet_hdr_t;
/* A HELLO message contains a magic number and protocol version /*
* A HELLO message contains a magic number and protocol version
* code in the header's dest_nid, the peer's NID in the src_nid, and * code in the header's dest_nid, the peer's NID in the src_nid, and
* LNET_MSG_HELLO in the type field. All other common fields are zero * LNET_MSG_HELLO in the type field. All other common fields are zero
* (including payload_size; i.e. no payload). * (including payload_size; i.e. no payload).
...@@ -208,8 +215,10 @@ typedef struct { ...@@ -208,8 +215,10 @@ typedef struct {
#define LNET_PROTO_PING_MAGIC 0x70696E67 /* 'ping' */ #define LNET_PROTO_PING_MAGIC 0x70696E67 /* 'ping' */
/* Placeholder for a future "unified" protocol across all LNDs */ /* Placeholder for a future "unified" protocol across all LNDs */
/* Current LNDs that receive a request with this magic will respond with a /*
* "stub" reply using their current protocol */ * Current LNDs that receive a request with this magic will respond with a
* "stub" reply using their current protocol
*/
#define LNET_PROTO_MAGIC 0x45726963 /* ! */ #define LNET_PROTO_MAGIC 0x45726963 /* ! */
#define LNET_PROTO_TCP_VERSION_MAJOR 1 #define LNET_PROTO_TCP_VERSION_MAJOR 1
...@@ -258,7 +267,7 @@ typedef struct lnet_counters { ...@@ -258,7 +267,7 @@ typedef struct lnet_counters {
#define LNET_MAX_INTERFACES 16 #define LNET_MAX_INTERFACES 16
/* /**
* Objects maintained by the LNet are accessed through handles. Handle types * Objects maintained by the LNet are accessed through handles. Handle types
* have names of the form lnet_handle_xx_t, where xx is one of the two letter * have names of the form lnet_handle_xx_t, where xx is one of the two letter
* object type codes ('eq' for event queue, 'md' for memory descriptor, and * object type codes ('eq' for event queue, 'md' for memory descriptor, and
...@@ -318,7 +327,8 @@ typedef struct { ...@@ -318,7 +327,8 @@ typedef struct {
/** @} lnet_addr */ /** @} lnet_addr */
/** \addtogroup lnet_me /** \addtogroup lnet_me
* @{ */ * @{
*/
/** /**
* Specifies whether the match entry or memory descriptor should be unlinked * Specifies whether the match entry or memory descriptor should be unlinked
...@@ -348,7 +358,8 @@ typedef enum { ...@@ -348,7 +358,8 @@ typedef enum {
/** @} lnet_me */ /** @} lnet_me */
/** \addtogroup lnet_md /** \addtogroup lnet_md
* @{ */ * @{
*/
/** /**
* Defines the visible parts of a memory descriptor. Values of this type * Defines the visible parts of a memory descriptor. Values of this type
...@@ -450,9 +461,11 @@ typedef struct { ...@@ -450,9 +461,11 @@ typedef struct {
lnet_handle_eq_t eq_handle; lnet_handle_eq_t eq_handle;
} lnet_md_t; } lnet_md_t;
/* Max Transfer Unit (minimum supported everywhere). /*
* Max Transfer Unit (minimum supported everywhere).
* CAVEAT EMPTOR, with multinet (i.e. routers forwarding between networks) * CAVEAT EMPTOR, with multinet (i.e. routers forwarding between networks)
* these limits are system wide and not interface-local. */ * these limits are system wide and not interface-local.
*/
#define LNET_MTU_BITS 20 #define LNET_MTU_BITS 20
#define LNET_MTU (1 << LNET_MTU_BITS) #define LNET_MTU (1 << LNET_MTU_BITS)
...@@ -506,7 +519,8 @@ typedef struct { ...@@ -506,7 +519,8 @@ typedef struct {
/** @} lnet_md */ /** @} lnet_md */
/** \addtogroup lnet_eq /** \addtogroup lnet_eq
* @{ */ * @{
*/
/** /**
* Six types of events can be logged in an event queue. * Six types of events can be logged in an event queue.
...@@ -640,7 +654,8 @@ typedef void (*lnet_eq_handler_t)(lnet_event_t *event); ...@@ -640,7 +654,8 @@ typedef void (*lnet_eq_handler_t)(lnet_event_t *event);
/** @} lnet_eq */ /** @} lnet_eq */
/** \addtogroup lnet_data /** \addtogroup lnet_data
* @{ */ * @{
*/
/** /**
* Specify whether an acknowledgment should be sent by target when the PUT * Specify whether an acknowledgment should be sent by target when the PUT
......
...@@ -189,8 +189,10 @@ void kiblnd_pack_msg(lnet_ni_t *ni, kib_msg_t *msg, int version, ...@@ -189,8 +189,10 @@ void kiblnd_pack_msg(lnet_ni_t *ni, kib_msg_t *msg, int version,
{ {
kib_net_t *net = ni->ni_data; kib_net_t *net = ni->ni_data;
/* CAVEAT EMPTOR! all message fields not set here should have been /*
* initialised previously. */ * CAVEAT EMPTOR! all message fields not set here should have been
* initialised previously.
*/
msg->ibm_magic = IBLND_MSG_MAGIC; msg->ibm_magic = IBLND_MSG_MAGIC;
msg->ibm_version = version; msg->ibm_version = version;
/* ibm_type */ /* ibm_type */
...@@ -249,8 +251,10 @@ int kiblnd_unpack_msg(kib_msg_t *msg, int nob) ...@@ -249,8 +251,10 @@ int kiblnd_unpack_msg(kib_msg_t *msg, int nob)
return -EPROTO; return -EPROTO;
} }
/* checksum must be computed with ibm_cksum zero and BEFORE anything /*
* gets flipped */ * checksum must be computed with ibm_cksum zero and BEFORE anything
* gets flipped
*/
msg_cksum = flip ? __swab32(msg->ibm_cksum) : msg->ibm_cksum; msg_cksum = flip ? __swab32(msg->ibm_cksum) : msg->ibm_cksum;
msg->ibm_cksum = 0; msg->ibm_cksum = 0;
if (msg_cksum != 0 && if (msg_cksum != 0 &&
...@@ -375,17 +379,21 @@ void kiblnd_destroy_peer(kib_peer_t *peer) ...@@ -375,17 +379,21 @@ void kiblnd_destroy_peer(kib_peer_t *peer)
LIBCFS_FREE(peer, sizeof(*peer)); LIBCFS_FREE(peer, sizeof(*peer));
/* NB a peer's connections keep a reference on their peer until /*
* NB a peer's connections keep a reference on their peer until
* they are destroyed, so we can be assured that _all_ state to do * they are destroyed, so we can be assured that _all_ state to do
* with this peer has been cleaned up when its refcount drops to * with this peer has been cleaned up when its refcount drops to
* zero. */ * zero.
*/
atomic_dec(&net->ibn_npeers); atomic_dec(&net->ibn_npeers);
} }
kib_peer_t *kiblnd_find_peer_locked(lnet_nid_t nid) kib_peer_t *kiblnd_find_peer_locked(lnet_nid_t nid)
{ {
/* the caller is responsible for accounting the additional reference /*
* that this creates */ * the caller is responsible for accounting the additional reference
* that this creates
*/
struct list_head *peer_list = kiblnd_nid2peerlist(nid); struct list_head *peer_list = kiblnd_nid2peerlist(nid);
struct list_head *tmp; struct list_head *tmp;
kib_peer_t *peer; kib_peer_t *peer;
...@@ -474,8 +482,10 @@ static void kiblnd_del_peer_locked(kib_peer_t *peer) ...@@ -474,8 +482,10 @@ static void kiblnd_del_peer_locked(kib_peer_t *peer)
} }
/* NB closing peer's last conn unlinked it. */ /* NB closing peer's last conn unlinked it. */
} }
/* NB peer now unlinked; might even be freed if the peer table had the /*
* last ref on it. */ * NB peer now unlinked; might even be freed if the peer table had the
* last ref on it.
*/
} }
static int kiblnd_del_peer(lnet_ni_t *ni, lnet_nid_t nid) static int kiblnd_del_peer(lnet_ni_t *ni, lnet_nid_t nid)
...@@ -636,13 +646,15 @@ static int kiblnd_get_completion_vector(kib_conn_t *conn, int cpt) ...@@ -636,13 +646,15 @@ static int kiblnd_get_completion_vector(kib_conn_t *conn, int cpt)
kib_conn_t *kiblnd_create_conn(kib_peer_t *peer, struct rdma_cm_id *cmid, kib_conn_t *kiblnd_create_conn(kib_peer_t *peer, struct rdma_cm_id *cmid,
int state, int version) int state, int version)
{ {
/* CAVEAT EMPTOR: /*
* CAVEAT EMPTOR:
* If the new conn is created successfully it takes over the caller's * If the new conn is created successfully it takes over the caller's
* ref on 'peer'. It also "owns" 'cmid' and destroys it when it itself * ref on 'peer'. It also "owns" 'cmid' and destroys it when it itself
* is destroyed. On failure, the caller's ref on 'peer' remains and * is destroyed. On failure, the caller's ref on 'peer' remains and
* she must dispose of 'cmid'. (Actually I'd block forever if I tried * she must dispose of 'cmid'. (Actually I'd block forever if I tried
* to destroy 'cmid' here since I'm called from the CM which still has * to destroy 'cmid' here since I'm called from the CM which still has
* its ref on 'cmid'). */ * its ref on 'cmid').
*/
rwlock_t *glock = &kiblnd_data.kib_global_lock; rwlock_t *glock = &kiblnd_data.kib_global_lock;
kib_net_t *net = peer->ibp_ni->ni_data; kib_net_t *net = peer->ibp_ni->ni_data;
kib_dev_t *dev; kib_dev_t *dev;
...@@ -800,15 +812,19 @@ kib_conn_t *kiblnd_create_conn(kib_peer_t *peer, struct rdma_cm_id *cmid, ...@@ -800,15 +812,19 @@ kib_conn_t *kiblnd_create_conn(kib_peer_t *peer, struct rdma_cm_id *cmid,
/* Make posted receives complete */ /* Make posted receives complete */
kiblnd_abort_receives(conn); kiblnd_abort_receives(conn);
/* correct # of posted buffers /*
* NB locking needed now I'm racing with completion */ * correct # of posted buffers
* NB locking needed now I'm racing with completion
*/
spin_lock_irqsave(&sched->ibs_lock, flags); spin_lock_irqsave(&sched->ibs_lock, flags);
conn->ibc_nrx -= IBLND_RX_MSGS(version) - i; conn->ibc_nrx -= IBLND_RX_MSGS(version) - i;
spin_unlock_irqrestore(&sched->ibs_lock, flags); spin_unlock_irqrestore(&sched->ibs_lock, flags);
/* cmid will be destroyed by CM(ofed) after cm_callback /*
* cmid will be destroyed by CM(ofed) after cm_callback
* returned, so we can't refer it anymore * returned, so we can't refer it anymore
* (by kiblnd_connd()->kiblnd_destroy_conn) */ * (by kiblnd_connd()->kiblnd_destroy_conn)
*/
rdma_destroy_qp(conn->ibc_cmid); rdma_destroy_qp(conn->ibc_cmid);
conn->ibc_cmid = NULL; conn->ibc_cmid = NULL;
...@@ -1077,8 +1093,10 @@ void kiblnd_query(lnet_ni_t *ni, lnet_nid_t nid, unsigned long *when) ...@@ -1077,8 +1093,10 @@ void kiblnd_query(lnet_ni_t *ni, lnet_nid_t nid, unsigned long *when)
if (last_alive != 0) if (last_alive != 0)
*when = last_alive; *when = last_alive;
/* peer is not persistent in hash, trigger peer creation /*
* and connection establishment with a NULL tx */ * peer is not persistent in hash, trigger peer creation
* and connection establishment with a NULL tx
*/
if (peer == NULL) if (peer == NULL)
kiblnd_launch_tx(ni, NULL, nid); kiblnd_launch_tx(ni, NULL, nid);
...@@ -2070,8 +2088,10 @@ static int kiblnd_net_init_pools(kib_net_t *net, __u32 *cpts, int ncpts) ...@@ -2070,8 +2088,10 @@ static int kiblnd_net_init_pools(kib_net_t *net, __u32 *cpts, int ncpts)
static int kiblnd_hdev_get_attr(kib_hca_dev_t *hdev) static int kiblnd_hdev_get_attr(kib_hca_dev_t *hdev)
{ {
/* It's safe to assume a HCA can handle a page size /*
* matching that of the native system */ * It's safe to assume a HCA can handle a page size
* matching that of the native system
*/
hdev->ibh_page_shift = PAGE_SHIFT; hdev->ibh_page_shift = PAGE_SHIFT;
hdev->ibh_page_size = 1 << PAGE_SHIFT; hdev->ibh_page_size = 1 << PAGE_SHIFT;
hdev->ibh_page_mask = ~((__u64)hdev->ibh_page_size - 1); hdev->ibh_page_mask = ~((__u64)hdev->ibh_page_size - 1);
...@@ -2175,7 +2195,8 @@ static int kiblnd_dev_need_failover(kib_dev_t *dev) ...@@ -2175,7 +2195,8 @@ static int kiblnd_dev_need_failover(kib_dev_t *dev)
*kiblnd_tunables.kib_dev_failover > 1) /* debugging */ *kiblnd_tunables.kib_dev_failover > 1) /* debugging */
return 1; return 1;
/* XXX: it's UGLY, but I don't have better way to find /*
* XXX: it's UGLY, but I don't have better way to find
* ib-bonding HCA failover because: * ib-bonding HCA failover because:
* *
* a. no reliable CM event for HCA failover... * a. no reliable CM event for HCA failover...
...@@ -2184,7 +2205,8 @@ static int kiblnd_dev_need_failover(kib_dev_t *dev) ...@@ -2184,7 +2205,8 @@ static int kiblnd_dev_need_failover(kib_dev_t *dev)
* We have only two choices at this point: * We have only two choices at this point:
* *
* a. rdma_bind_addr(), it will conflict with listener cmid * a. rdma_bind_addr(), it will conflict with listener cmid
* b. rdma_resolve_addr() to zero addr */ * b. rdma_resolve_addr() to zero addr
*/
cmid = kiblnd_rdma_create_id(kiblnd_dummy_callback, dev, RDMA_PS_TCP, cmid = kiblnd_rdma_create_id(kiblnd_dummy_callback, dev, RDMA_PS_TCP,
IB_QPT_RC); IB_QPT_RC);
if (IS_ERR(cmid)) { if (IS_ERR(cmid)) {
...@@ -2239,15 +2261,19 @@ int kiblnd_dev_failover(kib_dev_t *dev) ...@@ -2239,15 +2261,19 @@ int kiblnd_dev_failover(kib_dev_t *dev)
if (dev->ibd_hdev != NULL && if (dev->ibd_hdev != NULL &&
dev->ibd_hdev->ibh_cmid != NULL) { dev->ibd_hdev->ibh_cmid != NULL) {
/* XXX it's not good to close old listener at here, /*
* XXX it's not good to close old listener at here,
* because we can fail to create new listener. * because we can fail to create new listener.
* But we have to close it now, otherwise rdma_bind_addr * But we have to close it now, otherwise rdma_bind_addr
* will return EADDRINUSE... How crap! */ * will return EADDRINUSE... How crap!
*/
write_lock_irqsave(&kiblnd_data.kib_global_lock, flags); write_lock_irqsave(&kiblnd_data.kib_global_lock, flags);
cmid = dev->ibd_hdev->ibh_cmid; cmid = dev->ibd_hdev->ibh_cmid;
/* make next schedule of kiblnd_dev_need_failover() /*
* return 1 for me */ * make next schedule of kiblnd_dev_need_failover()
* return 1 for me
*/
dev->ibd_hdev->ibh_cmid = NULL; dev->ibd_hdev->ibh_cmid = NULL;
write_unlock_irqrestore(&kiblnd_data.kib_global_lock, flags); write_unlock_irqrestore(&kiblnd_data.kib_global_lock, flags);
...@@ -2433,9 +2459,11 @@ static void kiblnd_base_shutdown(void) ...@@ -2433,9 +2459,11 @@ static void kiblnd_base_shutdown(void)
/* flag threads to terminate; wake and wait for them to die */ /* flag threads to terminate; wake and wait for them to die */
kiblnd_data.kib_shutdown = 1; kiblnd_data.kib_shutdown = 1;
/* NB: we really want to stop scheduler threads net by net /*
* NB: we really want to stop scheduler threads net by net
* instead of the whole module, this should be improved * instead of the whole module, this should be improved
* with dynamic configuration LNet */ * with dynamic configuration LNet
*/
cfs_percpt_for_each(sched, i, kiblnd_data.kib_scheds) cfs_percpt_for_each(sched, i, kiblnd_data.kib_scheds)
wake_up_all(&sched->ibs_waitq); wake_up_all(&sched->ibs_waitq);
...@@ -2585,8 +2613,10 @@ static int kiblnd_base_startup(void) ...@@ -2585,8 +2613,10 @@ static int kiblnd_base_startup(void)
if (*kiblnd_tunables.kib_nscheds > 0) { if (*kiblnd_tunables.kib_nscheds > 0) {
nthrs = min(nthrs, *kiblnd_tunables.kib_nscheds); nthrs = min(nthrs, *kiblnd_tunables.kib_nscheds);
} else { } else {
/* max to half of CPUs, another half is reserved for /*
* upper layer modules */ * max to half of CPUs, another half is reserved for
* upper layer modules
*/
nthrs = min(max(IBLND_N_SCHED, nthrs >> 1), nthrs); nthrs = min(max(IBLND_N_SCHED, nthrs >> 1), nthrs);
} }
......
...@@ -52,8 +52,10 @@ static int timeout = 50; ...@@ -52,8 +52,10 @@ static int timeout = 50;
module_param(timeout, int, 0644); module_param(timeout, int, 0644);
MODULE_PARM_DESC(timeout, "timeout (seconds)"); MODULE_PARM_DESC(timeout, "timeout (seconds)");
/* Number of threads in each scheduler pool which is percpt, /*
* we will estimate reasonable value based on CPUs if it's set to zero. */ * Number of threads in each scheduler pool which is percpt,
* we will estimate reasonable value based on CPUs if it's set to zero.
*/
static int nscheds; static int nscheds;
module_param(nscheds, int, 0444); module_param(nscheds, int, 0444);
MODULE_PARM_DESC(nscheds, "number of threads in each scheduler pool"); MODULE_PARM_DESC(nscheds, "number of threads in each scheduler pool");
......
...@@ -69,8 +69,10 @@ ...@@ -69,8 +69,10 @@
#define SOCKNAL_VERSION_DEBUG 0 /* enable protocol version debugging */ #define SOCKNAL_VERSION_DEBUG 0 /* enable protocol version debugging */
/* risk kmap deadlock on multi-frag I/O (backs off to single-frag if disabled). /*
* no risk if we're not running on a CONFIG_HIGHMEM platform. */ * risk kmap deadlock on multi-frag I/O (backs off to single-frag if disabled).
* no risk if we're not running on a CONFIG_HIGHMEM platform.
*/
#ifdef CONFIG_HIGHMEM #ifdef CONFIG_HIGHMEM
# define SOCKNAL_RISK_KMAP_DEADLOCK 0 # define SOCKNAL_RISK_KMAP_DEADLOCK 0
#else #else
...@@ -237,15 +239,16 @@ typedef struct { ...@@ -237,15 +239,16 @@ typedef struct {
#define SOCKNAL_INIT_DATA 1 #define SOCKNAL_INIT_DATA 1
#define SOCKNAL_INIT_ALL 2 #define SOCKNAL_INIT_ALL 2
/* A packet just assembled for transmission is represented by 1 or more /*
* A packet just assembled for transmission is represented by 1 or more
* struct iovec fragments (the first frag contains the portals header), * struct iovec fragments (the first frag contains the portals header),
* followed by 0 or more lnet_kiov_t fragments. * followed by 0 or more lnet_kiov_t fragments.
* *
* On the receive side, initially 1 struct iovec fragment is posted for * On the receive side, initially 1 struct iovec fragment is posted for
* receive (the header). Once the header has been received, the payload is * receive (the header). Once the header has been received, the payload is
* received into either struct iovec or lnet_kiov_t fragments, depending on * received into either struct iovec or lnet_kiov_t fragments, depending on
* what the header matched or whether the message needs forwarding. */ * what the header matched or whether the message needs forwarding.
*/
struct ksock_conn; /* forward ref */ struct ksock_conn; /* forward ref */
struct ksock_peer; /* forward ref */ struct ksock_peer; /* forward ref */
struct ksock_route; /* forward ref */ struct ksock_route; /* forward ref */
...@@ -288,8 +291,10 @@ typedef struct /* transmit packet */ ...@@ -288,8 +291,10 @@ typedef struct /* transmit packet */
/* network zero copy callback descriptor embedded in ksock_tx_t */ /* network zero copy callback descriptor embedded in ksock_tx_t */
/* space for the rx frag descriptors; we either read a single contiguous /*
* header, or up to LNET_MAX_IOV frags of payload of either type. */ * space for the rx frag descriptors; we either read a single contiguous
* header, or up to LNET_MAX_IOV frags of payload of either type.
*/
typedef union { typedef union {
struct kvec iov[LNET_MAX_IOV]; struct kvec iov[LNET_MAX_IOV];
lnet_kiov_t kiov[LNET_MAX_IOV]; lnet_kiov_t kiov[LNET_MAX_IOV];
...@@ -463,11 +468,13 @@ typedef struct ksock_proto { ...@@ -463,11 +468,13 @@ typedef struct ksock_proto {
/* handle ZC ACK */ /* handle ZC ACK */
int (*pro_handle_zcack)(ksock_conn_t *, __u64, __u64); int (*pro_handle_zcack)(ksock_conn_t *, __u64, __u64);
/* msg type matches the connection type: /*
* msg type matches the connection type:
* return value: * return value:
* return MATCH_NO : no * return MATCH_NO : no
* return MATCH_YES : matching type * return MATCH_YES : matching type
* return MATCH_MAY : can be backup */ * return MATCH_MAY : can be backup
*/
int (*pro_match_tx)(ksock_conn_t *, ksock_tx_t *, int); int (*pro_match_tx)(ksock_conn_t *, ksock_tx_t *, int);
} ksock_proto_t; } ksock_proto_t;
......
...@@ -67,8 +67,10 @@ ksocknal_lib_zc_capable(ksock_conn_t *conn) ...@@ -67,8 +67,10 @@ ksocknal_lib_zc_capable(ksock_conn_t *conn)
if (conn->ksnc_proto == &ksocknal_protocol_v1x) if (conn->ksnc_proto == &ksocknal_protocol_v1x)
return 0; return 0;
/* ZC if the socket supports scatter/gather and doesn't need software /*
* checksums */ * ZC if the socket supports scatter/gather and doesn't need software
* checksums
*/
return ((caps & NETIF_F_SG) != 0 && (caps & NETIF_F_CSUM_MASK) != 0); return ((caps & NETIF_F_SG) != 0 && (caps & NETIF_F_CSUM_MASK) != 0);
} }
...@@ -85,9 +87,10 @@ ksocknal_lib_send_iov(ksock_conn_t *conn, ksock_tx_t *tx) ...@@ -85,9 +87,10 @@ ksocknal_lib_send_iov(ksock_conn_t *conn, ksock_tx_t *tx)
tx->tx_msg.ksm_csum == 0) /* not checksummed */ tx->tx_msg.ksm_csum == 0) /* not checksummed */
ksocknal_lib_csum_tx(tx); ksocknal_lib_csum_tx(tx);
/* NB we can't trust socket ops to either consume our iovs /*
* or leave them alone. */ * NB we can't trust socket ops to either consume our iovs
* or leave them alone.
*/
{ {
#if SOCKNAL_SINGLE_FRAG_TX #if SOCKNAL_SINGLE_FRAG_TX
struct kvec scratch; struct kvec scratch;
...@@ -125,8 +128,10 @@ ksocknal_lib_send_kiov(ksock_conn_t *conn, ksock_tx_t *tx) ...@@ -125,8 +128,10 @@ ksocknal_lib_send_kiov(ksock_conn_t *conn, ksock_tx_t *tx)
/* Not NOOP message */ /* Not NOOP message */
LASSERT(tx->tx_lnetmsg != NULL); LASSERT(tx->tx_lnetmsg != NULL);
/* NB we can't trust socket ops to either consume our iovs /*
* or leave them alone. */ * NB we can't trust socket ops to either consume our iovs
* or leave them alone.
*/
if (tx->tx_msg.ksm_zc_cookies[0] != 0) { if (tx->tx_msg.ksm_zc_cookies[0] != 0) {
/* Zero copy is enabled */ /* Zero copy is enabled */
struct sock *sk = sock->sk; struct sock *sk = sock->sk;
...@@ -187,11 +192,12 @@ ksocknal_lib_eager_ack(ksock_conn_t *conn) ...@@ -187,11 +192,12 @@ ksocknal_lib_eager_ack(ksock_conn_t *conn)
int opt = 1; int opt = 1;
struct socket *sock = conn->ksnc_sock; struct socket *sock = conn->ksnc_sock;
/* Remind the socket to ACK eagerly. If I don't, the socket might /*
* Remind the socket to ACK eagerly. If I don't, the socket might
* think I'm about to send something it could piggy-back the ACK * think I'm about to send something it could piggy-back the ACK
* on, introducing delay in completing zero-copy sends in my * on, introducing delay in completing zero-copy sends in my
* peer. */ * peer.
*/
kernel_setsockopt(sock, SOL_TCP, TCP_QUICKACK, kernel_setsockopt(sock, SOL_TCP, TCP_QUICKACK,
(char *)&opt, sizeof(opt)); (char *)&opt, sizeof(opt));
} }
...@@ -218,8 +224,10 @@ ksocknal_lib_recv_iov(ksock_conn_t *conn) ...@@ -218,8 +224,10 @@ ksocknal_lib_recv_iov(ksock_conn_t *conn)
int sum; int sum;
__u32 saved_csum; __u32 saved_csum;
/* NB we can't trust socket ops to either consume our iovs /*
* or leave them alone. */ * NB we can't trust socket ops to either consume our iovs
* or leave them alone.
*/
LASSERT(niov > 0); LASSERT(niov > 0);
for (nob = i = 0; i < niov; i++) { for (nob = i = 0; i < niov; i++) {
...@@ -329,8 +337,10 @@ ksocknal_lib_recv_kiov(ksock_conn_t *conn) ...@@ -329,8 +337,10 @@ ksocknal_lib_recv_kiov(ksock_conn_t *conn)
int fragnob; int fragnob;
int n; int n;
/* NB we can't trust socket ops to either consume our iovs /*
* or leave them alone. */ * NB we can't trust socket ops to either consume our iovs
* or leave them alone.
*/
addr = ksocknal_lib_kiov_vmap(kiov, niov, scratchiov, pages); addr = ksocknal_lib_kiov_vmap(kiov, niov, scratchiov, pages);
if (addr != NULL) { if (addr != NULL) {
nob = scratchiov[0].iov_len; nob = scratchiov[0].iov_len;
...@@ -354,10 +364,12 @@ ksocknal_lib_recv_kiov(ksock_conn_t *conn) ...@@ -354,10 +364,12 @@ ksocknal_lib_recv_kiov(ksock_conn_t *conn)
for (i = 0, sum = rc; sum > 0; i++, sum -= fragnob) { for (i = 0, sum = rc; sum > 0; i++, sum -= fragnob) {
LASSERT(i < niov); LASSERT(i < niov);
/* Dang! have to kmap again because I have nowhere to /*
* Dang! have to kmap again because I have nowhere to
* stash the mapped address. But by doing it while the * stash the mapped address. But by doing it while the
* page is still mapped, the kernel just bumps the map * page is still mapped, the kernel just bumps the map
* count and returns me the address it stashed. */ * count and returns me the address it stashed.
*/
base = kmap(kiov[i].kiov_page) + kiov[i].kiov_offset; base = kmap(kiov[i].kiov_page) + kiov[i].kiov_offset;
fragnob = kiov[i].kiov_len; fragnob = kiov[i].kiov_len;
if (fragnob > sum) if (fragnob > sum)
...@@ -463,9 +475,10 @@ ksocknal_lib_setup_sock(struct socket *sock) ...@@ -463,9 +475,10 @@ ksocknal_lib_setup_sock(struct socket *sock)
sock->sk->sk_allocation = GFP_NOFS; sock->sk->sk_allocation = GFP_NOFS;
/* Ensure this socket aborts active sends immediately when we close /*
* it. */ * Ensure this socket aborts active sends immediately when we close
* it.
*/
linger.l_onoff = 0; linger.l_onoff = 0;
linger.l_linger = 0; linger.l_linger = 0;
...@@ -637,10 +650,11 @@ ksocknal_write_space(struct sock *sk) ...@@ -637,10 +650,11 @@ ksocknal_write_space(struct sock *sk)
if (wspace >= min_wpace) { /* got enough space */ if (wspace >= min_wpace) { /* got enough space */
ksocknal_write_callback(conn); ksocknal_write_callback(conn);
/* Clear SOCK_NOSPACE _after_ ksocknal_write_callback so the /*
* Clear SOCK_NOSPACE _after_ ksocknal_write_callback so the
* ENOMEM check in ksocknal_transmit is race-free (think about * ENOMEM check in ksocknal_transmit is race-free (think about
* it). */ * it).
*/
clear_bit(SOCK_NOSPACE, &sk->sk_socket->flags); clear_bit(SOCK_NOSPACE, &sk->sk_socket->flags);
} }
...@@ -666,15 +680,19 @@ ksocknal_lib_set_callback(struct socket *sock, ksock_conn_t *conn) ...@@ -666,15 +680,19 @@ ksocknal_lib_set_callback(struct socket *sock, ksock_conn_t *conn)
void void
ksocknal_lib_reset_callback(struct socket *sock, ksock_conn_t *conn) ksocknal_lib_reset_callback(struct socket *sock, ksock_conn_t *conn)
{ {
/* Remove conn's network callbacks. /*
* Remove conn's network callbacks.
* NB I _have_ to restore the callback, rather than storing a noop, * NB I _have_ to restore the callback, rather than storing a noop,
* since the socket could survive past this module being unloaded!! */ * since the socket could survive past this module being unloaded!!
*/
sock->sk->sk_data_ready = conn->ksnc_saved_data_ready; sock->sk->sk_data_ready = conn->ksnc_saved_data_ready;
sock->sk->sk_write_space = conn->ksnc_saved_write_space; sock->sk->sk_write_space = conn->ksnc_saved_write_space;
/* A callback could be in progress already; they hold a read lock /*
* A callback could be in progress already; they hold a read lock
* on ksnd_global_lock (to serialise with me) and NOOP if * on ksnd_global_lock (to serialise with me) and NOOP if
* sk_user_data is NULL. */ * sk_user_data is NULL.
*/
sock->sk->sk_user_data = NULL; sock->sk->sk_user_data = NULL;
return ; return ;
...@@ -691,14 +709,16 @@ ksocknal_lib_memory_pressure(ksock_conn_t *conn) ...@@ -691,14 +709,16 @@ ksocknal_lib_memory_pressure(ksock_conn_t *conn)
if (!test_bit(SOCK_NOSPACE, &conn->ksnc_sock->flags) && if (!test_bit(SOCK_NOSPACE, &conn->ksnc_sock->flags) &&
!conn->ksnc_tx_ready) { !conn->ksnc_tx_ready) {
/* SOCK_NOSPACE is set when the socket fills /*
* SOCK_NOSPACE is set when the socket fills
* and cleared in the write_space callback * and cleared in the write_space callback
* (which also sets ksnc_tx_ready). If * (which also sets ksnc_tx_ready). If
* SOCK_NOSPACE and ksnc_tx_ready are BOTH * SOCK_NOSPACE and ksnc_tx_ready are BOTH
* zero, I didn't fill the socket and * zero, I didn't fill the socket and
* write_space won't reschedule me, so I * write_space won't reschedule me, so I
* return -ENOMEM to get my caller to retry * return -ENOMEM to get my caller to retry
* after a timeout */ * after a timeout
*/
rc = -ENOMEM; rc = -ENOMEM;
} }
......
...@@ -41,8 +41,10 @@ static int peer_timeout = 180; ...@@ -41,8 +41,10 @@ static int peer_timeout = 180;
module_param(peer_timeout, int, 0444); module_param(peer_timeout, int, 0444);
MODULE_PARM_DESC(peer_timeout, "Seconds without aliveness news to declare peer dead (<=0 to disable)"); MODULE_PARM_DESC(peer_timeout, "Seconds without aliveness news to declare peer dead (<=0 to disable)");
/* Number of daemons in each thread pool which is percpt, /*
* we will estimate reasonable value based on CPUs if it's not set. */ * Number of daemons in each thread pool which is percpt,
* we will estimate reasonable value based on CPUs if it's not set.
*/
static unsigned int nscheds; static unsigned int nscheds;
module_param(nscheds, int, 0444); module_param(nscheds, int, 0444);
MODULE_PARM_DESC(nscheds, "# scheduler daemons in each pool while starting"); MODULE_PARM_DESC(nscheds, "# scheduler daemons in each pool while starting");
......
...@@ -468,8 +468,10 @@ ksocknal_send_hello_v1(ksock_conn_t *conn, ksock_hello_msg_t *hello) ...@@ -468,8 +468,10 @@ ksocknal_send_hello_v1(ksock_conn_t *conn, ksock_hello_msg_t *hello)
hmv = (lnet_magicversion_t *)&hdr->dest_nid; hmv = (lnet_magicversion_t *)&hdr->dest_nid;
/* Re-organize V2.x message header to V1.x (lnet_hdr_t) /*
* header and send out */ * Re-organize V2.x message header to V1.x (lnet_hdr_t)
* header and send out
*/
hmv->magic = cpu_to_le32 (LNET_PROTO_TCP_MAGIC); hmv->magic = cpu_to_le32 (LNET_PROTO_TCP_MAGIC);
hmv->version_major = cpu_to_le16 (KSOCK_PROTO_V1_MAJOR); hmv->version_major = cpu_to_le16 (KSOCK_PROTO_V1_MAJOR);
hmv->version_minor = cpu_to_le16 (KSOCK_PROTO_V1_MINOR); hmv->version_minor = cpu_to_le16 (KSOCK_PROTO_V1_MINOR);
......
...@@ -78,9 +78,11 @@ static char *accept_type; ...@@ -78,9 +78,11 @@ static char *accept_type;
static int static int
lnet_acceptor_get_tunables(void) lnet_acceptor_get_tunables(void)
{ {
/* Userland acceptor uses 'accept_type' instead of 'accept', due to /*
* Userland acceptor uses 'accept_type' instead of 'accept', due to
* conflict with 'accept(2)', but kernel acceptor still uses 'accept' * conflict with 'accept(2)', but kernel acceptor still uses 'accept'
* for compatibility. Hence the trick. */ * for compatibility. Hence the trick.
*/
accept_type = accept; accept_type = accept;
return 0; return 0;
} }
...@@ -223,11 +225,12 @@ lnet_accept(struct socket *sock, __u32 magic) ...@@ -223,11 +225,12 @@ lnet_accept(struct socket *sock, __u32 magic)
if (!lnet_accept_magic(magic, LNET_PROTO_ACCEPTOR_MAGIC)) { if (!lnet_accept_magic(magic, LNET_PROTO_ACCEPTOR_MAGIC)) {
if (lnet_accept_magic(magic, LNET_PROTO_MAGIC)) { if (lnet_accept_magic(magic, LNET_PROTO_MAGIC)) {
/* future version compatibility! /*
* future version compatibility!
* When LNET unifies protocols over all LNDs, the first * When LNET unifies protocols over all LNDs, the first
* thing sent will be a version query. I send back * thing sent will be a version query. I send back
* LNET_PROTO_ACCEPTOR_MAGIC to tell her I'm "old" */ * LNET_PROTO_ACCEPTOR_MAGIC to tell her I'm "old"
*/
memset(&cr, 0, sizeof(cr)); memset(&cr, 0, sizeof(cr));
cr.acr_magic = LNET_PROTO_ACCEPTOR_MAGIC; cr.acr_magic = LNET_PROTO_ACCEPTOR_MAGIC;
cr.acr_version = LNET_PROTO_ACCEPTOR_VERSION; cr.acr_version = LNET_PROTO_ACCEPTOR_VERSION;
...@@ -264,10 +267,12 @@ lnet_accept(struct socket *sock, __u32 magic) ...@@ -264,10 +267,12 @@ lnet_accept(struct socket *sock, __u32 magic)
__swab32s(&cr.acr_version); __swab32s(&cr.acr_version);
if (cr.acr_version != LNET_PROTO_ACCEPTOR_VERSION) { if (cr.acr_version != LNET_PROTO_ACCEPTOR_VERSION) {
/* future version compatibility! /*
* future version compatibility!
* An acceptor-specific protocol rev will first send a version * An acceptor-specific protocol rev will first send a version
* query. I send back my current version to tell her I'm * query. I send back my current version to tell her I'm
* "old". */ * "old".
*/
int peer_version = cr.acr_version; int peer_version = cr.acr_version;
memset(&cr, 0, sizeof(cr)); memset(&cr, 0, sizeof(cr));
......
...@@ -174,10 +174,12 @@ lnet_create_locks(void) ...@@ -174,10 +174,12 @@ lnet_create_locks(void)
static void lnet_assert_wire_constants(void) static void lnet_assert_wire_constants(void)
{ {
/* Wire protocol assertions generated by 'wirecheck' /*
* Wire protocol assertions generated by 'wirecheck'
* running on Linux robert.bartonsoftware.com 2.6.8-1.521 * running on Linux robert.bartonsoftware.com 2.6.8-1.521
* #1 Mon Aug 16 09:01:18 EDT 2004 i686 athlon i386 GNU/Linux * #1 Mon Aug 16 09:01:18 EDT 2004 i686 athlon i386 GNU/Linux
* with gcc version 3.3.3 20040412 (Red Hat Linux 3.3.3-7) */ * with gcc version 3.3.3 20040412 (Red Hat Linux 3.3.3-7)
*/
/* Constants... */ /* Constants... */
CLASSERT(LNET_PROTO_TCP_MAGIC == 0xeebc0ded); CLASSERT(LNET_PROTO_TCP_MAGIC == 0xeebc0ded);
...@@ -398,9 +400,11 @@ lnet_res_container_cleanup(struct lnet_res_container *rec) ...@@ -398,9 +400,11 @@ lnet_res_container_cleanup(struct lnet_res_container *rec)
} }
if (count > 0) { if (count > 0) {
/* Found alive MD/ME/EQ, user really should unlink/free /*
* Found alive MD/ME/EQ, user really should unlink/free
* all of them before finalize LNet, but if someone didn't, * all of them before finalize LNet, but if someone didn't,
* we have to recycle garbage for him */ * we have to recycle garbage for him
*/
CERROR("%d active elements on exit of %s container\n", CERROR("%d active elements on exit of %s container\n",
count, lnet_res_type2str(rec->rec_type)); count, lnet_res_type2str(rec->rec_type));
} }
...@@ -605,11 +609,12 @@ lnet_prepare(lnet_pid_t requested_pid) ...@@ -605,11 +609,12 @@ lnet_prepare(lnet_pid_t requested_pid)
int int
lnet_unprepare(void) lnet_unprepare(void)
{ {
/* NB no LNET_LOCK since this is the last reference. All LND instances /*
* NB no LNET_LOCK since this is the last reference. All LND instances
* have shut down already, so it is safe to unlink and free all * have shut down already, so it is safe to unlink and free all
* descriptors, even those that appear committed to a network op (eg MD * descriptors, even those that appear committed to a network op (eg MD
* with non-zero pending count) */ * with non-zero pending count)
*/
lnet_fail_nid(LNET_NID_ANY, 0); lnet_fail_nid(LNET_NID_ANY, 0);
LASSERT(the_lnet.ln_refcount == 0); LASSERT(the_lnet.ln_refcount == 0);
...@@ -877,18 +882,24 @@ lnet_shutdown_lndnis(void) ...@@ -877,18 +882,24 @@ lnet_shutdown_lndnis(void)
lnet_net_unlock(LNET_LOCK_EX); lnet_net_unlock(LNET_LOCK_EX);
/* Clear lazy portals and drop delayed messages which hold refs /*
* on their lnet_msg_t::msg_rxpeer */ * Clear lazy portals and drop delayed messages which hold refs
* on their lnet_msg_t::msg_rxpeer
*/
for (i = 0; i < the_lnet.ln_nportals; i++) for (i = 0; i < the_lnet.ln_nportals; i++)
LNetClearLazyPortal(i); LNetClearLazyPortal(i);
/* Clear the peer table and wait for all peers to go (they hold refs on /*
* their NIs) */ * Clear the peer table and wait for all peers to go (they hold refs on
* their NIs)
*/
lnet_peer_tables_cleanup(); lnet_peer_tables_cleanup();
lnet_net_lock(LNET_LOCK_EX); lnet_net_lock(LNET_LOCK_EX);
/* Now wait for the NI's I just nuked to show up on ln_zombie_nis /*
* and shut them down in guaranteed thread context */ * Now wait for the NI's I just nuked to show up on ln_zombie_nis
* and shut them down in guaranteed thread context
*/
i = 2; i = 2;
while (!list_empty(&the_lnet.ln_nis_zombie)) { while (!list_empty(&the_lnet.ln_nis_zombie)) {
int *ref; int *ref;
...@@ -926,9 +937,10 @@ lnet_shutdown_lndnis(void) ...@@ -926,9 +937,10 @@ lnet_shutdown_lndnis(void)
LASSERT(!in_interrupt()); LASSERT(!in_interrupt());
(ni->ni_lnd->lnd_shutdown)(ni); (ni->ni_lnd->lnd_shutdown)(ni);
/* can't deref lnd anymore now; it might have unregistered /*
* itself... */ * can't deref lnd anymore now; it might have unregistered
* itself...
*/
if (!islo) if (!islo)
CDEBUG(D_LNI, "Removed LNI %s\n", CDEBUG(D_LNI, "Removed LNI %s\n",
libcfs_nid2str(ni->ni_nid)); libcfs_nid2str(ni->ni_nid));
...@@ -1139,9 +1151,11 @@ lnet_init(void) ...@@ -1139,9 +1151,11 @@ lnet_init(void)
INIT_LIST_HEAD(&the_lnet.ln_rcd_zombie); INIT_LIST_HEAD(&the_lnet.ln_rcd_zombie);
INIT_LIST_HEAD(&the_lnet.ln_rcd_deathrow); INIT_LIST_HEAD(&the_lnet.ln_rcd_deathrow);
/* The hash table size is the number of bits it takes to express the set /*
* The hash table size is the number of bits it takes to express the set
* ln_num_routes, minus 1 (better to under estimate than over so we * ln_num_routes, minus 1 (better to under estimate than over so we
* don't waste memory). */ * don't waste memory).
*/
if (rnet_htable_size <= 0) if (rnet_htable_size <= 0)
rnet_htable_size = LNET_REMOTE_NETS_HASH_DEFAULT; rnet_htable_size = LNET_REMOTE_NETS_HASH_DEFAULT;
else if (rnet_htable_size > LNET_REMOTE_NETS_HASH_MAX) else if (rnet_htable_size > LNET_REMOTE_NETS_HASH_MAX)
...@@ -1149,9 +1163,11 @@ lnet_init(void) ...@@ -1149,9 +1163,11 @@ lnet_init(void)
the_lnet.ln_remote_nets_hbits = max_t(int, 1, the_lnet.ln_remote_nets_hbits = max_t(int, 1,
order_base_2(rnet_htable_size) - 1); order_base_2(rnet_htable_size) - 1);
/* All LNDs apart from the LOLND are in separate modules. They /*
* All LNDs apart from the LOLND are in separate modules. They
* register themselves when their module loads, and unregister * register themselves when their module loads, and unregister
* themselves when their module is unloaded. */ * themselves when their module is unloaded.
*/
lnet_register_lnd(&the_lolnd); lnet_register_lnd(&the_lolnd);
return 0; return 0;
} }
...@@ -1244,8 +1260,10 @@ LNetNIInit(lnet_pid_t requested_pid) ...@@ -1244,8 +1260,10 @@ LNetNIInit(lnet_pid_t requested_pid)
the_lnet.ln_refcount = 1; the_lnet.ln_refcount = 1;
/* Now I may use my own API functions... */ /* Now I may use my own API functions... */
/* NB router checker needs the_lnet.ln_ping_info in /*
* lnet_router_checker -> lnet_update_ni_status_locked */ * NB router checker needs the_lnet.ln_ping_info in
* lnet_router_checker -> lnet_update_ni_status_locked
*/
rc = lnet_ping_target_init(); rc = lnet_ping_target_init();
if (rc != 0) if (rc != 0)
goto failed3; goto failed3;
...@@ -1554,8 +1572,10 @@ lnet_ping_target_init(void) ...@@ -1554,8 +1572,10 @@ lnet_ping_target_init(void)
if (rc != 0) if (rc != 0)
return rc; return rc;
/* We can have a tiny EQ since we only need to see the unlink event on /*
* teardown, which by definition is the last one! */ * We can have a tiny EQ since we only need to see the unlink event on
* teardown, which by definition is the last one!
*/
rc = LNetEQAlloc(2, LNET_EQ_HANDLER_NONE, &the_lnet.ln_ping_target_eq); rc = LNetEQAlloc(2, LNET_EQ_HANDLER_NONE, &the_lnet.ln_ping_target_eq);
if (rc != 0) { if (rc != 0) {
CERROR("Can't allocate ping EQ: %d\n", rc); CERROR("Can't allocate ping EQ: %d\n", rc);
......
...@@ -75,18 +75,21 @@ LNetEQAlloc(unsigned int count, lnet_eq_handler_t callback, ...@@ -75,18 +75,21 @@ LNetEQAlloc(unsigned int count, lnet_eq_handler_t callback,
LASSERT(the_lnet.ln_init); LASSERT(the_lnet.ln_init);
LASSERT(the_lnet.ln_refcount > 0); LASSERT(the_lnet.ln_refcount > 0);
/* We need count to be a power of 2 so that when eq_{enq,deq}_seq /*
* We need count to be a power of 2 so that when eq_{enq,deq}_seq
* overflow, they don't skip entries, so the queue has the same * overflow, they don't skip entries, so the queue has the same
* apparent capacity at all times */ * apparent capacity at all times
*/
if (count) if (count)
count = roundup_pow_of_two(count); count = roundup_pow_of_two(count);
if (callback != LNET_EQ_HANDLER_NONE && count != 0) if (callback != LNET_EQ_HANDLER_NONE && count != 0)
CWARN("EQ callback is guaranteed to get every event, do you still want to set eqcount %d for polling event which will have locking overhead? Please contact with developer to confirm\n", count); CWARN("EQ callback is guaranteed to get every event, do you still want to set eqcount %d for polling event which will have locking overhead? Please contact with developer to confirm\n", count);
/* count can be 0 if only need callback, we can eliminate /*
* overhead of enqueue event */ * count can be 0 if only need callback, we can eliminate
* overhead of enqueue event
*/
if (count == 0 && callback == LNET_EQ_HANDLER_NONE) if (count == 0 && callback == LNET_EQ_HANDLER_NONE)
return -EINVAL; return -EINVAL;
...@@ -98,8 +101,10 @@ LNetEQAlloc(unsigned int count, lnet_eq_handler_t callback, ...@@ -98,8 +101,10 @@ LNetEQAlloc(unsigned int count, lnet_eq_handler_t callback,
LIBCFS_ALLOC(eq->eq_events, count * sizeof(lnet_event_t)); LIBCFS_ALLOC(eq->eq_events, count * sizeof(lnet_event_t));
if (eq->eq_events == NULL) if (eq->eq_events == NULL)
goto failed; goto failed;
/* NB allocator has set all event sequence numbers to 0, /*
* so all them should be earlier than eq_deq_seq */ * NB allocator has set all event sequence numbers to 0,
* so all them should be earlier than eq_deq_seq
*/
} }
eq->eq_deq_seq = 1; eq->eq_deq_seq = 1;
...@@ -114,8 +119,10 @@ LNetEQAlloc(unsigned int count, lnet_eq_handler_t callback, ...@@ -114,8 +119,10 @@ LNetEQAlloc(unsigned int count, lnet_eq_handler_t callback,
/* MUST hold both exclusive lnet_res_lock */ /* MUST hold both exclusive lnet_res_lock */
lnet_res_lock(LNET_LOCK_EX); lnet_res_lock(LNET_LOCK_EX);
/* NB: hold lnet_eq_wait_lock for EQ link/unlink, so we can do /*
* both EQ lookup and poll event with only lnet_eq_wait_lock */ * NB: hold lnet_eq_wait_lock for EQ link/unlink, so we can do
* both EQ lookup and poll event with only lnet_eq_wait_lock
*/
lnet_eq_wait_lock(); lnet_eq_wait_lock();
lnet_res_lh_initialize(&the_lnet.ln_eq_container, &eq->eq_lh); lnet_res_lh_initialize(&the_lnet.ln_eq_container, &eq->eq_lh);
...@@ -164,8 +171,10 @@ LNetEQFree(lnet_handle_eq_t eqh) ...@@ -164,8 +171,10 @@ LNetEQFree(lnet_handle_eq_t eqh)
LASSERT(the_lnet.ln_refcount > 0); LASSERT(the_lnet.ln_refcount > 0);
lnet_res_lock(LNET_LOCK_EX); lnet_res_lock(LNET_LOCK_EX);
/* NB: hold lnet_eq_wait_lock for EQ link/unlink, so we can do /*
* both EQ lookup and poll event with only lnet_eq_wait_lock */ * NB: hold lnet_eq_wait_lock for EQ link/unlink, so we can do
* both EQ lookup and poll event with only lnet_eq_wait_lock
*/
lnet_eq_wait_lock(); lnet_eq_wait_lock();
eq = lnet_handle2eq(&eqh); eq = lnet_handle2eq(&eqh);
...@@ -256,8 +265,10 @@ lnet_eq_dequeue_event(lnet_eq_t *eq, lnet_event_t *ev) ...@@ -256,8 +265,10 @@ lnet_eq_dequeue_event(lnet_eq_t *eq, lnet_event_t *ev)
if (eq->eq_deq_seq == new_event->sequence) { if (eq->eq_deq_seq == new_event->sequence) {
rc = 1; rc = 1;
} else { } else {
/* don't complain with CERROR: some EQs are sized small /*
* anyway; if it's important, the caller should complain */ * don't complain with CERROR: some EQs are sized small
* anyway; if it's important, the caller should complain
*/
CDEBUG(D_NET, "Event Queue Overflow: eq seq %lu ev seq %lu\n", CDEBUG(D_NET, "Event Queue Overflow: eq seq %lu ev seq %lu\n",
eq->eq_deq_seq, new_event->sequence); eq->eq_deq_seq, new_event->sequence);
rc = -EOVERFLOW; rc = -EOVERFLOW;
......
...@@ -52,9 +52,11 @@ lnet_md_unlink(lnet_libmd_t *md) ...@@ -52,9 +52,11 @@ lnet_md_unlink(lnet_libmd_t *md)
md->md_flags |= LNET_MD_FLAG_ZOMBIE; md->md_flags |= LNET_MD_FLAG_ZOMBIE;
/* Disassociate from ME (if any), /*
* Disassociate from ME (if any),
* and unlink it if it was created * and unlink it if it was created
* with LNET_UNLINK */ * with LNET_UNLINK
*/
if (me != NULL) { if (me != NULL) {
/* detach MD from portal */ /* detach MD from portal */
lnet_ptl_detach_md(me, md); lnet_ptl_detach_md(me, md);
...@@ -169,14 +171,18 @@ lnet_md_link(lnet_libmd_t *md, lnet_handle_eq_t eq_handle, int cpt) ...@@ -169,14 +171,18 @@ lnet_md_link(lnet_libmd_t *md, lnet_handle_eq_t eq_handle, int cpt)
{ {
struct lnet_res_container *container = the_lnet.ln_md_containers[cpt]; struct lnet_res_container *container = the_lnet.ln_md_containers[cpt];
/* NB we are passed an allocated, but inactive md. /*
* NB we are passed an allocated, but inactive md.
* if we return success, caller may lnet_md_unlink() it. * if we return success, caller may lnet_md_unlink() it.
* otherwise caller may only lnet_md_free() it. * otherwise caller may only lnet_md_free() it.
*/ */
/* This implementation doesn't know how to create START events or /*
* This implementation doesn't know how to create START events or
* disable END events. Best to LASSERT our caller is compliant so * disable END events. Best to LASSERT our caller is compliant so
* we find out quickly... */ * we find out quickly...
/* TODO - reevaluate what should be here in light of */
/*
* TODO - reevaluate what should be here in light of
* the removal of the start and end events * the removal of the start and end events
* maybe there we shouldn't even allow LNET_EQ_NONE!) * maybe there we shouldn't even allow LNET_EQ_NONE!)
* LASSERT (eq == NULL); * LASSERT (eq == NULL);
...@@ -306,8 +312,10 @@ LNetMDAttach(lnet_handle_me_t meh, lnet_md_t umd, ...@@ -306,8 +312,10 @@ LNetMDAttach(lnet_handle_me_t meh, lnet_md_t umd,
if (rc != 0) if (rc != 0)
goto failed; goto failed;
/* attach this MD to portal of ME and check if it matches any /*
* blocked msgs on this portal */ * attach this MD to portal of ME and check if it matches any
* blocked msgs on this portal
*/
lnet_ptl_attach_md(me, md, &matches, &drops); lnet_ptl_attach_md(me, md, &matches, &drops);
lnet_md2handle(handle, md); lnet_md2handle(handle, md);
...@@ -438,9 +446,11 @@ LNetMDUnlink(lnet_handle_md_t mdh) ...@@ -438,9 +446,11 @@ LNetMDUnlink(lnet_handle_md_t mdh)
} }
md->md_flags |= LNET_MD_FLAG_ABORTED; md->md_flags |= LNET_MD_FLAG_ABORTED;
/* If the MD is busy, lnet_md_unlink just marks it for deletion, and /*
* If the MD is busy, lnet_md_unlink just marks it for deletion, and
* when the LND is done, the completion event flags that the MD was * when the LND is done, the completion event flags that the MD was
* unlinked. Otherwise, we enqueue an event now... */ * unlinked. Otherwise, we enqueue an event now...
*/
if (md->md_eq != NULL && md->md_refcount == 0) { if (md->md_eq != NULL && md->md_refcount == 0) {
lnet_build_unlink_event(md, &ev); lnet_build_unlink_event(md, &ev);
lnet_eq_enqueue_event(md->md_eq, &ev); lnet_eq_enqueue_event(md->md_eq, &ev);
......
This diff is collapsed.
...@@ -203,8 +203,10 @@ lnet_msg_decommit_tx(lnet_msg_t *msg, int status) ...@@ -203,8 +203,10 @@ lnet_msg_decommit_tx(lnet_msg_t *msg, int status)
case LNET_EVENT_GET: case LNET_EVENT_GET:
LASSERT(msg->msg_rx_committed); LASSERT(msg->msg_rx_committed);
/* overwritten while sending reply, we should never be /*
* here for optimized GET */ * overwritten while sending reply, we should never be
* here for optimized GET
*/
LASSERT(msg->msg_type == LNET_MSG_REPLY); LASSERT(msg->msg_type == LNET_MSG_REPLY);
msg->msg_type = LNET_MSG_GET; /* fix type */ msg->msg_type = LNET_MSG_GET; /* fix type */
break; break;
...@@ -240,10 +242,12 @@ lnet_msg_decommit_rx(lnet_msg_t *msg, int status) ...@@ -240,10 +242,12 @@ lnet_msg_decommit_rx(lnet_msg_t *msg, int status)
break; break;
case LNET_EVENT_GET: case LNET_EVENT_GET:
/* type is "REPLY" if it's an optimized GET on passive side, /*
* type is "REPLY" if it's an optimized GET on passive side,
* because optimized GET will never be committed for sending, * because optimized GET will never be committed for sending,
* so message type wouldn't be changed back to "GET" by * so message type wouldn't be changed back to "GET" by
* lnet_msg_decommit_tx(), see details in lnet_parse_get() */ * lnet_msg_decommit_tx(), see details in lnet_parse_get()
*/
LASSERT(msg->msg_type == LNET_MSG_REPLY || LASSERT(msg->msg_type == LNET_MSG_REPLY ||
msg->msg_type == LNET_MSG_GET); msg->msg_type == LNET_MSG_GET);
counters->send_length += msg->msg_wanted; counters->send_length += msg->msg_wanted;
...@@ -254,8 +258,10 @@ lnet_msg_decommit_rx(lnet_msg_t *msg, int status) ...@@ -254,8 +258,10 @@ lnet_msg_decommit_rx(lnet_msg_t *msg, int status)
break; break;
case LNET_EVENT_REPLY: case LNET_EVENT_REPLY:
/* type is "GET" if it's an optimized GET on active side, /*
* see details in lnet_create_reply_msg() */ * type is "GET" if it's an optimized GET on active side,
* see details in lnet_create_reply_msg()
*/
LASSERT(msg->msg_type == LNET_MSG_GET || LASSERT(msg->msg_type == LNET_MSG_GET ||
msg->msg_type == LNET_MSG_REPLY); msg->msg_type == LNET_MSG_REPLY);
break; break;
...@@ -309,10 +315,12 @@ lnet_msg_attach_md(lnet_msg_t *msg, lnet_libmd_t *md, ...@@ -309,10 +315,12 @@ lnet_msg_attach_md(lnet_msg_t *msg, lnet_libmd_t *md,
unsigned int offset, unsigned int mlen) unsigned int offset, unsigned int mlen)
{ {
/* NB: @offset and @len are only useful for receiving */ /* NB: @offset and @len are only useful for receiving */
/* Here, we attach the MD on lnet_msg and mark it busy and /*
* Here, we attach the MD on lnet_msg and mark it busy and
* decrementing its threshold. Come what may, the lnet_msg "owns" * decrementing its threshold. Come what may, the lnet_msg "owns"
* the MD until a call to lnet_msg_detach_md or lnet_finalize() * the MD until a call to lnet_msg_detach_md or lnet_finalize()
* signals completion. */ * signals completion.
*/
LASSERT(!msg->msg_routing); LASSERT(!msg->msg_routing);
msg->msg_md = md; msg->msg_md = md;
...@@ -383,8 +391,10 @@ lnet_complete_msg_locked(lnet_msg_t *msg, int cpt) ...@@ -383,8 +391,10 @@ lnet_complete_msg_locked(lnet_msg_t *msg, int cpt)
msg->msg_hdr.msg.ack.match_bits = msg->msg_ev.match_bits; msg->msg_hdr.msg.ack.match_bits = msg->msg_ev.match_bits;
msg->msg_hdr.msg.ack.mlength = cpu_to_le32(msg->msg_ev.mlength); msg->msg_hdr.msg.ack.mlength = cpu_to_le32(msg->msg_ev.mlength);
/* NB: we probably want to use NID of msg::msg_from as 3rd /*
* parameter (router NID) if it's routed message */ * NB: we probably want to use NID of msg::msg_from as 3rd
* parameter (router NID) if it's routed message
*/
rc = lnet_send(msg->msg_ev.target.nid, msg, LNET_NID_ANY); rc = lnet_send(msg->msg_ev.target.nid, msg, LNET_NID_ANY);
lnet_net_lock(cpt); lnet_net_lock(cpt);
...@@ -491,9 +501,10 @@ lnet_finalize(lnet_ni_t *ni, lnet_msg_t *msg, int status) ...@@ -491,9 +501,10 @@ lnet_finalize(lnet_ni_t *ni, lnet_msg_t *msg, int status)
container = the_lnet.ln_msg_containers[cpt]; container = the_lnet.ln_msg_containers[cpt];
list_add_tail(&msg->msg_list, &container->msc_finalizing); list_add_tail(&msg->msg_list, &container->msc_finalizing);
/* Recursion breaker. Don't complete the message here if I am (or /*
* enough other threads are) already completing messages */ * Recursion breaker. Don't complete the message here if I am (or
* enough other threads are) already completing messages
*/
my_slot = -1; my_slot = -1;
for (i = 0; i < container->msc_nfinalizers; i++) { for (i = 0; i < container->msc_nfinalizers; i++) {
if (container->msc_finalizers[i] == current) if (container->msc_finalizers[i] == current)
...@@ -516,8 +527,10 @@ lnet_finalize(lnet_ni_t *ni, lnet_msg_t *msg, int status) ...@@ -516,8 +527,10 @@ lnet_finalize(lnet_ni_t *ni, lnet_msg_t *msg, int status)
list_del(&msg->msg_list); list_del(&msg->msg_list);
/* NB drops and regains the lnet lock if it actually does /*
* anything, so my finalizing friends can chomp along too */ * NB drops and regains the lnet lock if it actually does
* anything, so my finalizing friends can chomp along too
*/
rc = lnet_complete_msg_locked(msg, cpt); rc = lnet_complete_msg_locked(msg, cpt);
if (rc != 0) if (rc != 0)
break; break;
......
...@@ -139,8 +139,10 @@ static int ...@@ -139,8 +139,10 @@ static int
lnet_try_match_md(lnet_libmd_t *md, lnet_try_match_md(lnet_libmd_t *md,
struct lnet_match_info *info, struct lnet_msg *msg) struct lnet_match_info *info, struct lnet_msg *msg)
{ {
/* ALWAYS called holding the lnet_res_lock, and can't lnet_res_unlock; /*
* lnet_match_blocked_msg() relies on this to avoid races */ * ALWAYS called holding the lnet_res_lock, and can't lnet_res_unlock;
* lnet_match_blocked_msg() relies on this to avoid races
*/
unsigned int offset; unsigned int offset;
unsigned int mlength; unsigned int mlength;
lnet_me_t *me = md->md_me; lnet_me_t *me = md->md_me;
...@@ -203,9 +205,11 @@ lnet_try_match_md(lnet_libmd_t *md, ...@@ -203,9 +205,11 @@ lnet_try_match_md(lnet_libmd_t *md,
if (!lnet_md_exhausted(md)) if (!lnet_md_exhausted(md))
return LNET_MATCHMD_OK; return LNET_MATCHMD_OK;
/* Auto-unlink NOW, so the ME gets unlinked if required. /*
* Auto-unlink NOW, so the ME gets unlinked if required.
* We bumped md->md_refcount above so the MD just gets flagged * We bumped md->md_refcount above so the MD just gets flagged
* for unlink when it is finalized. */ * for unlink when it is finalized.
*/
if ((md->md_flags & LNET_MD_FLAG_AUTO_UNLINK) != 0) if ((md->md_flags & LNET_MD_FLAG_AUTO_UNLINK) != 0)
lnet_md_unlink(md); lnet_md_unlink(md);
...@@ -248,8 +252,10 @@ lnet_mt_of_attach(unsigned int index, lnet_process_id_t id, ...@@ -248,8 +252,10 @@ lnet_mt_of_attach(unsigned int index, lnet_process_id_t id,
return NULL; return NULL;
case LNET_INS_BEFORE: case LNET_INS_BEFORE:
case LNET_INS_AFTER: case LNET_INS_AFTER:
/* posted by no affinity thread, always hash to specific /*
* match-table to avoid buffer stealing which is heavy */ * posted by no affinity thread, always hash to specific
* match-table to avoid buffer stealing which is heavy
*/
return ptl->ptl_mtables[ptl->ptl_index % LNET_CPT_NUMBER]; return ptl->ptl_mtables[ptl->ptl_index % LNET_CPT_NUMBER];
case LNET_INS_LOCAL: case LNET_INS_LOCAL:
/* posted by cpu-affinity thread */ /* posted by cpu-affinity thread */
...@@ -299,9 +305,11 @@ lnet_mt_of_match(struct lnet_match_info *info, struct lnet_msg *msg) ...@@ -299,9 +305,11 @@ lnet_mt_of_match(struct lnet_match_info *info, struct lnet_msg *msg)
nmaps = ptl->ptl_mt_nmaps; nmaps = ptl->ptl_mt_nmaps;
/* map to an active mtable to avoid heavy "stealing" */ /* map to an active mtable to avoid heavy "stealing" */
if (nmaps != 0) { if (nmaps != 0) {
/* NB: there is possibility that ptl_mt_maps is being /*
* NB: there is possibility that ptl_mt_maps is being
* changed because we are not under protection of * changed because we are not under protection of
* lnet_ptl_lock, but it shouldn't hurt anything */ * lnet_ptl_lock, but it shouldn't hurt anything
*/
cpt = ptl->ptl_mt_maps[rotor % nmaps]; cpt = ptl->ptl_mt_maps[rotor % nmaps];
} }
} }
...@@ -401,8 +409,10 @@ lnet_mt_match_md(struct lnet_match_table *mtable, ...@@ -401,8 +409,10 @@ lnet_mt_match_md(struct lnet_match_table *mtable,
exhausted = 0; /* mlist is not empty */ exhausted = 0; /* mlist is not empty */
if ((rc & LNET_MATCHMD_FINISH) != 0) { if ((rc & LNET_MATCHMD_FINISH) != 0) {
/* don't return EXHAUSTED bit because we don't know /*
* whether the mlist is empty or not */ * don't return EXHAUSTED bit because we don't know
* whether the mlist is empty or not
*/
return rc & ~LNET_MATCHMD_EXHAUSTED; return rc & ~LNET_MATCHMD_EXHAUSTED;
} }
} }
...@@ -430,8 +440,10 @@ lnet_ptl_match_early(struct lnet_portal *ptl, struct lnet_msg *msg) ...@@ -430,8 +440,10 @@ lnet_ptl_match_early(struct lnet_portal *ptl, struct lnet_msg *msg)
{ {
int rc; int rc;
/* message arrived before any buffer posting on this portal, /*
* simply delay or drop this message */ * message arrived before any buffer posting on this portal,
* simply delay or drop this message
*/
if (likely(lnet_ptl_is_wildcard(ptl) || lnet_ptl_is_unique(ptl))) if (likely(lnet_ptl_is_wildcard(ptl) || lnet_ptl_is_unique(ptl)))
return 0; return 0;
...@@ -465,9 +477,11 @@ lnet_ptl_match_delay(struct lnet_portal *ptl, ...@@ -465,9 +477,11 @@ lnet_ptl_match_delay(struct lnet_portal *ptl,
int rc = 0; int rc = 0;
int i; int i;
/* steal buffer from other CPTs, and delay it if nothing to steal, /*
* steal buffer from other CPTs, and delay it if nothing to steal,
* this function is more expensive than a regular match, but we * this function is more expensive than a regular match, but we
* don't expect it can happen a lot */ * don't expect it can happen a lot
*/
LASSERT(lnet_ptl_is_wildcard(ptl)); LASSERT(lnet_ptl_is_wildcard(ptl));
for (i = 0; i < LNET_CPT_NUMBER; i++) { for (i = 0; i < LNET_CPT_NUMBER; i++) {
...@@ -498,8 +512,10 @@ lnet_ptl_match_delay(struct lnet_portal *ptl, ...@@ -498,8 +512,10 @@ lnet_ptl_match_delay(struct lnet_portal *ptl,
list_del_init(&msg->msg_list); list_del_init(&msg->msg_list);
} else { } else {
/* could be matched by lnet_ptl_attach_md() /*
* which is called by another thread */ * could be matched by lnet_ptl_attach_md()
* which is called by another thread
*/
rc = msg->msg_md == NULL ? rc = msg->msg_md == NULL ?
LNET_MATCHMD_DROP : LNET_MATCHMD_OK; LNET_MATCHMD_DROP : LNET_MATCHMD_OK;
} }
......
...@@ -258,9 +258,10 @@ lnet_sock_write(struct socket *sock, void *buffer, int nob, int timeout) ...@@ -258,9 +258,10 @@ lnet_sock_write(struct socket *sock, void *buffer, int nob, int timeout)
struct timeval tv; struct timeval tv;
LASSERT(nob > 0); LASSERT(nob > 0);
/* Caller may pass a zero timeout if she thinks the socket buffer is /*
* empty enough to take the whole message immediately */ * Caller may pass a zero timeout if she thinks the socket buffer is
* empty enough to take the whole message immediately
*/
for (;;) { for (;;) {
struct kvec iov = { struct kvec iov = {
.iov_base = buffer, .iov_base = buffer,
...@@ -524,8 +525,10 @@ lnet_sock_accept(struct socket **newsockp, struct socket *sock) ...@@ -524,8 +525,10 @@ lnet_sock_accept(struct socket **newsockp, struct socket *sock)
init_waitqueue_entry(&wait, current); init_waitqueue_entry(&wait, current);
/* XXX this should add a ref to sock->ops->owner, if /*
* TCP could be a module */ * XXX this should add a ref to sock->ops->owner, if
* TCP could be a module
*/
rc = sock_create_lite(PF_PACKET, sock->type, IPPROTO_TCP, &newsock); rc = sock_create_lite(PF_PACKET, sock->type, IPPROTO_TCP, &newsock);
if (rc) { if (rc) {
CERROR("Can't allocate socket\n"); CERROR("Can't allocate socket\n");
...@@ -578,10 +581,12 @@ lnet_sock_connect(struct socket **sockp, int *fatal, __u32 local_ip, ...@@ -578,10 +581,12 @@ lnet_sock_connect(struct socket **sockp, int *fatal, __u32 local_ip,
if (rc == 0) if (rc == 0)
return 0; return 0;
/* EADDRNOTAVAIL probably means we're already connected to the same /*
* EADDRNOTAVAIL probably means we're already connected to the same
* peer/port on the same local port on a differently typed * peer/port on the same local port on a differently typed
* connection. Let our caller retry with a different local * connection. Let our caller retry with a different local
* port... */ * port...
*/
*fatal = !(rc == -EADDRNOTAVAIL); *fatal = !(rc == -EADDRNOTAVAIL);
CDEBUG_LIMIT(*fatal ? D_NETERROR : D_NET, CDEBUG_LIMIT(*fatal ? D_NETERROR : D_NET,
......
...@@ -96,9 +96,11 @@ lnet_ioctl(unsigned int cmd, struct libcfs_ioctl_data *data) ...@@ -96,9 +96,11 @@ lnet_ioctl(unsigned int cmd, struct libcfs_ioctl_data *data)
return lnet_unconfigure(); return lnet_unconfigure();
default: default:
/* Passing LNET_PID_ANY only gives me a ref if the net is up /*
* Passing LNET_PID_ANY only gives me a ref if the net is up
* already; I'll need it to ensure the net can't go down while * already; I'll need it to ensure the net can't go down while
* I'm called into it */ * I'm called into it
*/
rc = LNetNIInit(LNET_PID_ANY); rc = LNetNIInit(LNET_PID_ANY);
if (rc >= 0) { if (rc >= 0) {
rc = LNetCtl(cmd, data); rc = LNetCtl(cmd, data);
...@@ -127,8 +129,10 @@ init_lnet(void) ...@@ -127,8 +129,10 @@ init_lnet(void)
LASSERT(rc == 0); LASSERT(rc == 0);
if (config_on_load) { if (config_on_load) {
/* Have to schedule a separate thread to avoid deadlocking /*
* in modload */ * Have to schedule a separate thread to avoid deadlocking
* in modload
*/
(void) kthread_run(lnet_configure, NULL, "lnet_initd"); (void) kthread_run(lnet_configure, NULL, "lnet_initd");
} }
......
...@@ -210,9 +210,11 @@ add_nidrange(const struct cfs_lstr *src, ...@@ -210,9 +210,11 @@ add_nidrange(const struct cfs_lstr *src,
/* network name only, e.g. "elan" or "tcp" */ /* network name only, e.g. "elan" or "tcp" */
netnum = 0; netnum = 0;
else { else {
/* e.g. "elan25" or "tcp23", refuse to parse if /*
* e.g. "elan25" or "tcp23", refuse to parse if
* network name is not appended with decimal or * network name is not appended with decimal or
* hexadecimal number */ * hexadecimal number
*/
if (!cfs_str2num_check(src->ls_str + strlen(nf->nf_name), if (!cfs_str2num_check(src->ls_str + strlen(nf->nf_name),
endlen, &netnum, 0, MAX_NUMERIC_VALUE)) endlen, &netnum, 0, MAX_NUMERIC_VALUE))
return NULL; return NULL;
...@@ -784,12 +786,14 @@ libcfs_ip_addr2str(__u32 addr, char *str, size_t size) ...@@ -784,12 +786,14 @@ libcfs_ip_addr2str(__u32 addr, char *str, size_t size)
(addr >> 8) & 0xff, addr & 0xff); (addr >> 8) & 0xff, addr & 0xff);
} }
/* CAVEAT EMPTOR XscanfX /*
* CAVEAT EMPTOR XscanfX
* I use "%n" at the end of a sscanf format to detect trailing junk. However * I use "%n" at the end of a sscanf format to detect trailing junk. However
* sscanf may return immediately if it sees the terminating '0' in a string, so * sscanf may return immediately if it sees the terminating '0' in a string, so
* I initialise the %n variable to the expected length. If sscanf sets it; * I initialise the %n variable to the expected length. If sscanf sets it;
* fine, if it doesn't, then the scan ended at the end of the string, which is * fine, if it doesn't, then the scan ended at the end of the string, which is
* fine too :) */ * fine too :)
*/
static int static int
libcfs_ip_str2addr(const char *str, int nob, __u32 *addr) libcfs_ip_str2addr(const char *str, int nob, __u32 *addr)
{ {
......
...@@ -61,8 +61,10 @@ lnet_peer_buffer_credits(lnet_ni_t *ni) ...@@ -61,8 +61,10 @@ lnet_peer_buffer_credits(lnet_ni_t *ni)
if (peer_buffer_credits > 0) if (peer_buffer_credits > 0)
return peer_buffer_credits; return peer_buffer_credits;
/* As an approximation, allow this peer the same number of router /*
* buffers as it is allowed outstanding sends */ * As an approximation, allow this peer the same number of router
* buffers as it is allowed outstanding sends
*/
return ni->ni_peertxcredits; return ni->ni_peertxcredits;
} }
...@@ -131,10 +133,11 @@ lnet_ni_notify_locked(lnet_ni_t *ni, lnet_peer_t *lp) ...@@ -131,10 +133,11 @@ lnet_ni_notify_locked(lnet_ni_t *ni, lnet_peer_t *lp)
int alive; int alive;
int notifylnd; int notifylnd;
/* Notify only in 1 thread at any time to ensure ordered notification. /*
* Notify only in 1 thread at any time to ensure ordered notification.
* NB individual events can be missed; the only guarantee is that you * NB individual events can be missed; the only guarantee is that you
* always get the most recent news */ * always get the most recent news
*/
if (lp->lp_notifying || ni == NULL) if (lp->lp_notifying || ni == NULL)
return; return;
...@@ -150,9 +153,10 @@ lnet_ni_notify_locked(lnet_ni_t *ni, lnet_peer_t *lp) ...@@ -150,9 +153,10 @@ lnet_ni_notify_locked(lnet_ni_t *ni, lnet_peer_t *lp)
if (notifylnd && ni->ni_lnd->lnd_notify != NULL) { if (notifylnd && ni->ni_lnd->lnd_notify != NULL) {
lnet_net_unlock(lp->lp_cpt); lnet_net_unlock(lp->lp_cpt);
/* A new notification could happen now; I'll handle it /*
* when control returns to me */ * A new notification could happen now; I'll handle it
* when control returns to me
*/
(ni->ni_lnd->lnd_notify)(ni, lp->lp_nid, alive); (ni->ni_lnd->lnd_notify)(ni, lp->lp_nid, alive);
lnet_net_lock(lp->lp_cpt); lnet_net_lock(lp->lp_cpt);
...@@ -245,8 +249,10 @@ static void lnet_shuffle_seed(void) ...@@ -245,8 +249,10 @@ static void lnet_shuffle_seed(void)
cfs_get_random_bytes(seed, sizeof(seed)); cfs_get_random_bytes(seed, sizeof(seed));
/* Nodes with small feet have little entropy /*
* the NID for this node gives the most entropy in the low bits */ * Nodes with small feet have little entropy
* the NID for this node gives the most entropy in the low bits
*/
list_for_each(tmp, &the_lnet.ln_nis) { list_for_each(tmp, &the_lnet.ln_nis) {
ni = list_entry(tmp, lnet_ni_t, ni_list); ni = list_entry(tmp, lnet_ni_t, ni_list);
lnd_type = LNET_NETTYP(LNET_NIDNET(ni->ni_nid)); lnd_type = LNET_NETTYP(LNET_NIDNET(ni->ni_nid));
...@@ -472,9 +478,10 @@ lnet_del_route(__u32 net, lnet_nid_t gw_nid) ...@@ -472,9 +478,10 @@ lnet_del_route(__u32 net, lnet_nid_t gw_nid)
CDEBUG(D_NET, "Del route: net %s : gw %s\n", CDEBUG(D_NET, "Del route: net %s : gw %s\n",
libcfs_net2str(net), libcfs_nid2str(gw_nid)); libcfs_net2str(net), libcfs_nid2str(gw_nid));
/* NB Caller may specify either all routes via the given gateway /*
* or a specific route entry actual NIDs) */ * NB Caller may specify either all routes via the given gateway
* or a specific route entry actual NIDs)
*/
lnet_net_lock(LNET_LOCK_EX); lnet_net_lock(LNET_LOCK_EX);
if (net == LNET_NIDNET(LNET_NID_ANY)) if (net == LNET_NIDNET(LNET_NID_ANY))
rn_list = &the_lnet.ln_remote_nets_hash[0]; rn_list = &the_lnet.ln_remote_nets_hash[0];
...@@ -663,8 +670,10 @@ lnet_parse_rc_info(lnet_rc_data_t *rcd) ...@@ -663,8 +670,10 @@ lnet_parse_rc_info(lnet_rc_data_t *rcd)
up = 1; up = 1;
break; break;
} }
/* ptl NIs are considered down only when /*
* they're all down */ * ptl NIs are considered down only when
* they're all down
*/
if (LNET_NETTYP(LNET_NIDNET(nid)) == PTLLND) if (LNET_NETTYP(LNET_NIDNET(nid)) == PTLLND)
ptl_status = LNET_NI_STATUS_UP; ptl_status = LNET_NI_STATUS_UP;
continue; continue;
...@@ -703,9 +712,11 @@ lnet_router_checker_event(lnet_event_t *event) ...@@ -703,9 +712,11 @@ lnet_router_checker_event(lnet_event_t *event)
lp = rcd->rcd_gateway; lp = rcd->rcd_gateway;
LASSERT(lp != NULL); LASSERT(lp != NULL);
/* NB: it's called with holding lnet_res_lock, we have a few /*
* places need to hold both locks at the same time, please take * NB: it's called with holding lnet_res_lock, we have a few
* care of lock ordering */ * places need to hold both locks at the same time, please take
* care of lock ordering
*/
lnet_net_lock(lp->lp_cpt); lnet_net_lock(lp->lp_cpt);
if (!lnet_isrouter(lp) || lp->lp_rcd != rcd) { if (!lnet_isrouter(lp) || lp->lp_rcd != rcd) {
/* ignore if no longer a router or rcd is replaced */ /* ignore if no longer a router or rcd is replaced */
...@@ -719,17 +730,20 @@ lnet_router_checker_event(lnet_event_t *event) ...@@ -719,17 +730,20 @@ lnet_router_checker_event(lnet_event_t *event)
} }
/* LNET_EVENT_REPLY */ /* LNET_EVENT_REPLY */
/* A successful REPLY means the router is up. If _any_ comms /*
* A successful REPLY means the router is up. If _any_ comms
* to the router fail I assume it's down (this will happen if * to the router fail I assume it's down (this will happen if
* we ping alive routers to try to detect router death before * we ping alive routers to try to detect router death before
* apps get burned). */ * apps get burned).
*/
lnet_notify_locked(lp, 1, (event->status == 0), cfs_time_current()); lnet_notify_locked(lp, 1, (event->status == 0), cfs_time_current());
/* The router checker will wake up very shortly and do the
/*
* The router checker will wake up very shortly and do the
* actual notification. * actual notification.
* XXX If 'lp' stops being a router before then, it will still * XXX If 'lp' stops being a router before then, it will still
* have the notification pending!!! */ * have the notification pending!!!
*/
if (avoid_asym_router_failure && event->status == 0) if (avoid_asym_router_failure && event->status == 0)
lnet_parse_rc_info(rcd); lnet_parse_rc_info(rcd);
...@@ -816,8 +830,10 @@ lnet_update_ni_status_locked(void) ...@@ -816,8 +830,10 @@ lnet_update_ni_status_locked(void)
if (ni->ni_status->ns_status != LNET_NI_STATUS_DOWN) { if (ni->ni_status->ns_status != LNET_NI_STATUS_DOWN) {
CDEBUG(D_NET, "NI(%s:%d) status changed to down\n", CDEBUG(D_NET, "NI(%s:%d) status changed to down\n",
libcfs_nid2str(ni->ni_nid), timeout); libcfs_nid2str(ni->ni_nid), timeout);
/* NB: so far, this is the only place to set /*
* NI status to "down" */ * NB: so far, this is the only place to set
* NI status to "down"
*/
ni->ni_status->ns_status = LNET_NI_STATUS_DOWN; ni->ni_status->ns_status = LNET_NI_STATUS_DOWN;
} }
lnet_ni_unlock(ni); lnet_ni_unlock(ni);
...@@ -1018,8 +1034,10 @@ lnet_router_checker_start(void) ...@@ -1018,8 +1034,10 @@ lnet_router_checker_start(void)
return 0; return 0;
sema_init(&the_lnet.ln_rc_signal, 0); sema_init(&the_lnet.ln_rc_signal, 0);
/* EQ size doesn't matter; the callback is guaranteed to get every /*
* event */ * EQ size doesn't matter; the callback is guaranteed to get every
* event
*/
eqsz = 0; eqsz = 0;
rc = LNetEQAlloc(eqsz, lnet_router_checker_event, rc = LNetEQAlloc(eqsz, lnet_router_checker_event,
&the_lnet.ln_rc_eqh); &the_lnet.ln_rc_eqh);
...@@ -1042,9 +1060,11 @@ lnet_router_checker_start(void) ...@@ -1042,9 +1060,11 @@ lnet_router_checker_start(void)
} }
if (check_routers_before_use) { if (check_routers_before_use) {
/* Note that a helpful side-effect of pinging all known routers /*
* Note that a helpful side-effect of pinging all known routers
* at startup is that it makes them drop stale connections they * at startup is that it makes them drop stale connections they
* may have to a previous instance of me. */ * may have to a previous instance of me.
*/
lnet_wait_known_routerstate(); lnet_wait_known_routerstate();
} }
...@@ -1199,9 +1219,11 @@ lnet_router_checker(void *arg) ...@@ -1199,9 +1219,11 @@ lnet_router_checker(void *arg)
lnet_prune_rc_data(0); /* don't wait for UNLINK */ lnet_prune_rc_data(0); /* don't wait for UNLINK */
/* Call schedule_timeout() here always adds 1 to load average /*
* Call schedule_timeout() here always adds 1 to load average
* because kernel counts # active tasks as nr_running * because kernel counts # active tasks as nr_running
* + nr_uninterruptible. */ * + nr_uninterruptible.
*/
set_current_state(TASK_INTERRUPTIBLE); set_current_state(TASK_INTERRUPTIBLE);
schedule_timeout(cfs_time_seconds(1)); schedule_timeout(cfs_time_seconds(1));
} }
...@@ -1541,10 +1563,12 @@ lnet_notify(lnet_ni_t *ni, lnet_nid_t nid, int alive, unsigned long when) ...@@ -1541,10 +1563,12 @@ lnet_notify(lnet_ni_t *ni, lnet_nid_t nid, int alive, unsigned long when)
return 0; return 0;
} }
/* We can't fully trust LND on reporting exact peer last_alive /*
* We can't fully trust LND on reporting exact peer last_alive
* if he notifies us about dead peer. For example ksocklnd can * if he notifies us about dead peer. For example ksocklnd can
* call us with when == _time_when_the_node_was_booted_ if * call us with when == _time_when_the_node_was_booted_ if
* no connections were successfully established */ * no connections were successfully established
*/
if (ni != NULL && !alive && when < lp->lp_last_alive) if (ni != NULL && !alive && when < lp->lp_last_alive)
when = lp->lp_last_alive; when = lp->lp_last_alive;
......
...@@ -25,8 +25,10 @@ ...@@ -25,8 +25,10 @@
#include "../../include/linux/libcfs/libcfs.h" #include "../../include/linux/libcfs/libcfs.h"
#include "../../include/linux/lnet/lib-lnet.h" #include "../../include/linux/lnet/lib-lnet.h"
/* This is really lnet_proc.c. You might need to update sanity test 215 /*
* if any file format is changed. */ * This is really lnet_proc.c. You might need to update sanity test 215
* if any file format is changed.
*/
#define LNET_LOFFT_BITS (sizeof(loff_t) * 8) #define LNET_LOFFT_BITS (sizeof(loff_t) * 8)
/* /*
...@@ -358,9 +360,11 @@ static int proc_lnet_routers(struct ctl_table *table, int write, ...@@ -358,9 +360,11 @@ static int proc_lnet_routers(struct ctl_table *table, int write,
if ((peer->lp_ping_feats & if ((peer->lp_ping_feats &
LNET_PING_FEAT_NI_STATUS) != 0) { LNET_PING_FEAT_NI_STATUS) != 0) {
list_for_each_entry(rtr, &peer->lp_routes, list_for_each_entry(rtr, &peer->lp_routes,
lr_gwlist) { lr_gwlist) {
/* downis on any route should be the /*
* number of downis on the gateway */ * downis on any route should be the
* number of downis on the gateway
*/
if (rtr->lr_downis != 0) { if (rtr->lr_downis != 0) {
down_ni = rtr->lr_downis; down_ni = rtr->lr_downis;
break; break;
...@@ -479,9 +483,11 @@ static int proc_lnet_peers(struct ctl_table *table, int write, ...@@ -479,9 +483,11 @@ static int proc_lnet_peers(struct ctl_table *table, int write,
if (skip == 0) { if (skip == 0) {
peer = lp; peer = lp;
/* minor optimization: start from idx+1 /*
* minor optimization: start from idx+1
* on next iteration if we've just * on next iteration if we've just
* drained lp_hashlist */ * drained lp_hashlist
*/
if (lp->lp_hashlist.next == if (lp->lp_hashlist.next ==
&ptable->pt_hash[hash]) { &ptable->pt_hash[hash]) {
hoff = 1; hoff = 1;
...@@ -710,8 +716,10 @@ static int proc_lnet_nis(struct ctl_table *table, int write, ...@@ -710,8 +716,10 @@ static int proc_lnet_nis(struct ctl_table *table, int write,
LNET_NI_STATUS_UP) ? "up" : "down"; LNET_NI_STATUS_UP) ? "up" : "down";
lnet_ni_unlock(ni); lnet_ni_unlock(ni);
/* we actually output credits information for /*
* TX queue of each partition */ * we actually output credits information for
* TX queue of each partition
*/
cfs_percpt_for_each(tq, i, ni->ni_tx_queues) { cfs_percpt_for_each(tq, i, ni->ni_tx_queues) {
for (j = 0; ni->ni_cpts != NULL && for (j = 0; ni->ni_cpts != NULL &&
j < ni->ni_ncpts; j++) { j < ni->ni_ncpts; j++) {
......
...@@ -86,15 +86,19 @@ brw_client_init(sfw_test_instance_t *tsi) ...@@ -86,15 +86,19 @@ brw_client_init(sfw_test_instance_t *tsi)
opc = breq->blk_opc; opc = breq->blk_opc;
flags = breq->blk_flags; flags = breq->blk_flags;
npg = breq->blk_npg; npg = breq->blk_npg;
/* NB: this is not going to work for variable page size, /*
* but we have to keep it for compatibility */ * NB: this is not going to work for variable page size,
* but we have to keep it for compatibility
*/
len = npg * PAGE_CACHE_SIZE; len = npg * PAGE_CACHE_SIZE;
} else { } else {
test_bulk_req_v1_t *breq = &tsi->tsi_u.bulk_v1; test_bulk_req_v1_t *breq = &tsi->tsi_u.bulk_v1;
/* I should never get this step if it's unknown feature /*
* because make_session will reject unknown feature */ * I should never get this step if it's unknown feature
* because make_session will reject unknown feature
*/
LASSERT((sn->sn_features & ~LST_FEATS_MASK) == 0); LASSERT((sn->sn_features & ~LST_FEATS_MASK) == 0);
opc = breq->blk_opc; opc = breq->blk_opc;
...@@ -279,8 +283,10 @@ brw_client_prep_rpc(sfw_test_unit_t *tsu, ...@@ -279,8 +283,10 @@ brw_client_prep_rpc(sfw_test_unit_t *tsu,
} else { } else {
test_bulk_req_v1_t *breq = &tsi->tsi_u.bulk_v1; test_bulk_req_v1_t *breq = &tsi->tsi_u.bulk_v1;
/* I should never get this step if it's unknown feature /*
* because make_session will reject unknown feature */ * I should never get this step if it's unknown feature
* because make_session will reject unknown feature
*/
LASSERT((sn->sn_features & ~LST_FEATS_MASK) == 0); LASSERT((sn->sn_features & ~LST_FEATS_MASK) == 0);
opc = breq->blk_opc; opc = breq->blk_opc;
......
...@@ -60,8 +60,10 @@ lstcon_rpc_done(srpc_client_rpc_t *rpc) ...@@ -60,8 +60,10 @@ lstcon_rpc_done(srpc_client_rpc_t *rpc)
spin_lock(&rpc->crpc_lock); spin_lock(&rpc->crpc_lock);
if (crpc->crp_trans == NULL) { if (crpc->crp_trans == NULL) {
/* Orphan RPC is not in any transaction, /*
* I'm just a poor body and nobody loves me */ * Orphan RPC is not in any transaction,
* I'm just a poor body and nobody loves me
*/
spin_unlock(&rpc->crpc_lock); spin_unlock(&rpc->crpc_lock);
/* release it */ /* release it */
...@@ -241,8 +243,10 @@ lstcon_rpc_trans_prep(struct list_head *translist, ...@@ -241,8 +243,10 @@ lstcon_rpc_trans_prep(struct list_head *translist,
if (translist != NULL) { if (translist != NULL) {
list_for_each_entry(trans, translist, tas_link) { list_for_each_entry(trans, translist, tas_link) {
/* Can't enqueue two private transaction on /*
* the same object */ * Can't enqueue two private transaction on
* the same object
*/
if ((trans->tas_opc & transop) == LST_TRANS_PRIVATE) if ((trans->tas_opc & transop) == LST_TRANS_PRIVATE)
return -EPERM; return -EPERM;
} }
...@@ -563,11 +567,12 @@ lstcon_rpc_trans_destroy(lstcon_rpc_trans_t *trans) ...@@ -563,11 +567,12 @@ lstcon_rpc_trans_destroy(lstcon_rpc_trans_t *trans)
continue; continue;
} }
/* rpcs can be still not callbacked (even LNetMDUnlink is called) /*
* rpcs can be still not callbacked (even LNetMDUnlink is called)
* because huge timeout for inaccessible network, don't make * because huge timeout for inaccessible network, don't make
* user wait for them, just abandon them, they will be recycled * user wait for them, just abandon them, they will be recycled
* in callback */ * in callback
*/
LASSERT(crpc->crp_status != 0); LASSERT(crpc->crp_status != 0);
crpc->crp_node = NULL; crpc->crp_node = NULL;
......
...@@ -104,9 +104,11 @@ lstcon_node_find(lnet_process_id_t id, lstcon_node_t **ndpp, int create) ...@@ -104,9 +104,11 @@ lstcon_node_find(lnet_process_id_t id, lstcon_node_t **ndpp, int create)
ndl->ndl_node->nd_timeout = 0; ndl->ndl_node->nd_timeout = 0;
memset(&ndl->ndl_node->nd_ping, 0, sizeof(lstcon_rpc_t)); memset(&ndl->ndl_node->nd_ping, 0, sizeof(lstcon_rpc_t));
/* queued in global hash & list, no refcount is taken by /*
* queued in global hash & list, no refcount is taken by
* global hash & list, if caller release his refcount, * global hash & list, if caller release his refcount,
* node will be released */ * node will be released
*/
list_add_tail(&ndl->ndl_hlink, &console_session.ses_ndl_hash[idx]); list_add_tail(&ndl->ndl_hlink, &console_session.ses_ndl_hash[idx]);
list_add_tail(&ndl->ndl_link, &console_session.ses_ndl_list); list_add_tail(&ndl->ndl_link, &console_session.ses_ndl_list);
...@@ -601,8 +603,10 @@ lstcon_group_del(char *name) ...@@ -601,8 +603,10 @@ lstcon_group_del(char *name)
lstcon_rpc_trans_destroy(trans); lstcon_rpc_trans_destroy(trans);
lstcon_group_decref(grp); lstcon_group_decref(grp);
/* -ref for session, it's destroyed, /*
* status can't be rolled back, destroy group anyway */ * -ref for session, it's destroyed,
* status can't be rolled back, destroy group anyway
*/
lstcon_group_decref(grp); lstcon_group_decref(grp);
return rc; return rc;
......
...@@ -386,8 +386,10 @@ sfw_get_stats(srpc_stat_reqst_t *request, srpc_stat_reply_t *reply) ...@@ -386,8 +386,10 @@ sfw_get_stats(srpc_stat_reqst_t *request, srpc_stat_reply_t *reply)
lnet_counters_get(&reply->str_lnet); lnet_counters_get(&reply->str_lnet);
srpc_get_counters(&reply->str_rpc); srpc_get_counters(&reply->str_rpc);
/* send over the msecs since the session was started /*
- with 32 bits to send, this is ~49 days */ * send over the msecs since the session was started
* with 32 bits to send, this is ~49 days
*/
cnt->running_ms = jiffies_to_msecs(jiffies - sn->sn_started); cnt->running_ms = jiffies_to_msecs(jiffies - sn->sn_started);
cnt->brw_errors = atomic_read(&sn->sn_brw_errors); cnt->brw_errors = atomic_read(&sn->sn_brw_errors);
cnt->ping_errors = atomic_read(&sn->sn_ping_errors); cnt->ping_errors = atomic_read(&sn->sn_ping_errors);
...@@ -437,12 +439,14 @@ sfw_make_session(srpc_mksn_reqst_t *request, srpc_mksn_reply_t *reply) ...@@ -437,12 +439,14 @@ sfw_make_session(srpc_mksn_reqst_t *request, srpc_mksn_reply_t *reply)
} }
} }
/* reject the request if it requires unknown features /*
* reject the request if it requires unknown features
* NB: old version will always accept all features because it's not * NB: old version will always accept all features because it's not
* aware of srpc_msg_t::msg_ses_feats, it's a defect but it's also * aware of srpc_msg_t::msg_ses_feats, it's a defect but it's also
* harmless because it will return zero feature to console, and it's * harmless because it will return zero feature to console, and it's
* console's responsibility to make sure all nodes in a session have * console's responsibility to make sure all nodes in a session have
* same feature mask. */ * same feature mask.
*/
if ((msg->msg_ses_feats & ~LST_FEATS_MASK) != 0) { if ((msg->msg_ses_feats & ~LST_FEATS_MASK) != 0) {
reply->mksn_status = EPROTO; reply->mksn_status = EPROTO;
return 0; return 0;
...@@ -570,10 +574,12 @@ sfw_load_test(struct sfw_test_instance *tsi) ...@@ -570,10 +574,12 @@ sfw_load_test(struct sfw_test_instance *tsi)
if (rc != 0) { if (rc != 0) {
CWARN("Failed to reserve enough buffers: service %s, %d needed: %d\n", CWARN("Failed to reserve enough buffers: service %s, %d needed: %d\n",
svc->sv_name, nbuf, rc); svc->sv_name, nbuf, rc);
/* NB: this error handler is not strictly correct, because /*
* NB: this error handler is not strictly correct, because
* it may release more buffers than already allocated, * it may release more buffers than already allocated,
* but it doesn't matter because request portal should * but it doesn't matter because request portal should
* be lazy portal and will grow buffers if necessary. */ * be lazy portal and will grow buffers if necessary.
*/
srpc_service_remove_buffers(svc, nbuf); srpc_service_remove_buffers(svc, nbuf);
return -ENOMEM; return -ENOMEM;
} }
...@@ -594,9 +600,11 @@ sfw_unload_test(struct sfw_test_instance *tsi) ...@@ -594,9 +600,11 @@ sfw_unload_test(struct sfw_test_instance *tsi)
if (tsi->tsi_is_client) if (tsi->tsi_is_client)
return; return;
/* shrink buffers, because request portal is lazy portal /*
* shrink buffers, because request portal is lazy portal
* which can grow buffers at runtime so we may leave * which can grow buffers at runtime so we may leave
* some buffers behind, but never mind... */ * some buffers behind, but never mind...
*/
srpc_service_remove_buffers(tsc->tsc_srv_service, srpc_service_remove_buffers(tsc->tsc_srv_service,
sfw_test_buffers(tsi)); sfw_test_buffers(tsi));
return; return;
...@@ -1272,9 +1280,11 @@ sfw_handle_server_rpc(struct srpc_server_rpc *rpc) ...@@ -1272,9 +1280,11 @@ sfw_handle_server_rpc(struct srpc_server_rpc *rpc)
} }
} else if ((request->msg_ses_feats & ~LST_FEATS_MASK) != 0) { } else if ((request->msg_ses_feats & ~LST_FEATS_MASK) != 0) {
/* NB: at this point, old version will ignore features and /*
* NB: at this point, old version will ignore features and
* create new session anyway, so console should be able * create new session anyway, so console should be able
* to handle this */ * to handle this
*/
reply->msg_body.reply.status = EPROTO; reply->msg_body.reply.status = EPROTO;
goto out; goto out;
} }
......
...@@ -278,16 +278,20 @@ srpc_service_init(struct srpc_service *svc) ...@@ -278,16 +278,20 @@ srpc_service_init(struct srpc_service *svc)
scd->scd_ev.ev_data = scd; scd->scd_ev.ev_data = scd;
scd->scd_ev.ev_type = SRPC_REQUEST_RCVD; scd->scd_ev.ev_type = SRPC_REQUEST_RCVD;
/* NB: don't use lst_sched_serial for adding buffer, /*
* see details in srpc_service_add_buffers() */ * NB: don't use lst_sched_serial for adding buffer,
* see details in srpc_service_add_buffers()
*/
swi_init_workitem(&scd->scd_buf_wi, scd, swi_init_workitem(&scd->scd_buf_wi, scd,
srpc_add_buffer, lst_sched_test[i]); srpc_add_buffer, lst_sched_test[i]);
if (i != 0 && srpc_serv_is_framework(svc)) { if (i != 0 && srpc_serv_is_framework(svc)) {
/* NB: framework service only needs srpc_service_cd for /*
* NB: framework service only needs srpc_service_cd for
* one partition, but we allocate for all to make * one partition, but we allocate for all to make
* it easier to implement, it will waste a little * it easier to implement, it will waste a little
* memory but nobody should care about this */ * memory but nobody should care about this
*/
continue; continue;
} }
...@@ -414,9 +418,11 @@ srpc_post_active_rdma(int portal, __u64 matchbits, void *buf, int len, ...@@ -414,9 +418,11 @@ srpc_post_active_rdma(int portal, __u64 matchbits, void *buf, int len,
return -ENOMEM; return -ENOMEM;
} }
/* this is kind of an abuse of the LNET_MD_OP_{PUT,GET} options. /*
* this is kind of an abuse of the LNET_MD_OP_{PUT,GET} options.
* they're only meaningful for MDs attached to an ME (i.e. passive * they're only meaningful for MDs attached to an ME (i.e. passive
* buffers... */ * buffers...
*/
if ((options & LNET_MD_OP_PUT) != 0) { if ((options & LNET_MD_OP_PUT) != 0) {
rc = LNetPut(self, *mdh, LNET_NOACK_REQ, peer, rc = LNetPut(self, *mdh, LNET_NOACK_REQ, peer,
portal, matchbits, 0, 0); portal, matchbits, 0, 0);
...@@ -431,7 +437,8 @@ srpc_post_active_rdma(int portal, __u64 matchbits, void *buf, int len, ...@@ -431,7 +437,8 @@ srpc_post_active_rdma(int portal, __u64 matchbits, void *buf, int len,
((options & LNET_MD_OP_PUT) != 0) ? "Put" : "Get", ((options & LNET_MD_OP_PUT) != 0) ? "Put" : "Get",
libcfs_id2str(peer), portal, matchbits, rc); libcfs_id2str(peer), portal, matchbits, rc);
/* The forthcoming unlink event will complete this operation /*
* The forthcoming unlink event will complete this operation
* with failure, so fall through and return success here. * with failure, so fall through and return success here.
*/ */
rc = LNetMDUnlink(*mdh); rc = LNetMDUnlink(*mdh);
...@@ -476,10 +483,11 @@ srpc_service_post_buffer(struct srpc_service_cd *scd, struct srpc_buffer *buf) ...@@ -476,10 +483,11 @@ srpc_service_post_buffer(struct srpc_service_cd *scd, struct srpc_buffer *buf)
msg, sizeof(*msg), &buf->buf_mdh, msg, sizeof(*msg), &buf->buf_mdh,
&scd->scd_ev); &scd->scd_ev);
/* At this point, a RPC (new or delayed) may have arrived in /*
* At this point, a RPC (new or delayed) may have arrived in
* msg and its event handler has been called. So we must add * msg and its event handler has been called. So we must add
* buf to scd_buf_posted _before_ dropping scd_lock */ * buf to scd_buf_posted _before_ dropping scd_lock
*/
spin_lock(&scd->scd_lock); spin_lock(&scd->scd_lock);
if (rc == 0) { if (rc == 0) {
...@@ -487,8 +495,10 @@ srpc_service_post_buffer(struct srpc_service_cd *scd, struct srpc_buffer *buf) ...@@ -487,8 +495,10 @@ srpc_service_post_buffer(struct srpc_service_cd *scd, struct srpc_buffer *buf)
return 0; return 0;
spin_unlock(&scd->scd_lock); spin_unlock(&scd->scd_lock);
/* srpc_shutdown_service might have tried to unlink me /*
* when my buf_mdh was still invalid */ * srpc_shutdown_service might have tried to unlink me
* when my buf_mdh was still invalid
*/
LNetMDUnlink(buf->buf_mdh); LNetMDUnlink(buf->buf_mdh);
spin_lock(&scd->scd_lock); spin_lock(&scd->scd_lock);
return 0; return 0;
...@@ -514,9 +524,11 @@ srpc_add_buffer(struct swi_workitem *wi) ...@@ -514,9 +524,11 @@ srpc_add_buffer(struct swi_workitem *wi)
struct srpc_buffer *buf; struct srpc_buffer *buf;
int rc = 0; int rc = 0;
/* it's called by workitem scheduler threads, these threads /*
* it's called by workitem scheduler threads, these threads
* should have been set CPT affinity, so buffers will be posted * should have been set CPT affinity, so buffers will be posted
* on CPT local list of Portal */ * on CPT local list of Portal
*/
spin_lock(&scd->scd_lock); spin_lock(&scd->scd_lock);
while (scd->scd_buf_adjust > 0 && while (scd->scd_buf_adjust > 0 &&
...@@ -732,9 +744,11 @@ srpc_abort_service(struct srpc_service *sv) ...@@ -732,9 +744,11 @@ srpc_abort_service(struct srpc_service *sv)
cfs_percpt_for_each(scd, i, sv->sv_cpt_data) { cfs_percpt_for_each(scd, i, sv->sv_cpt_data) {
spin_lock(&scd->scd_lock); spin_lock(&scd->scd_lock);
/* schedule in-flight RPCs to notice the abort, NB: /*
* schedule in-flight RPCs to notice the abort, NB:
* racing with incoming RPCs; complete fix should make test * racing with incoming RPCs; complete fix should make test
* RPCs carry session ID in its headers */ * RPCs carry session ID in its headers
*/
list_for_each_entry(rpc, &scd->scd_rpc_active, srpc_list) { list_for_each_entry(rpc, &scd->scd_rpc_active, srpc_list) {
rpc->srpc_aborted = 1; rpc->srpc_aborted = 1;
swi_schedule_workitem(&rpc->srpc_wi); swi_schedule_workitem(&rpc->srpc_wi);
...@@ -772,8 +786,10 @@ srpc_shutdown_service(srpc_service_t *sv) ...@@ -772,8 +786,10 @@ srpc_shutdown_service(srpc_service_t *sv)
spin_unlock(&scd->scd_lock); spin_unlock(&scd->scd_lock);
/* OK to traverse scd_buf_posted without lock, since no one /*
* touches scd_buf_posted now */ * OK to traverse scd_buf_posted without lock, since no one
* touches scd_buf_posted now
*/
list_for_each_entry(buf, &scd->scd_buf_posted, buf_list) list_for_each_entry(buf, &scd->scd_buf_posted, buf_list)
LNetMDUnlink(buf->buf_mdh); LNetMDUnlink(buf->buf_mdh);
} }
...@@ -915,8 +931,10 @@ srpc_server_rpc_done(struct srpc_server_rpc *rpc, int status) ...@@ -915,8 +931,10 @@ srpc_server_rpc_done(struct srpc_server_rpc *rpc, int status)
spin_lock(&scd->scd_lock); spin_lock(&scd->scd_lock);
if (rpc->srpc_reqstbuf != NULL) { if (rpc->srpc_reqstbuf != NULL) {
/* NB might drop sv_lock in srpc_service_recycle_buffer, but /*
* sv won't go away for scd_rpc_active must not be empty */ * NB might drop sv_lock in srpc_service_recycle_buffer, but
* sv won't go away for scd_rpc_active must not be empty
*/
srpc_service_recycle_buffer(scd, rpc->srpc_reqstbuf); srpc_service_recycle_buffer(scd, rpc->srpc_reqstbuf);
rpc->srpc_reqstbuf = NULL; rpc->srpc_reqstbuf = NULL;
} }
...@@ -1102,7 +1120,8 @@ srpc_add_client_rpc_timer(srpc_client_rpc_t *rpc) ...@@ -1102,7 +1120,8 @@ srpc_add_client_rpc_timer(srpc_client_rpc_t *rpc)
* Called with rpc->crpc_lock held. * Called with rpc->crpc_lock held.
* *
* Upon exit the RPC expiry timer is not queued and the handler is not * Upon exit the RPC expiry timer is not queued and the handler is not
* running on any CPU. */ * running on any CPU.
*/
static void static void
srpc_del_client_rpc_timer(srpc_client_rpc_t *rpc) srpc_del_client_rpc_timer(srpc_client_rpc_t *rpc)
{ {
...@@ -1210,9 +1229,11 @@ srpc_send_rpc(swi_workitem_t *wi) ...@@ -1210,9 +1229,11 @@ srpc_send_rpc(swi_workitem_t *wi)
break; break;
case SWI_STATE_REQUEST_SUBMITTED: case SWI_STATE_REQUEST_SUBMITTED:
/* CAVEAT EMPTOR: rqtev, rpyev, and bulkev may come in any /*
* CAVEAT EMPTOR: rqtev, rpyev, and bulkev may come in any
* order; however, they're processed in a strict order: * order; however, they're processed in a strict order:
* rqt, rpy, and bulk. */ * rqt, rpy, and bulk.
*/
if (!rpc->crpc_reqstev.ev_fired) if (!rpc->crpc_reqstev.ev_fired)
break; break;
...@@ -1259,10 +1280,12 @@ srpc_send_rpc(swi_workitem_t *wi) ...@@ -1259,10 +1280,12 @@ srpc_send_rpc(swi_workitem_t *wi)
rc = do_bulk ? rpc->crpc_bulkev.ev_status : 0; rc = do_bulk ? rpc->crpc_bulkev.ev_status : 0;
/* Bulk buffer was unlinked due to remote error. Clear error /*
* Bulk buffer was unlinked due to remote error. Clear error
* since reply buffer still contains valid data. * since reply buffer still contains valid data.
* NB rpc->crpc_done shouldn't look into bulk data in case of * NB rpc->crpc_done shouldn't look into bulk data in case of
* remote error. */ * remote error.
*/
if (do_bulk && rpc->crpc_bulkev.ev_lnet == LNET_EVENT_UNLINK && if (do_bulk && rpc->crpc_bulkev.ev_lnet == LNET_EVENT_UNLINK &&
rpc->crpc_status == 0 && reply->msg_body.reply.status != 0) rpc->crpc_status == 0 && reply->msg_body.reply.status != 0)
rc = 0; rc = 0;
...@@ -1364,8 +1387,10 @@ srpc_send_reply(struct srpc_server_rpc *rpc) ...@@ -1364,8 +1387,10 @@ srpc_send_reply(struct srpc_server_rpc *rpc)
spin_lock(&scd->scd_lock); spin_lock(&scd->scd_lock);
if (!sv->sv_shuttingdown && !srpc_serv_is_framework(sv)) { if (!sv->sv_shuttingdown && !srpc_serv_is_framework(sv)) {
/* Repost buffer before replying since test client /*
* might send me another RPC once it gets the reply */ * Repost buffer before replying since test client
* might send me another RPC once it gets the reply
*/
if (srpc_service_post_buffer(scd, buffer) != 0) if (srpc_service_post_buffer(scd, buffer) != 0)
CWARN("Failed to repost %s buffer\n", sv->sv_name); CWARN("Failed to repost %s buffer\n", sv->sv_name);
rpc->srpc_reqstbuf = NULL; rpc->srpc_reqstbuf = NULL;
...@@ -1472,8 +1497,10 @@ srpc_lnet_ev_handler(lnet_event_t *ev) ...@@ -1472,8 +1497,10 @@ srpc_lnet_ev_handler(lnet_event_t *ev)
scd->scd_buf_nposted--; scd->scd_buf_nposted--;
if (sv->sv_shuttingdown) { if (sv->sv_shuttingdown) {
/* Leave buffer on scd->scd_buf_nposted since /*
* srpc_finish_service needs to traverse it. */ * Leave buffer on scd->scd_buf_nposted since
* srpc_finish_service needs to traverse it.
*/
spin_unlock(&scd->scd_lock); spin_unlock(&scd->scd_lock);
break; break;
} }
...@@ -1507,9 +1534,11 @@ srpc_lnet_ev_handler(lnet_event_t *ev) ...@@ -1507,9 +1534,11 @@ srpc_lnet_ev_handler(lnet_event_t *ev)
ev->status, ev->mlength, ev->status, ev->mlength,
msg->msg_type, msg->msg_magic); msg->msg_type, msg->msg_magic);
/* NB can't call srpc_service_recycle_buffer here since /*
* NB can't call srpc_service_recycle_buffer here since
* it may call LNetM[DE]Attach. The invalid magic tells * it may call LNetM[DE]Attach. The invalid magic tells
* srpc_handle_rpc to drop this RPC */ * srpc_handle_rpc to drop this RPC
*/
msg->msg_magic = 0; msg->msg_magic = 0;
} }
......
...@@ -281,8 +281,10 @@ srpc_unpack_msg_hdr(srpc_msg_t *msg) ...@@ -281,8 +281,10 @@ srpc_unpack_msg_hdr(srpc_msg_t *msg)
if (msg->msg_magic == SRPC_MSG_MAGIC) if (msg->msg_magic == SRPC_MSG_MAGIC)
return; /* no flipping needed */ return; /* no flipping needed */
/* We do not swap the magic number here as it is needed to /*
determine whether the body needs to be swapped. */ * We do not swap the magic number here as it is needed to
* determine whether the body needs to be swapped.
*/
/* __swab32s(&msg->msg_magic); */ /* __swab32s(&msg->msg_magic); */
__swab32s(&msg->msg_type); __swab32s(&msg->msg_type);
__swab32s(&msg->msg_version); __swab32s(&msg->msg_version);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment