Commit 0ab71045 authored by Bharath Ravi's avatar Bharath Ravi Committed by Martin K. Petersen

scsi: iscsi: Perform connection failure entirely in kernel space

Connection failure processing depends on a daemon being present to (at
least) stop the connection and start recovery.  This is a problem on a
multipath scenario, where if the daemon failed for whatever reason, the
SCSI path is never marked as down, multipath won't perform the failover and
IO to the device will be forever waiting for that connection to come back.

This patch performs the connection failure entirely inside the kernel.
This way, the failover can happen and pending IO can continue even if the
daemon is dead. Once the daemon comes alive again, it can execute recovery
procedures if applicable.

Cc: Mike Christie <mchristi@redhat.com>
Cc: Lee Duncan <LDuncan@suse.com>
Cc: Bart Van Assche <bvanassche@acm.org>
Link: https://lore.kernel.org/r/20200125061925.191601-1-krisman@collabora.comCo-developed-by: default avatarDave Clausen <dclausen@google.com>
Co-developed-by: default avatarNick Black <nlb@google.com>
Co-developed-by: default avatarVaibhav Nagarnaik <vnagarnaik@google.com>
Co-developed-by: default avatarAnatol Pomazau <anatol@google.com>
Co-developed-by: default avatarTahsin Erdogan <tahsin@google.com>
Co-developed-by: default avatarFrank Mayhar <fmayhar@google.com>
Co-developed-by: default avatarJunho Ryu <jayr@google.com>
Co-developed-by: default avatarKhazhismel Kumykov <khazhy@google.com>
Reviewed-by: default avatarReviewed-by: Khazhismel Kumykov <khazhy@google.com>
Co-developed-by: default avatarGabriel Krisman Bertazi <krisman@collabora.com>
Reviewed-by: default avatarLee Duncan <lduncan@suse.com>
Signed-off-by: default avatarBharath Ravi <rbharath@google.com>
Signed-off-by: default avatarDave Clausen <dclausen@google.com>
Signed-off-by: default avatarNick Black <nlb@google.com>
Signed-off-by: default avatarVaibhav Nagarnaik <vnagarnaik@google.com>
Signed-off-by: default avatarAnatol Pomazau <anatol@google.com>
Signed-off-by: default avatarTahsin Erdogan <tahsin@google.com>
Signed-off-by: default avatarFrank Mayhar <fmayhar@google.com>
Signed-off-by: default avatarJunho Ryu <jayr@google.com>
Signed-off-by: default avatarKhazhismel Kumykov <khazhy@google.com>
Signed-off-by: default avatarGabriel Krisman Bertazi <krisman@collabora.com>
Signed-off-by: default avatarMartin K. Petersen <martin.petersen@oracle.com>
parent 80363e1b
...@@ -86,6 +86,12 @@ struct iscsi_internal { ...@@ -86,6 +86,12 @@ struct iscsi_internal {
struct transport_container session_cont; struct transport_container session_cont;
}; };
/* Worker to perform connection failure on unresponsive connections
* completely in kernel space.
*/
static void stop_conn_work_fn(struct work_struct *work);
static DECLARE_WORK(stop_conn_work, stop_conn_work_fn);
static atomic_t iscsi_session_nr; /* sysfs session id for next new session */ static atomic_t iscsi_session_nr; /* sysfs session id for next new session */
static struct workqueue_struct *iscsi_eh_timer_workq; static struct workqueue_struct *iscsi_eh_timer_workq;
...@@ -1611,6 +1617,7 @@ static DEFINE_MUTEX(rx_queue_mutex); ...@@ -1611,6 +1617,7 @@ static DEFINE_MUTEX(rx_queue_mutex);
static LIST_HEAD(sesslist); static LIST_HEAD(sesslist);
static DEFINE_SPINLOCK(sesslock); static DEFINE_SPINLOCK(sesslock);
static LIST_HEAD(connlist); static LIST_HEAD(connlist);
static LIST_HEAD(connlist_err);
static DEFINE_SPINLOCK(connlock); static DEFINE_SPINLOCK(connlock);
static uint32_t iscsi_conn_get_sid(struct iscsi_cls_conn *conn) static uint32_t iscsi_conn_get_sid(struct iscsi_cls_conn *conn)
...@@ -2254,6 +2261,7 @@ iscsi_create_conn(struct iscsi_cls_session *session, int dd_size, uint32_t cid) ...@@ -2254,6 +2261,7 @@ iscsi_create_conn(struct iscsi_cls_session *session, int dd_size, uint32_t cid)
mutex_init(&conn->ep_mutex); mutex_init(&conn->ep_mutex);
INIT_LIST_HEAD(&conn->conn_list); INIT_LIST_HEAD(&conn->conn_list);
INIT_LIST_HEAD(&conn->conn_list_err);
conn->transport = transport; conn->transport = transport;
conn->cid = cid; conn->cid = cid;
...@@ -2307,6 +2315,7 @@ int iscsi_destroy_conn(struct iscsi_cls_conn *conn) ...@@ -2307,6 +2315,7 @@ int iscsi_destroy_conn(struct iscsi_cls_conn *conn)
spin_lock_irqsave(&connlock, flags); spin_lock_irqsave(&connlock, flags);
list_del(&conn->conn_list); list_del(&conn->conn_list);
list_del(&conn->conn_list_err);
spin_unlock_irqrestore(&connlock, flags); spin_unlock_irqrestore(&connlock, flags);
transport_unregister_device(&conn->dev); transport_unregister_device(&conn->dev);
...@@ -2421,6 +2430,51 @@ int iscsi_offload_mesg(struct Scsi_Host *shost, ...@@ -2421,6 +2430,51 @@ int iscsi_offload_mesg(struct Scsi_Host *shost,
} }
EXPORT_SYMBOL_GPL(iscsi_offload_mesg); EXPORT_SYMBOL_GPL(iscsi_offload_mesg);
static void stop_conn_work_fn(struct work_struct *work)
{
struct iscsi_cls_conn *conn, *tmp;
unsigned long flags;
LIST_HEAD(recovery_list);
spin_lock_irqsave(&connlock, flags);
if (list_empty(&connlist_err)) {
spin_unlock_irqrestore(&connlock, flags);
return;
}
list_splice_init(&connlist_err, &recovery_list);
spin_unlock_irqrestore(&connlock, flags);
list_for_each_entry_safe(conn, tmp, &recovery_list, conn_list_err) {
uint32_t sid = iscsi_conn_get_sid(conn);
struct iscsi_cls_session *session;
mutex_lock(&rx_queue_mutex);
session = iscsi_session_lookup(sid);
if (session) {
if (system_state != SYSTEM_RUNNING) {
session->recovery_tmo = 0;
conn->transport->stop_conn(conn,
STOP_CONN_TERM);
} else {
conn->transport->stop_conn(conn,
STOP_CONN_RECOVER);
}
}
list_del_init(&conn->conn_list_err);
mutex_unlock(&rx_queue_mutex);
/* we don't want to hold rx_queue_mutex for too long,
* for instance if many conns failed at the same time,
* since this stall other iscsi maintenance operations.
* Give other users a chance to proceed.
*/
cond_resched();
}
}
void iscsi_conn_error_event(struct iscsi_cls_conn *conn, enum iscsi_err error) void iscsi_conn_error_event(struct iscsi_cls_conn *conn, enum iscsi_err error)
{ {
struct nlmsghdr *nlh; struct nlmsghdr *nlh;
...@@ -2428,6 +2482,12 @@ void iscsi_conn_error_event(struct iscsi_cls_conn *conn, enum iscsi_err error) ...@@ -2428,6 +2482,12 @@ void iscsi_conn_error_event(struct iscsi_cls_conn *conn, enum iscsi_err error)
struct iscsi_uevent *ev; struct iscsi_uevent *ev;
struct iscsi_internal *priv; struct iscsi_internal *priv;
int len = nlmsg_total_size(sizeof(*ev)); int len = nlmsg_total_size(sizeof(*ev));
unsigned long flags;
spin_lock_irqsave(&connlock, flags);
list_add(&conn->conn_list_err, &connlist_err);
spin_unlock_irqrestore(&connlock, flags);
queue_work(system_unbound_wq, &stop_conn_work);
priv = iscsi_if_transport_lookup(conn->transport); priv = iscsi_if_transport_lookup(conn->transport);
if (!priv) if (!priv)
...@@ -2757,11 +2817,19 @@ static int ...@@ -2757,11 +2817,19 @@ static int
iscsi_if_destroy_conn(struct iscsi_transport *transport, struct iscsi_uevent *ev) iscsi_if_destroy_conn(struct iscsi_transport *transport, struct iscsi_uevent *ev)
{ {
struct iscsi_cls_conn *conn; struct iscsi_cls_conn *conn;
unsigned long flags;
conn = iscsi_conn_lookup(ev->u.d_conn.sid, ev->u.d_conn.cid); conn = iscsi_conn_lookup(ev->u.d_conn.sid, ev->u.d_conn.cid);
if (!conn) if (!conn)
return -EINVAL; return -EINVAL;
spin_lock_irqsave(&connlock, flags);
if (!list_empty(&conn->conn_list_err)) {
spin_unlock_irqrestore(&connlock, flags);
return -EAGAIN;
}
spin_unlock_irqrestore(&connlock, flags);
ISCSI_DBG_TRANS_CONN(conn, "Destroying transport conn\n"); ISCSI_DBG_TRANS_CONN(conn, "Destroying transport conn\n");
if (transport->destroy_conn) if (transport->destroy_conn)
transport->destroy_conn(conn); transport->destroy_conn(conn);
......
...@@ -190,6 +190,7 @@ extern void iscsi_ping_comp_event(uint32_t host_no, ...@@ -190,6 +190,7 @@ extern void iscsi_ping_comp_event(uint32_t host_no,
struct iscsi_cls_conn { struct iscsi_cls_conn {
struct list_head conn_list; /* item in connlist */ struct list_head conn_list; /* item in connlist */
struct list_head conn_list_err; /* item in connlist_err */
void *dd_data; /* LLD private data */ void *dd_data; /* LLD private data */
struct iscsi_transport *transport; struct iscsi_transport *transport;
uint32_t cid; /* connection id */ uint32_t cid; /* connection id */
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment