[PATCH] iseries_veth: Try to avoid pathological reset behaviour

author Michael Ellerman <michael@ellerman.id.au>

Thu, 1 Sep 2005 01:29:00 +0000 (11:29 +1000)

committer Jeff Garzik <jgarzik@pobox.com>

Thu, 1 Sep 2005 02:37:56 +0000 (22:37 -0400)
author Michael Ellerman <michael@ellerman.id.au>
Thu, 1 Sep 2005 01:29:00 +0000 (11:29 +1000)
committer Jeff Garzik <jgarzik@pobox.com>
Thu, 1 Sep 2005 02:37:56 +0000 (22:37 -0400)
diff --git a/drivers/net/iseries_veth.c b/drivers/net/iseries_veth.c

index c19b32e0a5ad71fcfaf7075584e8b8c265e706ea..db83b0d313271e59a662b2304896dad46af0cd50 100644 (file)
--- a/drivers/net/iseries_veth.c
+++ b/drivers/net/iseries_veth.c
@@ -324,8 +324,14 @@ static void veth_take_monitor_ack(struct veth_lpar_connection *cnx,
  
         spin_lock_irqsave(&cnx->lock, flags);
         veth_debug("cnx %d: lost connection.\n", cnx->remote_lp);
-       cnx->state |= VETH_STATE_RESET;
-       veth_kick_statemachine(cnx);
+
+       /* Avoid kicking the statemachine once we've shut down.
+        * It's unnecessary and it could break veth_stop_connection(). */
+
+       if (! (cnx->state & VETH_STATE_SHUTDOWN)) {
+               cnx->state |= VETH_STATE_RESET;
+               veth_kick_statemachine(cnx);
+       }
         spin_unlock_irqrestore(&cnx->lock, flags);
  }
  
@@ -483,6 +489,12 @@ static void veth_statemachine(void *p)
  
                 if (cnx->state & VETH_STATE_RESET)
                         goto restart;
+
+               /* Hack: wait five seconds for the other end to reset itself. */
+               if (! (cnx->state & VETH_STATE_SHUTDOWN)) {
+                       schedule_delayed_work(&cnx->statemachine_wq, 5 * HZ);
+                       goto out;
+               }
         }
  
         if (cnx->state & VETH_STATE_SHUTDOWN)
@@ -667,6 +679,15 @@ static void veth_stop_connection(u8 rlp)
         veth_kick_statemachine(cnx);
         spin_unlock_irq(&cnx->lock);
  
+       /* There's a slim chance the reset code has just queued the
+        * statemachine to run in five seconds. If so we need to cancel
+        * that and requeue the work to run now. */
+       if (cancel_delayed_work(&cnx->statemachine_wq)) {
+               spin_lock_irq(&cnx->lock);
+               veth_kick_statemachine(cnx);
+               spin_unlock_irq(&cnx->lock);
+       }
+
         /* Wait for the state machine to run. */
         flush_scheduled_work();
author	Michael Ellerman <michael@ellerman.id.au>
	Thu, 1 Sep 2005 01:29:00 +0000 (11:29 +1000)
committer	Jeff Garzik <jgarzik@pobox.com>
	Thu, 1 Sep 2005 02:37:56 +0000 (22:37 -0400)