Pylons · djay · Sep 11, 2023 · Sep 12, 2023 · Sep 12, 2023 · Sep 14, 2023
diff --git a/src/waitress/channel.py b/src/waitress/channel.py
@@ -67,6 +67,9 @@ def __init__(self, server, sock, addr, adj, map=None):
         self.outbuf_lock = threading.Condition()
 
         wasyncore.dispatcher.__init__(self, sock, map=map)
+        if not self.connected:
+            # The peer can close the connection so quickly that getpeername fails.
+            self.handle_close()
 
         # Don't let wasyncore.dispatcher throttle self.addr on us.
         self.addr = addr
@@ -86,15 +89,15 @@ def writable(self):
         # the channel (possibly by our server maintenance logic), run
         # handle_write
 
-        return self.total_outbufs_len or self.will_close or self.close_when_flushed
+        return (self.total_outbufs_len or self.will_close or self.close_when_flushed)
 
     def handle_write(self):
         # Precondition: there's data in the out buffer to be sent, or
         # there's a pending will_close request
 
-        if not self.connected:
-            # we dont want to close the channel twice
-
+        if not self.connected and not (self.will_close or self.close_when_flushed):
+            # We don't want to close the channel twice,
+            # but we need to let the channel close if it's marked to close.
             return
 
         # try to flush any pending output
@@ -150,7 +153,6 @@ def readable(self):
         # 3. There are not too many tasks already queued
         # 4. There's no data in the output buffer that needs to be sent
         #    before we potentially create a new task.
-
         return not (
             self.will_close
             or self.close_when_flushed

diff --git a/tests/test_channel.py b/tests/test_channel.py
@@ -1,4 +1,6 @@
+from errno import EINVAL
 import io
+import socket
 import unittest
 
 import pytest
@@ -11,10 +13,10 @@ def _makeOne(self, sock, addr, adj, map=None):
         server = DummyServer()
         return HTTPChannel(server, sock, addr, adj=adj, map=map)
 
-    def _makeOneWithMap(self, adj=None):
+    def _makeOneWithMap(self, adj=None, sock_shutdown=False):
         if adj is None:
             adj = DummyAdjustments()
-        sock = DummySock()
+        sock = DummySock(shutdown=sock_shutdown)
         map = {}
         inst = self._makeOne(sock, "127.0.0.1", adj, map=map)
         inst.outbuf_lock = DummyLock()
@@ -906,8 +908,9 @@ class DummySock:
     blocking = False
     closed = False
 
-    def __init__(self):
+    def __init__(self, shutdown=False):
         self.sent = b""
+        self.shutdown = shutdown
 
     def setblocking(self, *arg):
         self.blocking = True
@@ -916,6 +919,8 @@ def fileno(self):
         return 100
 
     def getpeername(self):
+        if self.shutdown:
+            raise OSError(EINVAL)
         return "127.0.0.1"
 
     def getsockopt(self, level, option):

diff --git a/tests/test_server.py b/tests/test_server.py
@@ -1,5 +1,10 @@
 import errno
+import select
 import socket
+import struct
+from threading import Event
+from time import sleep
+import time
 import unittest
 
 dummy_app = object()
@@ -311,6 +316,103 @@ def test_create_with_one_socket_handle_accept_noerror(self):
         self.assertEqual(innersock.opts, [("level", "optname", "value")])
         self.assertEqual(L, [(inst, innersock, None, inst.adj)])
 
+    def test_quick_shutdown(self):
+        """Issue found in production that led to 100% CPU usage because getpeername failed after accept but before channel setup.
+        """
+        class DummyParser:
+            error = True  # We are simulating a header parsing error
+            version = 1
+            data = None
+            completed = True
+            empty = False
+            headers_finished = True
+            expect_continue = False
+            retval = None
+            connection_close = False
+
+            def __init__(self, adj):
+                pass
+
+            def received(self, data):
+                self.data = data
+                if self.retval is not None:
+                    return self.retval
+                return len(data)
+
+            def close(self):
+                pass
+
+        from waitress.channel import HTTPChannel
+        client = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
+        channel = None
+
+        class ShutdownChannel(HTTPChannel):
+            parser_class = DummyParser
+
+            def __init__(self, server, sock, addr, adj, map=None):
+                self.count_writes = self.count_close = self.count_wouldblock = 0
+                nonlocal channel
+                channel = self
+                client.close()  # simulate race condition where close happens between accept and getpeername
+                return HTTPChannel.__init__(self, server, sock, addr, adj, map)
+
+            def handle_write(self):
+                self.count_writes += 1
+                return HTTPChannel.handle_write(self)
+
+            def handle_close(self):
+                # import pdb; pdb.set_trace()
+                self.count_close += 1
+                return HTTPChannel.handle_close(self)
+
+        def server_run(count=1):
+            # Modified server run to prevent infinite loop
+            inst.asyncore.loop(
+                timeout=inst.adj.asyncore_loop_timeout,
+                map=inst._map,
+                use_poll=inst.adj.asyncore_use_poll,
+                count=count
+            )
+
+        sockets = [socket.socket(socket.AF_INET, socket.SOCK_STREAM)]
+        sockets[0].setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 0)
+        sockets[0].bind(("127.0.0.1", 8000))
+        sockets[0].listen()
+        inst = self._makeWithSockets(_start=False, sockets=sockets)
+        inst.channel_class = ShutdownChannel
+        inst.task_dispatcher = DummyTaskDispatcher()
+
+        # This will make getpeername fail fast with EINVAL OSError
+        client.setsockopt(socket.SOL_SOCKET, socket.SO_LINGER, struct.pack('ii', 1, 0))
+        client.connect(("127.0.0.1", 8000))
+        client.send(b"1")  # Send our fake request before we accept and close the connection
+        inst.handle_accept()  # ShutdownChannel will close the connection after accept but before getpeername
+        self.assertRaises(OSError, sockets[0].getpeername)
+        self.assertFalse(channel.connected, "race condition means our socket is marked not connected")
+        self.assertNotIn(channel, inst._map.values(), "we should get an automatic close")
+
+        # UNCOMMENT: To reproduce previous 100% CPU looping behaviour
+        # self.assertIn(channel, inst._map.values(), "broken request still active to get this bug")
+
+        # server_run(1)  # Read the request
+        # self.assertTrue(channel.requests[0].error, "for this bug we need the request to have a parsing error")
+        # server_run(5)  
+        # self.assertIn(channel, inst._map.values(), "our rchannel doesn't get read and closed")
+        # # channel_request_lookahead > 0 would avoid this bug
+        # self.assertTrue(len(channel.requests) > channel.adj.channel_request_lookahead, "channel_request_lookahead == 0 means we don't read the disconnect")
+        # # simulate thread processing the request
+        # channel.service()
+        # self.assertTrue(channel.close_when_flushed, "This prevents reads (which lead to close) and loops on handle_write (with 100% CPU)")
+        # server_run(5)  # Our loop
+        # self.assertEqual(channel.count_writes, 5, "We're supposed to be in a loop trying to write but can't")
+        # self.assertEqual(channel.count_close, 0, "but also this connection never gets closed")
+        # # But shouldn't maintenance clear this up?
+        # channel.last_activity = 0
+        # inst.maintenance(1000)
+        # self.assertEqual(channel.will_close, 1, "maintenance will try to close it")
+        # server_run(5)  # Our loop
+        # self.assertEqual(channel.count_writes, 10, "But we still get our loop")
+
 
 if hasattr(socket, "AF_UNIX"):