python tornado TCPserver异步协程实例
项目所用知识点
- tornado
- socket
- tcpserver
- 协程
- 异步
tornado tcpserver源码剖析
在 tornado 的 tcpserver 模块中,实现了 TCPServer 这个类,它是一个单线程、非阻塞的 TCP 服务器。
为了与上层协议(在 tornado 中就是 HTTPServer)交互,TCPServer 提供了一个接口:handle_stream,要求其子类必须实现该方法,该方法主要用来处理应用层逻辑。
我们可以通过下面的代码导入模块并查看源码
from tornado.tcpserver import TCPServer
源码中给了好多解释,先把源码注释贴进来
class TCPServer(object):
    # Article author's reading notes on the docstring below:
    # 1. To use TCPServer, subclass it and implement the ``handle_stream``
    #    hook; the subclass must provide this method.
    # 2. The docstring already contains a complete echo-server example.
    # 3. It then describes several ways to start the server; this article
    #    uses ``listen()``, which is the simplest to read.
    r"""A non-blocking, single-threaded TCP server.

    To use `TCPServer`, define a subclass which overrides the `handle_stream`
    method. For example, a simple echo server could be defined like this::

      from tornado.tcpserver import TCPServer
      from tornado.iostream import StreamClosedError
      from tornado import gen

      class EchoServer(TCPServer):
          @gen.coroutine
          def handle_stream(self, stream, address):
              while True:
                  try:
                      data = yield stream.read_until(b"\n")
                      yield stream.write(data)
                  except StreamClosedError:
                      break

    To make this server serve SSL traffic, send the ``ssl_options`` keyword
    argument with an `ssl.SSLContext` object. For compatibility with older
    versions of Python ``ssl_options`` may also be a dictionary of keyword
    arguments for the `ssl.wrap_socket` method.::

       ssl_ctx = ssl.create_default_context(ssl.Purpose.CLIENT_AUTH)
       ssl_ctx.load_cert_chain(os.path.join(data_dir, "mydomain.crt"),
                               os.path.join(data_dir, "mydomain.key"))
       TCPServer(ssl_options=ssl_ctx)

    `TCPServer` initialization follows one of three patterns:

    1. `listen`: simple single-process::

            server = TCPServer()
            server.listen(8888)
            IOLoop.current().start()

    2. `bind`/`start`: simple multi-process::

            server = TCPServer()
            server.bind(8888)
            server.start(0)  # Forks multiple sub-processes
            IOLoop.current().start()

       When using this interface, an `.IOLoop` must *not* be passed
       to the `TCPServer` constructor.  `start` will always start
       the server on the default singleton `.IOLoop`.

    3. `add_sockets`: advanced multi-process::

            sockets = bind_sockets(8888)
            tornado.process.fork_processes(0)
            server = TCPServer()
            server.add_sockets(sockets)
            IOLoop.current().start()

       The `add_sockets` interface is more complicated, but it can be
       used with `tornado.process.fork_processes` to give you more
       flexibility in when the fork happens.  `add_sockets` can
       also be used in single-process servers if you want to create
       your listening sockets in some way other than
       `~tornado.netutil.bind_sockets`.

    .. versionadded:: 3.1
       The ``max_buffer_size`` argument.

    .. versionchanged:: 5.0
       The ``io_loop`` argument has been removed.
    """
自己仔细看该类的其他方法
def listen(self, port, address=""):
    """Starts accepting connections on the given port.

    This method may be called more than once to listen on multiple ports.
    `listen` takes effect immediately; it is not necessary to call
    `TCPServer.start` afterwards.  It is, however, necessary to start
    the `.IOLoop`.
    """
    sockets = bind_sockets(port, address=address)
    self.add_sockets(sockets)

def add_sockets(self, sockets):
    """Makes this server start accepting connections on the given sockets.

    The ``sockets`` parameter is a list of socket objects such as
    those returned by `~tornado.netutil.bind_sockets`.
    `add_sockets` is typically used in combination with that
    method and `tornado.process.fork_processes` to provide greater
    control over the initialization of a multi-process server.
    """
    for sock in sockets:
        self._sockets[sock.fileno()] = sock
        # Keep what add_accept_handler returns, keyed by fd; stop() later
        # pops and calls it to unregister the socket.
        self._handlers[sock.fileno()] = add_accept_handler(
            sock, self._handle_connection)

def add_socket(self, socket):
    """Singular version of `add_sockets`.  Takes a single socket object."""
    self.add_sockets([socket])

def bind(self, port, address=None, family=socket.AF_UNSPEC, backlog=128,
         reuse_port=False):
    """Binds this server to the given port on the given address.

    To start the server, call `start`. If you want to run this server
    in a single process, you can call `listen` as a shortcut to the
    sequence of `bind` and `start` calls.

    Address may be either an IP address or hostname.  If it's a hostname,
    the server will listen on all IP addresses associated with the
    name.  Address may be an empty string or None to listen on all
    available interfaces.  Family may be set to either `socket.AF_INET`
    or `socket.AF_INET6` to restrict to IPv4 or IPv6 addresses, otherwise
    both will be used if available.

    The ``backlog`` argument has the same meaning as for
    `socket.listen <socket.socket.listen>`. The ``reuse_port`` argument
    has the same meaning as for `.bind_sockets`.

    This method may be called multiple times prior to `start` to listen
    on multiple ports or interfaces.

    .. versionchanged:: 4.4
       Added the ``reuse_port`` argument.
    """
    sockets = bind_sockets(port, address=address, family=family,
                           backlog=backlog, reuse_port=reuse_port)
    if self._started:
        self.add_sockets(sockets)
    else:
        # Not started yet: park the sockets until start() registers them.
        self._pending_sockets.extend(sockets)

def start(self, num_processes=1):
    """Starts this server in the `.IOLoop`.

    By default, we run the server in this process and do not fork any
    additional child process.

    If num_processes is ``None`` or <= 0, we detect the number of cores
    available on this machine and fork that number of child
    processes. If num_processes is given and > 1, we fork that
    specific number of sub-processes.

    Since we use processes and not threads, there is no shared memory
    between any server code.

    Note that multiple processes are not compatible with the autoreload
    module (or the ``autoreload=True`` option to `tornado.web.Application`
    which defaults to True when ``debug=True``).
    When using multiple processes, no IOLoops can be created or
    referenced until after the call to ``TCPServer.start(n)``.
    """
    assert not self._started
    self._started = True
    if num_processes != 1:
        process.fork_processes(num_processes)
    sockets = self._pending_sockets
    self._pending_sockets = []
    self.add_sockets(sockets)

def stop(self):
    """Stops listening for new connections.

    Requests currently in progress may still continue after the
    server is stopped.
    """
    if self._stopped:
        return
    self._stopped = True
    for fd, sock in self._sockets.items():
        assert sock.fileno() == fd
        # Unregister socket from IOLoop
        self._handlers.pop(fd)()
        sock.close()

def handle_stream(self, stream, address):
    """Override to handle a new `.IOStream` from an incoming connection.

    This method may be a coroutine; if so any exceptions it raises
    asynchronously will be logged. Accepting of incoming connections
    will not be blocked by this coroutine.

    If this `TCPServer` is configured for SSL, ``handle_stream``
    may be called before the SSL handshake has completed. Use
    `.SSLIOStream.wait_for_handshake` if you need to verify the client's
    certificate or use NPN/ALPN.

    .. versionchanged:: 4.2
       Added the option for this method to be a coroutine.
    """
    raise NotImplementedError()

def _handle_connection(self, connection, address):
    """Wrap an accepted connection in a stream and pass it to `handle_stream`.

    When ``self.ssl_options`` is set the connection is first wrapped with
    ``ssl_wrap_socket`` and an `SSLIOStream` is created; otherwise a plain
    `IOStream` is used.  Any exception raised while creating the stream or
    calling `handle_stream` is logged through ``app_log`` rather than
    propagated.
    """
    if self.ssl_options is not None:
        assert ssl, "Python 2.6+ and OpenSSL required for SSL"
        try:
            connection = ssl_wrap_socket(connection,
                                         self.ssl_options,
                                         server_side=True,
                                         do_handshake_on_connect=False)
        except ssl.SSLError as err:
            if err.args[0] == ssl.SSL_ERROR_EOF:
                return connection.close()
            else:
                raise
        except socket.error as err:
            # If the connection is closed immediately after it is created
            # (as in a port scan), we can get one of several errors.
            # wrap_socket makes an internal call to getpeername,
            # which may return either EINVAL (Mac OS X) or ENOTCONN
            # (Linux).  If it returns ENOTCONN, this error is
            # silently swallowed by the ssl module, so we need to
            # catch another error later on (AttributeError in
            # SSLIOStream._do_ssl_handshake).
            # To test this behavior, try nmap with the -sT flag.
            # https://github.com/tornadoweb/tornado/pull/750
            if errno_from_exception(err) in (errno.ECONNABORTED, errno.EINVAL):
                return connection.close()
            else:
                raise
    try:
        if self.ssl_options is not None:
            stream = SSLIOStream(connection,
                                 max_buffer_size=self.max_buffer_size,
                                 read_chunk_size=self.read_chunk_size)
        else:
            stream = IOStream(connection,
                              max_buffer_size=self.max_buffer_size,
                              read_chunk_size=self.read_chunk_size)

        future = self.handle_stream(stream, address)
        if future is not None:
            # handle_stream returned something yieldable (e.g. a coroutine's
            # future): ask for its result when it completes so a failure is
            # surfaced instead of being silently dropped.
            IOLoop.current().add_future(gen.convert_yielded(future),
                                        lambda f: f.result())
    except Exception:
        app_log.error("Error in connection callback", exc_info=True)
通过方法名就能看出来,而且开头已经给出实例怎么去用,所以这个就不一一解释了,我自己的用法如下
from tornado.tcpserver import TCPServer
from tornado.iostream import IOStream, StreamClosedError
from tornado import gen
from tornado.ioloop import IOLoop
import struct


class ProxyServer(TCPServer):
    """Minimal TCPServer subclass used as the starting skeleton."""

    def __init__(self, *args, **kwargs):
        super(ProxyServer, self).__init__(*args, **kwargs)
        # Registry for connected devices; nothing in this skeleton fills it.
        self.devices = {}

    @gen.coroutine
    def handle_stream(self, stream, address):
        """Placeholder connection handler: accepts the stream and does nothing."""
        return


if __name__ == "__main__":
    # Single-process start-up: listen on port 1234, then run the IOLoop.
    server = ProxyServer()
    server.listen(1234)
    IOLoop.current().start()
下面按具体步骤来分析一下
TCPServer执行过程
1. server = ProxyServer() 创建 TCPServer 对象,该步骤仅仅做了初始化操作(注意:下面贴出的 __init__ 仍带有 io_loop 参数,而上文类注释中写明 5.0 起已移除 io_loop 参数,两处并不是同一个版本的源码)
def __init__(self, io_loop=None, ssl_options=None, max_buffer_size=None,
             read_chunk_size=None):
    """Store the server configuration and validate dict-style SSL options.

    All four arguments are stored on the instance unchanged.  When
    ``ssl_options`` is a dict it must contain ``certfile``, and the
    ``certfile`` (and ``keyfile`` if given) paths must exist.

    Raises:
        KeyError: ``ssl_options`` is a dict without a ``certfile`` key.
        ValueError: the ``certfile`` or ``keyfile`` path does not exist.
    """
    self.io_loop = io_loop
    self.ssl_options = ssl_options
    self._sockets = {}  # fd -> socket object: maps file descriptors to their sockets
    self._pending_sockets = []
    self._started = False
    self.max_buffer_size = max_buffer_size  # maximum buffer length
    self.read_chunk_size = read_chunk_size  # size of the chunk read each time
    # Validate the ssl options.
    if self.ssl_options is not None and isinstance(self.ssl_options, dict):
        if 'certfile' not in self.ssl_options:
            raise KeyError('missing key "certfile" in ssl_options')
        if not os.path.exists(self.ssl_options['certfile']):
            raise ValueError('certfile "%s" does not exist' %
                             self.ssl_options['certfile'])
        if ('keyfile' in self.ssl_options and
                not os.path.exists(self.ssl_options['keyfile'])):
            raise ValueError('keyfile "%s" does not exist' %
                             self.ssl_options['keyfile'])
2.想都不要想肯定是开启socket
步骤是执行server.listen(1234)的时候,
def listen(self, port, address=""):
    """Starts accepting connections on the given port.

    This method may be called more than once to listen on multiple ports.
    `listen` takes effect immediately; it is not necessary to call
    `TCPServer.start` afterwards.  It is, however, necessary to start
    the `.IOLoop`.

    ``port`` and ``address`` are forwarded unchanged to `bind_sockets`;
    the sockets it returns are handed to `add_sockets`.
    """
    sockets = bind_sockets(port, address=address)
    self.add_sockets(sockets)
3.看下listen里面有调用bind_sockets()方法,来看下该方法
def bind_sockets(port, address=None, family=socket.AF_UNSPEC,
                 backlog=_DEFAULT_BACKLOG, flags=None, reuse_port=False):
    """Create non-blocking listening sockets bound to ``port``.

    One socket is created for every distinct result that
    ``socket.getaddrinfo`` returns for ``address``/``port``; each is bound,
    put into listening state with ``backlog`` and collected in the returned
    list.  An empty-string ``address`` is treated as ``None``.  ``flags``
    defaults to ``socket.AI_PASSIVE``.

    Raises:
        ValueError: ``reuse_port`` is true but the ``socket`` module has no
            ``SO_REUSEPORT``.
    """
    if reuse_port and not hasattr(socket, "SO_REUSEPORT"):
        raise ValueError("the platform doesn't support SO_REUSEPORT")

    sockets = []
    if address == "":
        address = None
    # The address family tells getaddrinfo which kind of socket address
    # structure the caller expects back.  It takes one of four values:
    # AF_UNIX, AF_INET, AF_INET6 and AF_UNSPEC.
    # AF_UNIX is used for inter-process communication on a single machine.
    # With AF_INET no IPv6 address information can be returned; with only
    # AF_INET6 no IPv4 address information can be returned.
    # AF_UNSPEC means the call returns addresses of any protocol family that
    # suit the given host name and service name.
    # If a host has both AAAA (IPv6) and A (IPv4) records, the AAAA records
    # come back as sockaddr_in6 structures and the A records as sockaddr_in.
    if not socket.has_ipv6 and family == socket.AF_UNSPEC:  # the system has no IPv6 support
        family = socket.AF_INET
    if flags is None:
        flags = socket.AI_PASSIVE
    bound_port = None
    for res in set(socket.getaddrinfo(address, port, family, socket.SOCK_STREAM,
                                      0, flags)):
        af, socktype, proto, canonname, sockaddr = res
        if (sys.platform == 'darwin' and address == 'localhost' and
                af == socket.AF_INET6 and sockaddr[3] != 0):
            # Mac OS X includes a link-local address fe80::1%lo0 in the
            # getaddrinfo results for "localhost".  However, the firewall
            # does not understand that this is a local address and will
            # prompt for access, so skip these addresses.
            continue
        try:
            sock = socket.socket(af, socktype, proto)
        except socket.error as e:
            # The address family is not supported: skip this result.
            if errno_from_exception(e) == errno.EAFNOSUPPORT:
                continue
            raise
        # Set the FD_CLOEXEC flag on the fd.
        set_close_exec(sock.fileno())
        if os.name != 'nt':  # not Windows
            sock.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEADDR, 1)
        if reuse_port:
            sock.setsockopt(socket.SOL_SOCKET, socket.SO_REUSEPORT, 1)
        if af == socket.AF_INET6:
            # On linux, ipv6 sockets accept ipv4 too by default,
            # but this makes it impossible to bind to both
            # 0.0.0.0 in ipv4 and :: in ipv6.  On other systems,
            # separate sockets *must* be used to listen for both ipv4
            # and ipv6.  For consistency, always disable ipv4 on our
            # ipv6 sockets and use a separate ipv4 socket when needed.
            #
            # Python 2.x on windows doesn't have IPPROTO_IPV6.
            if hasattr(socket, "IPPROTO_IPV6"):
                sock.setsockopt(socket.IPPROTO_IPV6, socket.IPV6_V6ONLY, 1)

        # Automatic port allocation with port=None should bind the same
        # port on the IPv4 and IPv6 addresses: once one socket has been
        # given a port, reuse it for every later result that asked for 0.
        host, requested_port = sockaddr[:2]
        if requested_port == 0 and bound_port is not None:
            sockaddr = tuple([host, bound_port] + list(sockaddr[2:]))
        # Put the socket into non-blocking mode.
        sock.setblocking(0)
        sock.bind(sockaddr)
        bound_port = sock.getsockname()[1]
        sock.listen(backlog)
        sockets.append(sock)
    return sockets
4.接下来执行的是add_sockets()方法
def add_sockets(self, sockets):
    """Register every socket in ``sockets`` with this server.

    Each socket is recorded in ``self._sockets`` under its file descriptor
    and passed to `add_accept_handler` with ``self._handle_connection`` as
    the callback.
    """
    if self.io_loop is None:
        self.io_loop = IOLoop.current()  # fall back to the current IOLoop instance
    for sock in sockets:
        self._sockets[sock.fileno()] = sock
        add_accept_handler(sock, self._handle_connection,
                           io_loop=self.io_loop)
可以看到里面调用了add_accept_handler方法,来我们进去看看该方法干啥了
5.探析add_accept_handler方法
def add_accept_handler(sock, callback, io_loop=None):
    """Register a READ handler on ``sock`` that accepts new connections.

    Each accepted connection is passed to ``callback(connection, address)``.
    ``io_loop`` defaults to ``IOLoop.current()``.
    """
    if io_loop is None:  # fall back to the current IOLoop instance
        io_loop = IOLoop.current()

    def accept_handler(fd, events):
        # More connections may come in while we're handling callbacks;
        # to prevent starvation of other tasks we must limit the number
        # of connections we accept at a time.  Ideally we would accept
        # up to the number of connections that were waiting when we
        # entered this method, but that could have adverse effects on
        # load.  Instead, we use the listen backlog as a rough heuristic
        # for the number of connections we can reasonably accept at once.
        for i in xrange(_DEFAULT_BACKLOG):  # the original note gives _DEFAULT_BACKLOG as 128
            try:
                connection, address = sock.accept()
            except socket.error as e:
                # _ERRNO_WOULDBLOCK is equivalent to EAGAIN ("try again"),
                # often seen when resources are short or a condition is not
                # yet met.  Per the original note, it also occurs when one
                # child process has already taken the connection and another
                # child then tries to accept it.  Nothing is left to accept,
                # so stop for this event.
                if errno_from_exception(e) in _ERRNO_WOULDBLOCK:
                    return
                # ECONNABORTED means a connection was closed by the peer
                # while it was still waiting to be accepted; move on to the
                # next one.
                if errno_from_exception(e) == errno.ECONNABORTED:
                    continue
                raise
            callback(connection, address)
    io_loop.add_handler(sock, accept_handler, IOLoop.READ)  # run accept_handler whenever a READ event fires on the socket
欣欣然我们来到了最后一步
6. IOLoop.current().start(),让我们看下源码
def start(self):
    """Run the event loop until ``self._running`` becomes false (abridged).

    Each iteration runs the queued callbacks and due timeouts, polls for
    I/O events and dispatches every event to the handler registered for its
    file descriptor.  Several parts of the loop are elided in this excerpt
    and marked as such below.
    """
    try:
        while True:
            # Swap the queue out first so callbacks scheduled while running
            # land in the fresh list.
            callbacks = self._callbacks
            self._callbacks = []
            due_timeouts = []
            # Timeouts whose deadline has passed are moved into
            # due_timeouts here (omitted in this excerpt).
            for callback in callbacks:
                # Run the callback.
                self._run_callback(callback)
            for timeout in due_timeouts:
                # Run the timed task.
                if timeout.callback is not None:
                    self._run_callback(timeout.callback)
            # Drop the references so the memory can be released.
            callbacks = callback = due_timeouts = timeout = None
            # poll_timeout is chosen here depending on the situation
            # (omitted in this excerpt).
            if not self._running:
                # When the IOLoop is being stopped, leave the loop only
                # after the callbacks above have run.
                break
            try:
                event_pairs = self._impl.poll(poll_timeout)
            except Exception as e:
                if errno_from_exception(e) == errno.EINTR:
                    # The system call was interrupted by a signal handler;
                    # go on to the next iteration.
                    continue
                else:
                    raise
            self._events.update(event_pairs)
            while self._events:
                # Take one fd together with its pending events.
                fd, events = self._events.popitem()
                try:
                    # Look up the handler registered for this fd and run it.
                    fd_obj, handler_func = self._handlers[fd]
                    handler_func(fd_obj, events)
                except (OSError, IOError) as e:
                    if errno_from_exception(e) == errno.EPIPE:
                        # EPIPE is raised when the client closes the
                        # connection.
                        pass
                    # Handling of other errors is omitted in this excerpt.
            # Drop the references so the memory can be released.
            fd_obj = handler_func = None
    finally:
        # NOTE(review): the excerpt leaves out the clause that closes the
        # outer ``try``; this no-op keeps the snippet syntactically valid.
        # Restore the real cleanup from the Tornado source if it is needed.
        pass
想进一步了解这一步,可以参考这篇文章:http://www.cnblogs.com/MnCu8261/p/6730691.html
代码实例
目前公司有这么一个需求:iphonex -- server -- ue4。server 同时面对两个客户端,要把 iphonex 发来的数据转发给 ue4,也就是说 server 起代理作用。需求大概就是这样,具体实现代码如下:
from tornado.tcpserver import TCPServer
from tornado.iostream import IOStream, StreamClosedError
from tornado import gen
from tornado.ioloop import IOLoop
import struct


class ProxyServer(TCPServer):
    """Relay fixed-size float frames from an iPhone X client to a UE4 client.

    Wire protocol, as implemented below:

    * The first byte identifies the client: ``0x0a`` is the iPhone X
      (producer), ``0x0b`` is UE4 (consumer).  Anything else is rejected and
      the connection is closed.
    * The server acknowledges each handshake step with ``0x00`` and rejects
      with ``0x01``.
    * Text fields (uuid, keys) are sent as a 4-byte big-endian unsigned
      length followed by that many encoded bytes.
    * After the handshake the producer sends frames of ``len(keys)`` floats
      (``keys`` is a comma-separated list); every frame is forwarded
      unchanged to the consumer registered under the same uuid.

    ``self.devices`` maps a uuid to ``{'keys': str, 'ue4': stream-or-None}``
    for every producer that is currently connected.
    """

    # Upper bound for a length-prefixed text field.  The length comes from
    # the network, so without a cap a client could make the server try to
    # buffer up to 4 GiB per field.
    MAX_FIELD_SIZE = 64 * 1024

    def __init__(self, *args, **kwargs):
        super(ProxyServer, self).__init__(*args, **kwargs)
        self.devices = dict()

    @gen.coroutine
    def handle_stream(self, stream, address):
        """Dispatch a new connection according to its first byte.

        The sub-handlers are yielded so that their exceptions propagate to
        this coroutine (and from there to TCPServer, which logs them)
        instead of being lost in a future nobody looks at.
        """
        try:
            device = yield stream.read_bytes(1)
            if device == b"\x0a":
                yield self.handle_iphonex_stream(stream, address)
            elif device == b"\x0b":
                yield self.handle_ue4_stream(stream, address)
            else:
                print("protocol error.")
                stream.close()
        except StreamClosedError:
            # The peer hung up in the middle of the handshake; that is a
            # normal event, not an error worth a traceback.
            print('connection from %s closed' % (address,))
        except Exception:
            # Malformed input (oversized field, undecodable text, ...):
            # do not leave the socket open, then let TCPServer log it.
            stream.close()
            raise

    @gen.coroutine
    def _read_text(self, stream):
        """Read one length-prefixed text field from ``stream``.

        Returns the decoded string.  Raises ValueError when the announced
        length exceeds ``MAX_FIELD_SIZE``.
        """
        header = yield stream.read_bytes(4)
        size = struct.unpack(">I", header)[0]
        if size > self.MAX_FIELD_SIZE:
            raise ValueError(
                "length-prefixed field too large: %d bytes" % size)
        payload = yield stream.read_bytes(size)
        raise gen.Return(payload.decode())

    @gen.coroutine
    def handle_iphonex_stream(self, stream, address):
        """Register a producer and forward its frames until it disconnects."""
        yield stream.write(b"\x00")
        print("iphonex")
        # uuid
        uuid = yield self._read_text(stream)
        yield stream.write(b"\x00")
        print(uuid)
        # keys
        keys = yield self._read_text(stream)
        yield stream.write(b"\x00")
        print(keys)
        # save
        entry = self.devices[uuid] = {'keys': keys}
        # data: one float per key; compile the format once instead of
        # recomputing its size for every frame.
        frame = struct.Struct("%df" % len(keys.split(',')))
        try:
            while True:
                try:
                    data = yield stream.read_bytes(frame.size)
                except StreamClosedError:
                    print('iphonex is closed')
                    break
                print(frame.unpack(data))
                ue4stream = entry.get('ue4')
                if ue4stream:
                    try:
                        yield ue4stream.write(data)
                    except StreamClosedError:
                        # The consumer went away; keep reading so that a
                        # new consumer can attach later.
                        entry['ue4'] = None
                        print('request for %s closed' % uuid)
        finally:
            # Forget this producer, unless a newer connection with the same
            # uuid has already replaced the entry.
            if self.devices.get(uuid) is entry:
                del self.devices[uuid]

    @gen.coroutine
    def handle_ue4_stream(self, stream, address):
        """Attach a consumer to the producer registered under its uuid.

        The connection is rejected with ``0x01`` and closed when no such
        producer exists, and closed when the consumer answers ``0x01`` to
        the key list.
        """
        yield stream.write(b"\x00")
        print("ue4")
        # uuid
        uuid = yield self._read_text(stream)
        print(uuid)
        entry = self.devices.get(uuid)
        if entry is None:
            yield stream.write(b"\x01")
            stream.close()
            return
        yield stream.write(b"\x00")
        # send keys: the prefix must count encoded bytes, not characters.
        payload = entry['keys'].encode()
        yield stream.write(struct.pack(">I", len(payload)) + payload)
        valid = yield stream.read_bytes(1)
        if valid == b"\x01":
            print('keys not support.')
            stream.close()
            return
        if self.devices.get(uuid) is not entry:
            # The producer disconnected or re-registered during the
            # handshake, so the keys just sent are no longer current.
            stream.close()
            return
        entry['ue4'] = stream


if __name__ == "__main__":
    server = ProxyServer()
    server.listen(1234)
    IOLoop.current().start()
请点赞转发帮助身边更多的人