个人技术博客
个人技术博客

Subscribe to kk

Subscribe to kk
Share Dialog
Share Dialog
<100 subscribers
<100 subscribers

class Fetcher:
    """Callback-driven HTTP fetcher (excerpt; URL parsing is elided).

    Each step runs as a callback registered on the module-level ``selector``:
    ``get_url`` starts the connection, ``connected`` sends the request, and
    ``read`` collects the response until the peer closes the connection.
    """

    def connected(self, key):
        """Send the GET request once the socket has become writable.

        Args:
            key: The ``SelectorKey`` of the socket that became ready.
        """
        # The write-interest registration has done its job; drop it before
        # switching this socket over to read interest.
        selector.unregister(key.fd)
        request = 'GET {} HTTP/1.1\r\nHost:{}\r\nConnection:close\r\n\r\n'.format(self.path, self.host)
        self.con.send(request.encode('utf-8'))
        selector.register(self.con.fileno(), EVENT_READ, self.read)

    def read(self, key):
        """Accumulate response bytes; on end-of-stream print the body.

        Args:
            key: The ``SelectorKey`` of the socket that became readable.
        """
        chunk = self.con.recv(1024)
        if chunk:
            print(chunk)
            self.data += chunk
            return

        # An empty read means the peer closed the connection: the response
        # is complete.
        selector.unregister(key.fd)
        self.con.close()
        # Undecodable bytes are replaced instead of aborting the callback.
        self.data = self.data.decode('utf-8', errors='replace')
        # Split only at the FIRST blank line so a body that itself contains
        # "\r\n\r\n" is kept whole; a response without a header terminator
        # yields an empty body instead of raising IndexError.
        _headers, _sep, html_data = self.data.partition('\r\n\r\n')
        print(html_data)

    def get_url(self, url):
        """Start a non-blocking connection and wait for it to become writable.

        Args:
            url: The URL to fetch.
        """
        # URL parsing is elided in this excerpt; the complete listing sets
        # self.host, self.path and self.data here.
        ...
        self.con = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
        # Switch the socket to non-blocking mode.
        self.con.setblocking(False)
        try:
            self.con.connect((self.host, 80))
        except BlockingIOError:
            # Expected for a non-blocking connect that is still in progress.
            pass
        selector.register(self.con.fileno(), EVENT_WRITE, self.connected)
过程:创建一个socket并设置为非阻塞,发起连接后在selector中注册事件。self.con.fileno()返回当前连接在进程中的文件描述符,EVENT_WRITE表示监听该socket的可写事件(非阻塞连接建立完成后socket即变为可写),self.connected为回调函数,事件就绪后由事件循环调用。在connected中先用selector.unregister(key.fd)取消注册,发送HTTP请求,再调用selector.register(self.con.fileno(), EVENT_READ, self.read)注册可读事件;当响应数据可读时,事件循环调用read回调函数读取出响应内容。
注明:DefaultSelector会自动选择当前平台上最高效的实现:在windows下使用select函数,在linux下使用epoll,在macOS/BSD下使用kqueue。
完整代码如下:
import socket
from urllib.parse import urlparse
from selectors import DefaultSelector, EVENT_READ, EVENT_WRITE
selector = DefaultSelector()
class Fetcher:
    """Fetch a single page over plain HTTP with a non-blocking socket.

    The work is split into callbacks registered on the module-level
    ``selector``: ``get_url`` starts the connection, ``connected`` sends the
    request once the socket is writable, and ``read`` collects the response
    until the peer closes the connection. No TLS is performed, so only
    ``http://`` URLs are meaningful.
    """

    @staticmethod
    def _parse_url(url):
        """Split *url* into ``(host, port, request_target)``.

        The host excludes any ``:port`` suffix, the port defaults to 80, and
        the request target is the path (``/`` when empty) plus the query
        string when one is present.
        """
        parts = urlparse(url)
        target = parts.path or '/'
        if parts.query:
            target = '{}?{}'.format(target, parts.query)
        return parts.hostname or '', parts.port or 80, target

    @staticmethod
    def _extract_body(text):
        """Return everything after the first blank line of *text*.

        Only the first ``\\r\\n\\r\\n`` separates headers from body, so a body
        that itself contains a blank line is returned whole. When no
        separator is present the result is an empty string.
        """
        _headers, _sep, body = text.partition('\r\n\r\n')
        return body

    def connected(self, key):
        """Send the GET request once the socket has become writable.

        Args:
            key: The ``SelectorKey`` of the socket that became ready.
        """
        # The write-interest registration has done its job; drop it before
        # switching this socket over to read interest.
        selector.unregister(key.fd)
        # A non-default port has to be repeated in the Host header.
        if self.port == 80:
            host_header = self.host
        else:
            host_header = '{}:{}'.format(self.host, self.port)
        request = 'GET {} HTTP/1.1\r\nHost:{}\r\nConnection:close\r\n\r\n'.format(self.path, host_header)
        # NOTE(review): a single send() is assumed to accept the whole
        # (small) request; a partial send is not retried.
        self.con.send(request.encode('utf-8'))
        selector.register(self.con.fileno(), EVENT_READ, self.read)

    def read(self, key):
        """Accumulate response bytes; on end-of-stream print the body.

        After the final call ``self.data`` holds the whole decoded response
        (headers and body) as ``str``.

        Args:
            key: The ``SelectorKey`` of the socket that became readable.
        """
        chunk = self.con.recv(1024)
        if chunk:
            print(chunk)
            self.data += chunk
            return

        # An empty read means the peer closed the connection: the response
        # is complete.
        selector.unregister(key.fd)
        self.con.close()
        # Undecodable bytes are replaced instead of aborting the callback.
        self.data = self.data.decode('utf-8', errors='replace')
        print(self._extract_body(self.data))

    def get_url(self, url):
        """Start a non-blocking connection to the host named in *url*.

        The request itself is sent later by ``connected`` once the selector
        reports the socket as writable.

        Args:
            url: The URL to fetch, e.g. ``'http://www.baidu.com'``.

        Raises:
            OSError: If the connection attempt fails immediately; the socket
                is closed before the error propagates.
        """
        self.host, self.port, self.path = self._parse_url(url)
        self.data = b''
        self.con = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
        self.con.setblocking(False)
        try:
            self.con.connect((self.host, self.port))
        except BlockingIOError:
            # Expected for a non-blocking connect that is still in progress.
            pass
        except OSError:
            self.con.close()
            raise
        # Register for writability; the callback fires when the socket is ready.
        selector.register(self.con.fileno(), EVENT_WRITE, self.connected)
def loop(sel=None):
    """Dispatch ready I/O events to their callbacks until nothing is registered.

    Every registration stores its callback as the key's ``data``; the
    callback is invoked with the ``SelectorKey`` that became ready.

    Args:
        sel: Selector to drive. Defaults to the module-level ``selector``.
    """
    active = selector if sel is None else sel
    # Stop once every callback has unregistered its socket; calling select()
    # with nothing registered would otherwise wait with no event to wake it.
    while active.get_map():
        for key, _mask in active.select():
            callback = key.data
            callback(key)
if __name__ == '__main__':
    # Queue one request, then hand control to the event loop, which drives
    # the connect / send / receive callbacks.
    fetcher = Fetcher()
    fetcher.get_url('http://www.baidu.com')
    loop()

class Fetcher:
    """Callback-driven HTTP fetcher (excerpt; URL parsing is elided).

    Each step runs as a callback registered on the module-level ``selector``:
    ``get_url`` starts the connection, ``connected`` sends the request, and
    ``read`` collects the response until the peer closes the connection.
    """

    def connected(self, key):
        """Send the GET request once the socket has become writable.

        Args:
            key: The ``SelectorKey`` of the socket that became ready.
        """
        # The write-interest registration has done its job; drop it before
        # switching this socket over to read interest.
        selector.unregister(key.fd)
        request = 'GET {} HTTP/1.1\r\nHost:{}\r\nConnection:close\r\n\r\n'.format(self.path, self.host)
        self.con.send(request.encode('utf-8'))
        selector.register(self.con.fileno(), EVENT_READ, self.read)

    def read(self, key):
        """Accumulate response bytes; on end-of-stream print the body.

        Args:
            key: The ``SelectorKey`` of the socket that became readable.
        """
        chunk = self.con.recv(1024)
        if chunk:
            print(chunk)
            self.data += chunk
            return

        # An empty read means the peer closed the connection: the response
        # is complete.
        selector.unregister(key.fd)
        self.con.close()
        # Undecodable bytes are replaced instead of aborting the callback.
        self.data = self.data.decode('utf-8', errors='replace')
        # Split only at the FIRST blank line so a body that itself contains
        # "\r\n\r\n" is kept whole; a response without a header terminator
        # yields an empty body instead of raising IndexError.
        _headers, _sep, html_data = self.data.partition('\r\n\r\n')
        print(html_data)

    def get_url(self, url):
        """Start a non-blocking connection and wait for it to become writable.

        Args:
            url: The URL to fetch.
        """
        # URL parsing is elided in this excerpt; the complete listing sets
        # self.host, self.path and self.data here.
        ...
        self.con = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
        # Switch the socket to non-blocking mode.
        self.con.setblocking(False)
        try:
            self.con.connect((self.host, 80))
        except BlockingIOError:
            # Expected for a non-blocking connect that is still in progress.
            pass
        selector.register(self.con.fileno(), EVENT_WRITE, self.connected)
过程:创建一个socket并设置为非阻塞,发起连接后在selector中注册事件。self.con.fileno()返回当前连接在进程中的文件描述符,EVENT_WRITE表示监听该socket的可写事件(非阻塞连接建立完成后socket即变为可写),self.connected为回调函数,事件就绪后由事件循环调用。在connected中先用selector.unregister(key.fd)取消注册,发送HTTP请求,再调用selector.register(self.con.fileno(), EVENT_READ, self.read)注册可读事件;当响应数据可读时,事件循环调用read回调函数读取出响应内容。
注明:DefaultSelector会自动选择当前平台上最高效的实现:在windows下使用select函数,在linux下使用epoll,在macOS/BSD下使用kqueue。
完整代码如下:
import socket
from urllib.parse import urlparse
from selectors import DefaultSelector, EVENT_READ, EVENT_WRITE
selector = DefaultSelector()
class Fetcher:
    """Fetch a single page over plain HTTP with a non-blocking socket.

    The work is split into callbacks registered on the module-level
    ``selector``: ``get_url`` starts the connection, ``connected`` sends the
    request once the socket is writable, and ``read`` collects the response
    until the peer closes the connection. No TLS is performed, so only
    ``http://`` URLs are meaningful.
    """

    @staticmethod
    def _parse_url(url):
        """Split *url* into ``(host, port, request_target)``.

        The host excludes any ``:port`` suffix, the port defaults to 80, and
        the request target is the path (``/`` when empty) plus the query
        string when one is present.
        """
        parts = urlparse(url)
        target = parts.path or '/'
        if parts.query:
            target = '{}?{}'.format(target, parts.query)
        return parts.hostname or '', parts.port or 80, target

    @staticmethod
    def _extract_body(text):
        """Return everything after the first blank line of *text*.

        Only the first ``\\r\\n\\r\\n`` separates headers from body, so a body
        that itself contains a blank line is returned whole. When no
        separator is present the result is an empty string.
        """
        _headers, _sep, body = text.partition('\r\n\r\n')
        return body

    def connected(self, key):
        """Send the GET request once the socket has become writable.

        Args:
            key: The ``SelectorKey`` of the socket that became ready.
        """
        # The write-interest registration has done its job; drop it before
        # switching this socket over to read interest.
        selector.unregister(key.fd)
        # A non-default port has to be repeated in the Host header.
        if self.port == 80:
            host_header = self.host
        else:
            host_header = '{}:{}'.format(self.host, self.port)
        request = 'GET {} HTTP/1.1\r\nHost:{}\r\nConnection:close\r\n\r\n'.format(self.path, host_header)
        # NOTE(review): a single send() is assumed to accept the whole
        # (small) request; a partial send is not retried.
        self.con.send(request.encode('utf-8'))
        selector.register(self.con.fileno(), EVENT_READ, self.read)

    def read(self, key):
        """Accumulate response bytes; on end-of-stream print the body.

        After the final call ``self.data`` holds the whole decoded response
        (headers and body) as ``str``.

        Args:
            key: The ``SelectorKey`` of the socket that became readable.
        """
        chunk = self.con.recv(1024)
        if chunk:
            print(chunk)
            self.data += chunk
            return

        # An empty read means the peer closed the connection: the response
        # is complete.
        selector.unregister(key.fd)
        self.con.close()
        # Undecodable bytes are replaced instead of aborting the callback.
        self.data = self.data.decode('utf-8', errors='replace')
        print(self._extract_body(self.data))

    def get_url(self, url):
        """Start a non-blocking connection to the host named in *url*.

        The request itself is sent later by ``connected`` once the selector
        reports the socket as writable.

        Args:
            url: The URL to fetch, e.g. ``'http://www.baidu.com'``.

        Raises:
            OSError: If the connection attempt fails immediately; the socket
                is closed before the error propagates.
        """
        self.host, self.port, self.path = self._parse_url(url)
        self.data = b''
        self.con = socket.socket(socket.AF_INET, socket.SOCK_STREAM)
        self.con.setblocking(False)
        try:
            self.con.connect((self.host, self.port))
        except BlockingIOError:
            # Expected for a non-blocking connect that is still in progress.
            pass
        except OSError:
            self.con.close()
            raise
        # Register for writability; the callback fires when the socket is ready.
        selector.register(self.con.fileno(), EVENT_WRITE, self.connected)
def loop(sel=None):
    """Dispatch ready I/O events to their callbacks until nothing is registered.

    Every registration stores its callback as the key's ``data``; the
    callback is invoked with the ``SelectorKey`` that became ready.

    Args:
        sel: Selector to drive. Defaults to the module-level ``selector``.
    """
    active = selector if sel is None else sel
    # Stop once every callback has unregistered its socket; calling select()
    # with nothing registered would otherwise wait with no event to wake it.
    while active.get_map():
        for key, _mask in active.select():
            callback = key.data
            callback(key)
if __name__ == '__main__':
    # Queue one request, then hand control to the event loop, which drives
    # the connect / send / receive callbacks.
    fetcher = Fetcher()
    fetcher.get_url('http://www.baidu.com')
    loop()
No activity yet