diff options
| author | 2019-07-08 11:43:09 +0100 | |
|---|---|---|
| committer | 2019-07-08 11:43:09 +0100 | |
| commit | 15e143fcff39d64c5acc2d93f61c2f00f65c2ee0 (patch) | |
| tree | f3d1cb44251c34edb64bfe0f7bbc6e3773d51b91 /src | |
| parent | only set last_stdout/last_stderr when there's actually output (diff) | |
| signature | ||
implement utils.http.request_many as a tornado ioloop yield
Diffstat (limited to 'src')
| -rw-r--r-- | src/utils/http.py | 20 |
1 files changed, 19 insertions, 1 deletions
```diff
diff --git a/src/utils/http.py b/src/utils/http.py
index 2885ebee..d12a978b 100644
--- a/src/utils/http.py
+++ b/src/utils/http.py
@@ -1,7 +1,7 @@
 import ipaddress, re, signal, socket, traceback, typing
 import urllib.error, urllib.parse
 import json as _json
-import bs4, netifaces, requests
+import bs4, netifaces, requests, tornado.gen, tornado.httpclient, tornado.ioloop
 from src import utils
 
 REGEX_URL = re.compile("https?://[A-Z0-9{}]+".format(re.escape("-._~:/%?#[]@!$&'()*+,;=")), re.I)
@@ -109,6 +109,24 @@ def request(url: str, method: str="GET", get_params: dict={},
 
     return Response(response.status_code, data, response_headers)
 
+def request_many(urls: typing.List[str]) -> typing.Dict[str, Response]:
+    responses = {}
+
+    @tornado.gen.coroutine
+    def _request():
+        for url in urls:
+            client = tornado.httpclient.AsyncHTTPClient()
+            request = tornado.httpclient.HTTPRequest(url, method="GET",
+                connect_timeout=2, request_timeout=2)
+            response = yield client.fetch(request)
+
+            headers = utils.CaseInsensitiveDict(dict(response.headers))
+            data = response.body.decode("utf8")
+            responses[url] = Response(response.code, data, headers)
+
+    tornado.ioloop.IOLoop.current().run_sync(_request)
+    return responses
+
 def strip_html(s: str) -> str:
     return bs4.BeautifulSoup(s, "lxml").get_text()
 
```
