Web tool now handles HTTPS connections, content is decoded following given charset header

This commit is contained in:
nemunaire 2014-06-24 18:07:28 +02:00
parent 7575c41645
commit 05a148fef4
2 changed files with 26 additions and 4 deletions

View File

@ -40,11 +40,13 @@ def cmd_curl(msg):
req = web.getURLContent(" ".join(msg.cmds[1:])) req = web.getURLContent(" ".join(msg.cmds[1:]))
if req is not None: if req is not None:
res = Response(msg.sender, channel=msg.channel) res = Response(msg.sender, channel=msg.channel)
for m in req.decode().split("\n"): for m in req.split("\n"):
res.append_message(m) res.append_message(m)
return res return res
else: else:
return Response(msg.sender, "Une erreur est survenue lors de l'accès à cette URL", channel=msg.channel) return Response(msg.sender, "Une erreur est survenue lors de l'accès à cette URL", channel=msg.channel)
except socket.timeout:
return Response(msg.sender, "le délais d'attente a été dépassé durant l'accès à %s" % msg.cmds[1:], channel=msg.channel, nick=msg.nick)
except socket.error as e: except socket.error as e:
return Response(msg.sender, e.strerror, channel=msg.channel) return Response(msg.sender, e.strerror, channel=msg.channel)
else: else:
@ -117,6 +119,8 @@ def cmd_whois(msg):
try: try:
req = urllib.request.Request("http://www.whoisxmlapi.com/whoisserver/WhoisService?rid=1&domainName=%s&outputFormat=json&userName=%s&password=%s" % (urllib.parse.quote(dom), urllib.parse.quote(CONF.getNode("whoisxmlapi")["username"]), urllib.parse.quote(CONF.getNode("whoisxmlapi")["password"])), headers={ 'User-Agent' : "nemubot v3" }) req = urllib.request.Request("http://www.whoisxmlapi.com/whoisserver/WhoisService?rid=1&domainName=%s&outputFormat=json&userName=%s&password=%s" % (urllib.parse.quote(dom), urllib.parse.quote(CONF.getNode("whoisxmlapi")["username"]), urllib.parse.quote(CONF.getNode("whoisxmlapi")["password"])), headers={ 'User-Agent' : "nemubot v3" })
raw = urllib.request.urlopen(req, timeout=10) raw = urllib.request.urlopen(req, timeout=10)
except socket.timeout:
raise IRCException("Sorry, the request has timed out.")
except urllib.error.HTTPError as e: except urllib.error.HTTPError as e:
raise IRCException("HTTP error occurs: %s %s" % (e.code, e.reason)) raise IRCException("HTTP error occurs: %s %s" % (e.code, e.reason))

View File

@ -61,7 +61,17 @@ def getPassword(url):
def getURLContent(url, timeout=15): def getURLContent(url, timeout=15):
"""Return page content corresponding to URL or None if any error occurs""" """Return page content corresponding to URL or None if any error occurs"""
o = urlparse(url) o = urlparse(url)
conn = http.client.HTTPConnection(o.netloc, port=o.port, timeout=timeout) if o.netloc == "":
o = urlparse("http://" + url)
if o.scheme == "http":
conn = http.client.HTTPConnection(o.netloc, port=o.port, timeout=timeout)
elif o.scheme == "https":
conn = http.client.HTTPSConnection(o.netloc, port=o.port, timeout=timeout)
elif o.scheme is None or o.scheme == "":
conn = http.client.HTTPConnection(o.netloc, port=80, timeout=timeout)
else:
return None
try: try:
if o.query != '': if o.query != '':
conn.request("GET", o.path + "?" + o.query, None, {"User-agent": "Nemubot v3"}) conn.request("GET", o.path + "?" + o.query, None, {"User-agent": "Nemubot v3"})
@ -70,8 +80,8 @@ def getURLContent(url, timeout=15):
except socket.timeout: except socket.timeout:
return None return None
except socket.gaierror: except socket.gaierror:
print ("<tools.web> Unable to receive page %s from %s on %d." print ("<tools.web> Unable to receive page %s on %s from %s."
% (o.path, o.netloc, o.port)) % (o.path, o.netloc, url))
return None return None
try: try:
@ -83,6 +93,14 @@ def getURLContent(url, timeout=15):
return None return None
data = res.read(size) data = res.read(size)
# Decode content
charset = res.getheader("Content-Type").split(";")
if len(charset) > 1:
for c in charset:
ch = c.split("=")
if ch[0].strip().lower() == "charset" and len(ch) > 1:
data = data.decode(ch[1])
except http.client.BadStatusLine: except http.client.BadStatusLine:
return None return None
finally: finally: