4KiB was not enough for everyone
This commit is contained in:
parent
d936b9646e
commit
179ff85f4c
12
botcmd.py
12
botcmd.py
|
@ -125,13 +125,17 @@ def handle_message(*, prefix, message, nick, channel, irc):
|
||||||
try:
|
try:
|
||||||
with urllib.request.urlopen(url, timeout = 1) as response:
|
with urllib.request.urlopen(url, timeout = 1) as response:
|
||||||
if response.info().get_content_type() == 'text/html':
|
if response.info().get_content_type() == 'text/html':
|
||||||
# First 4KB of a page should be enough for any <title>
|
# First 4KiB of a page should be enough for any <title>
|
||||||
first_kb = response.read(4 * 1024)
|
# Turns out 4KiB is not always enough, so read up to 64KiB instead
|
||||||
title = sanitize(extract_title(first_kb))
|
page_source_fragment = response.read(64 * 1024)
|
||||||
|
title = sanitize(extract_title(page_source_fragment))
|
||||||
|
|
||||||
domain = sanitize(urllib.parse.urlparse(url).netloc)
|
domain = sanitize(urllib.parse.urlparse(url).netloc)
|
||||||
|
|
||||||
message = '%s: %s' % (domain, title)
|
if title is not None:
|
||||||
|
message = '%s: %s' % (domain, title)
|
||||||
|
else:
|
||||||
|
message = '%s: <no title found>' % domain
|
||||||
irc.bot_response(channel, message)
|
irc.bot_response(channel, message)
|
||||||
|
|
||||||
possible_titles_left -= 1
|
possible_titles_left -= 1
|
||||||
|
|
Loading…
Reference in New Issue