home
·
contact
·
privacy
projects
/
plomlombot-irc.git
/ blobdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
|
commitdiff
|
tree
raw
|
inline
| side by side
In recv_line(), handle UnicodeDecodeErrors by assuming latin1.
[plomlombot-irc.git]
/
plomlombot.py
diff --git
a/plomlombot.py
b/plomlombot.py
index d6feb9377b4e36a1c5af96adb078f480c1c6f5fa..0b605e9946b04f79a8f3e843da56eee2b59b0169 100755
(executable)
--- a/
plomlombot.py
+++ b/
plomlombot.py
@@
-67,7
+67,11
@@
class IO:
self._pingtest(send_ping)
return None
self.last_pong = time.time()
self._pingtest(send_ping)
return None
self.last_pong = time.time()
- received_runes = self.socket.recv(1024).decode("UTF-8")
+ received_bytes = self.socket.recv(1024)
+ try:
+ received_runes = received_bytes.decode("UTF-8")
+ except UnicodeDecodeError:
+ received_runes = received_bytes.decode("latin1")
if len(received_runes) == 0:
print("SOCKET CONNECTION BROKEN")
raise ExceptionForRestart
if len(received_runes) == 0:
print("SOCKET CONNECTION BROKEN")
raise ExceptionForRestart
@@
-100,14
+104,21
@@
def lineparser_loop(io, nickname):
def act_on_privmsg(tokens):
def url_check(msg):
def act_on_privmsg(tokens):
def url_check(msg):
+
+ def notice(msg):
+ io.send_line("NOTICE " + target + " :" + msg)
+
matches = re.findall("(https?://[^\s>]+)", msg)
for i in range(len(matches)):
url = matches[i]
matches = re.findall("(https?://[^\s>]+)", msg)
for i in range(len(matches)):
url = matches[i]
+ request = urllib.request.Request(url, headers={
+ "User-Agent": "plomlombot"
+ })
try:
try:
- webpage = urllib.request.urlopen(
url
, timeout=15)
+ webpage = urllib.request.urlopen(
request
, timeout=15)
except (urllib.error.HTTPError, urllib.error.URLError,
UnicodeError, http.client.BadStatusLine) as error:
except (urllib.error.HTTPError, urllib.error.URLError,
UnicodeError, http.client.BadStatusLine) as error:
-
print
("TROUBLE FOLLOWING URL: " + str(error))
+
notice
("TROUBLE FOLLOWING URL: " + str(error))
continue
charset = webpage.info().get_content_charset()
if not charset:
continue
charset = webpage.info().get_content_charset()
if not charset:
@@
-115,14
+126,13
@@
def lineparser_loop(io, nickname):
content_type = webpage.info().get_content_type()
if content_type not in ('text/html', 'text/xml',
'application/xhtml+xml'):
content_type = webpage.info().get_content_type()
if content_type not in ('text/html', 'text/xml',
'application/xhtml+xml'):
-
print("TROUBLE INTERPRETING URL
: bad content type "
- + content_type)
+
notice("TROUBLE READING PAGE TITLE
: bad content type "
+
+ content_type)
continue
content = webpage.read().decode(charset)
title = str(content).split('<title>')[1].split('</title>')[0]
title = html.unescape(title)
continue
content = webpage.read().decode(charset)
title = str(content).split('<title>')[1].split('</title>')[0]
title = html.unescape(title)
- io.send_line("PRIVMSG " + target + " :page title for url: "
- + title)
+ notice("PAGE TITLE FOR URL: " + title)
sender = ""
for rune in tokens[0]:
sender = ""
for rune in tokens[0]: