URL interpreter: Handle HTTPErrors.

[plomlombot-irc.git] / plomlombot.py
diff --git a/plomlombot.py b/plomlombot.py

index 7d915dc2f80c79157119089aa2e0dd6e9566d16a..ffb4192ac8f2925b1d6a34684acfd585eec82c6f 100644 (file)
--- a/plomlombot.py
+++ b/plomlombot.py
@@ -9,10 +9,10 @@ import html
  servernet = "irc.freenode.net"
  port = 6667
  servername = ""
  servernet = "irc.freenode.net"
  port = 6667
  servername = ""
-timeout = 480
+timeout = 240
  username = "plomlombot"
  nickname = username
  username = "plomlombot"
  nickname = username
-channel = "#zrolaps"
+channel = "#zrolaps-test"
  
  class IO:
  
  
  class IO:
  
@@ -71,6 +71,28 @@ class IO:
              line)
          return line
  
              line)
          return line
  
+def url_check(msg):
+    matches = re.findall("(https?://[^\s]+)", msg)
+    for i in range(len(matches)):
+        url = matches[i]
+        try:
+            webpage = urllib.request.urlopen(url, timeout=15)
+        except urllib.error.HTTPError as error:
+            print("TROUBLE FOLLOWING URL: " + str(error))
+            continue
+        charset = webpage.info().get_content_charset()
+        if not charset:
+            charset="utf-8"
+        content_type = webpage.info().get_content_type()
+        if not content_type in ('text/html', 'text/xml',
+                'application/xhtml+xml'):
+            print("TROUBLE INTERPRETING URL: bad content_type " + content_type)
+            continue
+        content = webpage.read().decode(charset)
+        title = str(content).split('<title>')[1].split('</title>')[0]
+        title = html.unescape(title)
+        io.send_line("PRIVMSG " + target + " :page title for url: " + title)
+
  io = IO(servernet, port)
  io.send_line("NICK " + nickname)
  io.send_line("USER " + username + " 0 * : ")
  io = IO(servernet, port)
  io.send_line("NICK " + nickname)
  io.send_line("USER " + username + " 0 * : ")
@@ -99,19 +121,6 @@ while 1:
              if receiver != nickname:
                  target = receiver
              msg = str.join(" ", tokens[3:])[1:]
              if receiver != nickname:
                  target = receiver
              msg = str.join(" ", tokens[3:])[1:]
-            matches = re.findall("(https?://[^\s]+)", msg)
-            for i in range(len(matches)):
-                url = matches[i]
-                webpage = urllib.request.urlopen(url)
-                content_type = webpage.info().get_content_type()
-                if not content_type in ('text/html', 'text/xml',
-                    'application/xhtml+xml'):
-                    continue
-                charset = webpage.info().get_content_charset()
-                content = webpage.read().decode(charset)
-                title = str(content).split('<title>')[1].split('</title>')[0]
-                title = html.unescape(title)
-                io.send_line("PRIVMSG "
-                    + target + " :page title for url: " + title)
+            url_check(msg)
          if tokens[0] == "PING":
              io.send_line("PONG " + tokens[1])
          if tokens[0] == "PING":
              io.send_line("PONG " + tokens[1])