home
·
contact
·
privacy
projects
/
plomlombot-irc.git
/ commitdiff
commit
grep
author
committer
pickaxe
?
search:
re
summary
|
shortlog
|
log
|
commit
| commitdiff |
tree
raw
|
patch
| inline |
side by side
(parent:
01c61f5
)
Add content-type check to URL interpreter.
author
Christian Heller
<c.heller@plomlompom.de>
Sun, 17 Jan 2016 19:38:57 +0000
(20:38 +0100)
committer
Christian Heller
<c.heller@plomlompom.de>
Sun, 17 Jan 2016 19:38:57 +0000
(20:38 +0100)
plomlombot.py
patch
|
blob
|
history
diff --git a/plomlombot.py b/plomlombot.py
index 179bc2a2221d90da84580f57898aa3b704fca0f5..7d915dc2f80c79157119089aa2e0dd6e9566d16a 100644
(file)
--- a/plomlombot.py
+++ b/plomlombot.py
@@ -103,6 +103,10 @@ while 1:
for i in range(len(matches)):
url = matches[i]
webpage = urllib.request.urlopen(url)
+ content_type = webpage.info().get_content_type()
+ if not content_type in ('text/html', 'text/xml',
+ 'application/xhtml+xml'):
+ continue
charset = webpage.info().get_content_charset()
content = webpage.read().decode(charset)
title = str(content).split('<title>')[1].split('</title>')[0]