Fixed the 'title' regexp to be non-greedy, in case there's a </title> tag within the document itself.

Also added a test for this (the test URL will hopefully be a permanent link, though that's not certain).
2026-06-02 14:02:31 +02:00 · 2003-10-24 00:46:21 +00:00 · 2003-10-24 00:46:21 +00:00 · f0574da59a
commit f0574da59a
parent aa05fc1a79
2 changed files with 6 additions and 1 deletions
--- a/plugins/Http.py
+++ b/plugins/Http.py
@@ -79,7 +79,7 @@ class FreshmeatException(Exception):
 class Http(callbacks.Privmsg):
    threaded = True

-    _titleRe = re.compile(r'<title>(.*)</title>', re.I | re.S)
+    _titleRe = re.compile(r'<title>(.*?)</title>', re.I | re.S)
    def title(self, irc, msg, args):
        """<url>

--- a/test/test_Http.py
+++ b/test/test_Http.py
@@ -49,6 +49,11 @@ class HttpTest(PluginTestCase, PluginDocumentation):
                             '1884822312/qid=1063140754/sr=8-1/ref=sr_8_1/'
                             '002-9802970-2308826?v=glance&s=books&n=507846',
                             'no HTML title')
+        # Checks the non-greediness of the regexp
+        self.assertResponse('title '
+                            'http://www.space.com/scienceastronomy/'
+                            'jupiter_dark_spot_031023.html',
+                            'Mystery Spot on Jupiter Baffles Astronomers')

    def testGeekquote(self):
        self.assertNotError('geekquote')