2004-09-29 06:40:25 +02:00
|
|
|
###
|
|
|
|
# Copyright (c) 2002-2004, Jeremiah Fincher
|
|
|
|
# All rights reserved.
|
|
|
|
#
|
|
|
|
# Redistribution and use in source and binary forms, with or without
|
|
|
|
# modification, are permitted provided that the following conditions are met:
|
|
|
|
#
|
|
|
|
# * Redistributions of source code must retain the above copyright notice,
|
|
|
|
# this list of conditions, and the following disclaimer.
|
|
|
|
# * Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
# this list of conditions, and the following disclaimer in the
|
|
|
|
# documentation and/or other materials provided with the distribution.
|
|
|
|
# * Neither the name of the author of this software nor the name of
|
|
|
|
# contributors to this software may be used to endorse or promote products
|
|
|
|
# derived from this software without specific prior written consent.
|
|
|
|
#
|
|
|
|
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
# POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
###
|
|
|
|
|
|
|
|
"""
|
2004-10-01 18:08:00 +02:00
|
|
|
Shrinks URLs using tinyurl.com and ln-s.net.
|
2004-09-29 06:40:25 +02:00
|
|
|
"""
|
|
|
|
|
|
|
|
__revision__ = "$Id$"
|
|
|
|
|
|
|
|
import supybot.plugins as plugins
|
|
|
|
|
|
|
|
import os
|
|
|
|
import re
|
|
|
|
import sets
|
|
|
|
import time
|
|
|
|
import getopt
|
|
|
|
import urlparse
|
|
|
|
import itertools
|
|
|
|
|
|
|
|
import supybot.dbi as dbi
|
|
|
|
import supybot.conf as conf
|
|
|
|
import supybot.utils as utils
|
|
|
|
import supybot.ircmsgs as ircmsgs
|
2004-10-16 05:39:42 +02:00
|
|
|
from supybot.commands import *
|
2004-09-29 06:40:25 +02:00
|
|
|
import supybot.webutils as webutils
|
|
|
|
import supybot.ircutils as ircutils
|
|
|
|
import supybot.registry as registry
|
|
|
|
import supybot.callbacks as callbacks
|
|
|
|
|
|
|
|
def configure(advanced):
    """Interactive setup hook for the ShrinkUrl plugin.

    Registers the plugin and asks whether the URL-shrinking snarfer should
    be switched on.  `advanced` is accepted for interface compatibility and
    is not consulted here.
    """
    # Imported locally so the questions module is only loaded when the
    # plugin is actually being configured interactively.
    from supybot.questions import yn
    conf.registerPlugin('ShrinkUrl', True)
    if yn("""This plugin offers a snarfer that will go to ln-s.net or
             tinyurl.com and get a shorter version of long URLs that are
             sent to the channel.  Would you like this snarfer to be
             enabled?""", default=False):
        # The registered setting is 'shrinkSnarfer'; the previous name
        # ('tinyurlSnarfer') is not registered anywhere in this module.
        conf.supybot.plugins.ShrinkUrl.shrinkSnarfer.setValue(True)
|
|
|
|
|
2004-10-01 18:08:00 +02:00
|
|
|
class ShrinkService(registry.OnlySomeStrings):
    # Registry value type for the 'default' setting: the name of the
    # shrinking service to use.  'ln' selects ln-s.net and 'tiny' selects
    # tinyurl.com (see the dispatch on these names in ShrinkUrl).
    validStrings = ('ln', 'tiny')
|
|
|
|
|
2004-09-29 06:40:25 +02:00
|
|
|
# --- Plugin configuration -------------------------------------------------
# Every setting below is registered as a per-channel value under
# supybot.plugins.ShrinkUrl.
conf.registerPlugin('ShrinkUrl')

# Master switch for the snarfer that answers long URLs with a short one.
conf.registerChannelValue(conf.supybot.plugins.ShrinkUrl, 'shrinkSnarfer',
    registry.Boolean(False, """Determines whether the
    shrink snarfer is enabled. This snarfer will watch for URLs in the
    channel, and if they're sufficiently long (as determined by
    supybot.plugins.ShrinkUrl.minimumLength) it will post a
    smaller URL from either ln-s.net or tinyurl.com, as denoted in
    supybot.plugins.ShrinkUrl.default."""))

# Length threshold shared by the snarfer and the out-filter.
conf.registerChannelValue(conf.supybot.plugins.ShrinkUrl, 'minimumLength',
    registry.PositiveInteger(48, """The minimum length a URL must be before
    the bot will shrink it."""))

# URLs matching this regexp are never snarfed.
conf.registerChannelValue(conf.supybot.plugins.ShrinkUrl, 'nonSnarfingRegexp',
    registry.Regexp(None, """Determines what URLs are to be snarfed; URLs
    matching the regexp given will not be snarfed. Give the empty string if
    you have no URLs that you'd like to exclude from being snarfed."""))

# Whether the bot's own outgoing channel messages get their URLs shrunk.
conf.registerChannelValue(conf.supybot.plugins.ShrinkUrl, 'outFilter',
    registry.Boolean(False, """Determines whether the bot will shrink the URLs
    of outgoing messages if those URLs are longer than
    supybot.plugins.ShrinkUrl.minimumLength."""))

# Which shrinking service to use; restricted to ShrinkService.validStrings.
conf.registerChannelValue(conf.supybot.plugins.ShrinkUrl, 'default',
    ShrinkService('ln', """Determines what website the bot will use when
    shrinking a URL."""))
|
2004-09-29 06:40:25 +02:00
|
|
|
|
2004-09-30 06:10:54 +02:00
|
|
|
class CdbShrunkenUrlDB(object):
    """Cache of already-shrunken URLs, one cdb database per service.

    Two databases are opened side by side, derived from the single filename
    handed to the constructor: one for tinyurl.com results and one for
    ln-s.net results.  Each maps a long URL to its short form.
    """

    def __init__(self, filename):
        """Open (or create) the per-service databases next to `filename`."""
        cdb = conf.supybot.databases.types.cdb
        self.tinyDb = cdb.connect(self._serviceFilename(filename, 'Tiny'))
        self.lnDb = cdb.connect(self._serviceFilename(filename, 'Ln'))

    def _serviceFilename(filename, service):
        """Return `filename` with `.service` inserted before its extension.

        Only the final extension is touched: 'ShrinkUrl.db' becomes
        'ShrinkUrl.Tiny.db'.  A blanket str.replace('.db', ...) would also
        rewrite any '.db' occurring in a directory name, and would hand
        back the very same path for both services when the filename has no
        '.db' in it at all.
        """
        (root, ext) = os.path.splitext(filename)
        return '%s.%s%s' % (root, service, ext)
    _serviceFilename = staticmethod(_serviceFilename)

    def getTiny(self, url):
        """Return the cached tinyurl.com URL for `url`.

        Raises KeyError if `url` has not been cached.
        """
        return self.tinyDb[url]

    def setTiny(self, url, tinyurl):
        """Remember `tinyurl` as the tinyurl.com form of `url`."""
        self.tinyDb[url] = tinyurl

    def getLn(self, url):
        """Return the cached ln-s.net URL for `url`.

        Raises KeyError if `url` has not been cached.
        """
        return self.lnDb[url]

    def setLn(self, url, lnurl):
        """Remember `lnurl` as the ln-s.net form of `url`."""
        self.lnDb[url] = lnurl

    def close(self):
        """Close both underlying databases."""
        self.tinyDb.close()
        self.lnDb.close()

    def flush(self):
        """Flush both underlying databases."""
        self.tinyDb.flush()
        self.lnDb.flush()
|
2004-09-30 06:10:54 +02:00
|
|
|
|
|
|
|
# Database factory for this plugin: maps the 'cdb' backend name to
# CdbShrunkenUrlDB.  ShrinkUrl.__init__ calls it with no arguments to obtain
# its cache.
ShrunkenUrlDB = plugins.DB('ShrinkUrl', {'cdb': CdbShrunkenUrlDB})
|
2004-10-04 20:15:06 +02:00
|
|
|
|
2004-09-29 06:40:25 +02:00
|
|
|
class ShrinkUrl(callbacks.PrivmsgCommandAndRegexp):
    # Plugin that shortens URLs through ln-s.net or tinyurl.com.  It offers
    # the `ln` and `tiny` commands, a snarfer that answers long URLs seen in
    # a channel with a short form, and an out-filter that rewrites long URLs
    # in the bot's own channel messages.  Results are cached in self.db.
    #
    # NOTE: on the snarfer method the docstring is the regexp to match and
    # on the command methods it is the help text, so those docstrings are
    # part of the plugin's behaviour.
    regexps = ['shrinkSnarfer']

    def __init__(self):
        # The cache is opened before the parent initializer runs, as in the
        # original ordering.
        self.db = ShrunkenUrlDB()
        self.__parent = super(ShrinkUrl, self)
        self.__parent.__init__()

    def die(self):
        """Close the URL cache when the plugin is unloaded."""
        self.db.close()

    def callCommand(self, name, irc, msg, *L, **kwargs):
        """Run a command, reporting web failures as an ordinary error reply."""
        try:
            self.__parent.callCommand(name, irc, msg, *L, **kwargs)
        except webutils.WebError:
            # Fetch the active exception through sys.exc_info() so this
            # handler parses on interpreters that accept only one of the
            # "except X, e" / "except X as e" spellings.
            import sys
            e = sys.exc_info()[1]
            irc = callbacks.SimpleProxy(irc, msg)
            irc.error(str(e))

    def _shrink(self, url, service):
        """Return the short form of `url` from `service`, or None.

        `service` is one of the ShrinkService names ('ln' or 'tiny').  None
        is returned when the service gave no usable answer or the name is
        not recognized.  webutils.WebError from the fetch propagates.
        """
        if service == 'ln':
            (shortUrl, _) = self._getLnUrl(url)
            return shortUrl
        if service == 'tiny':
            return self._getTinyUrl(url)
        return None

    def _outFilterThread(self, irc, msg):
        """Re-queue `msg` with every sufficiently long URL shortened.

        URLs that cannot be shortened (web error, or no short URL returned)
        are left untouched.  The re-queued message is tagged 'shrunken' so
        that outFilter lets it through.
        """
        (channel, text) = msg.args
        minlen = self.registryValue('minimumLength', channel)
        service = self.registryValue('default', channel)
        for m in webutils.httpUrlRe.finditer(text):
            url = m.group(1)
            # Same threshold test as the snarfer (>=), so both features
            # agree on what "minimumLength" means.
            if len(url) < minlen:
                continue
            try:
                shortUrl = self._shrink(url, service)
            except webutils.WebError:
                # Best effort: an unreachable service must not block the
                # outgoing message.
                self.log.debug('Couldn\'t shrink %s; sending it unchanged.',
                               utils.quoted(url))
                continue
            # A failed lookup yields None; str.replace would raise on it.
            if shortUrl is not None:
                text = text.replace(url, shortUrl)
        newMsg = ircmsgs.privmsg(channel, text, msg=msg)
        newMsg.tag('shrunken')
        irc.queueMsg(newMsg)

    def outFilter(self, irc, msg):
        """Intercept outgoing channel messages that contain URLs.

        Returns `msg` unchanged when nothing is to be done.  Returns None
        (dropping the original) after handing the message to
        _outFilterThread, which queues the rewritten copy.
        """
        # Check the command and argument count first: not every outgoing
        # message carries a target and a text argument.
        if msg.command != 'PRIVMSG' or len(msg.args) < 2:
            return msg
        channel = msg.args[0]
        if not irc.isChannel(channel):
            return msg
        if msg.shrunken:
            # Already produced by this plugin.
            return msg
        if not self.registryValue('outFilter', channel):
            return msg
        if webutils.httpUrlRe.search(msg.args[1]):
            self._outFilterThread(irc, msg)
            return None
        return msg

    def shrinkSnarfer(self, irc, msg, match):
        r"https?://[^\])>\s]{13,}"
        channel = msg.args[0]
        if not irc.isChannel(channel):
            return
        if not self.registryValue('shrinkSnarfer', channel):
            return
        url = match.group(0)
        r = self.registryValue('nonSnarfingRegexp', channel)
        if r and r.search(url) is not None:
            self.log.debug('Matched nonSnarfingRegexp: %s',
                           utils.quoted(url))
            return
        minlen = self.registryValue('minimumLength', channel)
        cmd = self.registryValue('default', channel)
        if len(url) < minlen:
            return
        shorturl = self._shrink(url, cmd)
        if shorturl is None:
            self.log.info('Couldn\'t get shorturl for %s',
                          utils.quoted(url))
            return
        domain = webutils.getDomain(url)
        s = '%s (at %s)' % (ircutils.bold(shorturl), domain)
        m = irc.reply(s, prefixName=False)
        # Tagged so that outFilter does not try to shrink our own reply.
        m.tag('shrunken')
    shrinkSnarfer = urlSnarfer(shrinkSnarfer)

    def _getLnUrl(self, url):
        """Return `(lnurl, code)` for `url` using ln-s.net.

        `code` is the status token reported by the service ('200' on
        success, also used for cache hits).  `lnurl` is None whenever the
        code is not '200' or the reply could not be parsed.  In the latter
        case the second element is the raw reply text instead of a code.
        The cache is keyed on the quoted URL.
        """
        url = webutils.urlquote(url)
        try:
            return (self.db.getLn(url), '200')
        except KeyError:
            pass
        text = webutils.getUrl('http://ln-s.net/home/api.jsp?url=%s' % url)
        parts = text.split(None, 1)
        if len(parts) != 2:
            # Expected "<code> <rest>"; anything else is reported as a
            # failure rather than raising ValueError on the unpack.
            return (None, text.strip() or 'ln-s.net returned an empty reply.')
        (code, lnurl) = parts
        if code != '200':
            return (None, code)
        lnurl = lnurl.strip()
        self.db.setLn(url, lnurl)
        return (lnurl, code)

    def ln(self, irc, msg, args, url):
        """<url>

        Returns an ln-s.net version of <url>.
        """
        if len(url) < 17:
            irc.error('Stop being a lazy-biotch and type the URL yourself.')
            return
        (lnurl, error) = self._getLnUrl(url)
        if lnurl is not None:
            m = irc.reply(lnurl)
            m.tag('shrunken')
        else:
            irc.error(error)
    ln = thread(wrap(ln, ['url']))

    _tinyRe = re.compile(r'<blockquote><b>(http://tinyurl\.com/\w+)</b>')
    def _getTinyUrl(self, url):
        """Return the tinyurl.com form of `url`, or None if parsing fails.

        The cache is keyed on the URL exactly as given.  Only successful
        results are stored.
        """
        try:
            return self.db.getTiny(url)
        except KeyError:
            pass
        # Quote the URL for the request, as _getLnUrl does; sent raw, any
        # '&' or '#' in it would cut the submitted URL short.
        s = webutils.getUrl('http://tinyurl.com/create.php?url=%s' %
                            webutils.urlquote(url))
        m = self._tinyRe.search(s)
        if m is None:
            # Nothing to cache: the results page did not contain a link.
            return None
        tinyurl = m.group(1)
        self.db.setTiny(url, tinyurl)
        return tinyurl

    def tiny(self, irc, msg, args, url):
        """<url>

        Returns a TinyURL.com version of <url>
        """
        if len(url) < 20:
            irc.error('Stop being a lazy-biotch and type the URL yourself.')
            return
        tinyurl = self._getTinyUrl(url)
        if tinyurl is not None:
            m = irc.reply(tinyurl)
            m.tag('shrunken')
        else:
            s = 'Could not parse the TinyURL.com results page.'
            irc.errorPossibleBug(s)
    tiny = thread(wrap(tiny, ['url']))
|
2004-09-29 06:40:25 +02:00
|
|
|
|
|
|
|
|
|
|
|
# Module-level alias for the plugin class.
# NOTE(review): presumably the name the Supybot plugin loader looks up when
# loading this module -- confirm against the loader.
Class = ShrinkUrl
|
|
|
|
|
|
|
|
# vim:set shiftwidth=4 tabstop=8 expandtab textwidth=78:
|