#!/usr/bin/env python
###
# Copyright (c) 2002, Jeremiah Fincher
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions are met:
#
# * Redistributions of source code must retain the above copyright notice,
# this list of conditions, and the following disclaimer.
# * Redistributions in binary form must reproduce the above copyright notice,
# this list of conditions, and the following disclaimer in the
# documentation and/or other materials provided with the distribution.
# * Neither the name of the author of this software nor the name of
# contributors to this software may be used to endorse or promote products
# derived from this software without specific prior written consent.
#
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
# POSSIBILITY OF SUCH DAMAGE.
###
"""
Keeps track of URLs posted to a channel, along with relevant context. Allows
searching for URLs and returning random URLs. Also provides statistics on the
URLs in the database.
"""
__revision__ = "$Id$"
import plugins
import os
import re
import time
import getopt
import urllib2
import urlparse
import conf
import utils
import ircmsgs
import webutils
import ircutils
import privmsgs
import registry
import callbacks
try:
import sqlite
except ImportError:
raise callbacks.Error, 'You need to have PySQLite installed to use this ' \
'plugin. Download it at
(http://tinyurl\.com/\w+)') def _getTinyUrl(self, url, channel, cmd=False): db = self.getDb(channel) cursor = db.cursor() try: cursor.execute("""SELECT tinyurls.tinyurl FROM urls, tinyurls WHERE urls.url=%s AND tinyurls.url_id=urls.id""", url) except sqlite.OperationalError: raise if cursor.rowcount == 0: updateDb = True try: fd = urllib2.urlopen('http://tinyurl.com/create.php?url=%s' % url) s = fd.read() fd.close() m = self._tinyRe.search(s) if m is None: tinyurl = None else: tinyurl = m.group(1) except urllib2.HTTPError, e: if cmd: raise callbacks.Error, e.msg() else: self.log.warning(str(e)) else: updateDb = False tinyurl = cursor.fetchone()[0] return (tinyurl, updateDb) def _formatUrl(self, url, added, addedBy): when = time.strftime(conf.supybot.humanTimestampFormat(), time.localtime(int(added))) return '<%s> (added by %s at %s)' % (url, addedBy, when) def random(self, irc, msg, args): """[] Returns a random URL from the URL database. is only required if the message isn't sent in the channel itself. """ channel = privmsgs.getChannel(msg, args) db = self.getDb(channel) cursor = db.cursor() cursor.execute("""SELECT url, added, added_by FROM urls ORDER BY random() LIMIT 1""") if cursor.rowcount == 0: irc.reply('I have no URLs in my database for %s' % channel) else: irc.reply(self._formatUrl(*cursor.fetchone())) def tiny(self, irc, msg, args): """ Returns a TinyURL.com version of """ url = privmsgs.getArgs(args) if len(url) < 20: irc.error('Stop being a lazy-biotch and type the URL yourself.') return channel = msg.args[0] snarf = self.registryValue('tinyurlSnarfer', channel) minlen = self.registryValue('tinyurlSnarfer.minimumLength', channel) r = self.registryValue('nonSnarfingRegexp', channel) if snarf and len(url) >= minlen and not r.search(url): return try: (tinyurl, updateDb) = self._getTinyUrl(url, channel, cmd=True) except sqlite.OperationalError: irc.error('The database just decided to crap itself.') return if tinyurl is not None: if updateDb: self._updateTinyDb(url, tinyurl, channel) irc.reply(tinyurl) else: s = 'Could not parse the TinyURL.com results page.' irc.errorPossibleBug(s) tiny = privmsgs.thread(tiny) def stats(self, irc, msg, args): """[ ] Returns the number of URLs in the URL database. is only required if the message isn't sent in the channel itself. """ channel = privmsgs.getChannel(msg, args) db = self.getDb(channel) cursor = db.cursor() cursor.execute("""SELECT COUNT(*) FROM urls""") (count,) = cursor.fetchone() count = int(count) irc.reply('I have %s %s in my database.' % (count, count == 1 and 'URL' or 'URLs')) def last(self, irc, msg, args): """[ ] [--{from,with,at,proto,near}= ] --{nolimit,fancy} Gives the last URL matching the given criteria. --from is from whom the URL came; --at is the site of the URL; --proto is the protocol the URL used; --with is something inside the URL; --near is a string in the messages before and after the link. If --nolimit is given, returns all the URLs that are found. --fancy returns information in addition to just the URL. is only necessary if the message isn't sent in the channel itself. """ channel = privmsgs.getChannel(msg, args) (optlist, rest) = getopt.getopt(args, '', ['from=', 'with=', 'at=', 'proto=', 'near=', 'nolimit', 'fancy']) criteria = ['1=1'] formats = [] simple = True nolimit = False for (option, argument) in optlist: option = option.lstrip('-') # Strip off the --. if option == 'nolimit': nolimit = True if option == 'fancy': simple = False elif option == 'from': criteria.append('added_by LIKE %s') formats.append(argument) elif option == 'with': if '%' not in argument and '_' not in argument: argument = '%%%s%%' % argument criteria.append('url LIKE %s') formats.append(argument) elif option == 'at': if '%' not in argument and '_' not in argument: argument = '%' + argument criteria.append('site LIKE %s') formats.append(argument) elif option == 'proto': criteria.append('protocol=%s') formats.append(argument) elif option == 'near': criteria.append("""(previous_msg LIKE %s OR next_msg LIKE %s OR current_msg LIKE %s)""") if '%' not in argument: argument = '%%%s%%' % argument formats.append(argument) formats.append(argument) formats.append(argument) db = self.getDb(channel) cursor = db.cursor() criterion = ' AND '.join(criteria) sql = """SELECT id, url, added, added_by FROM urls WHERE %s ORDER BY id DESC LIMIT 100""" % criterion cursor.execute(sql, *formats) if cursor.rowcount == 0: irc.reply('No URLs matched that criteria.') else: if nolimit: urls = ['<%s>' % t[1] for t in cursor.fetchall()] s = ', '.join(urls) elif simple: s = cursor.fetchone()[1] else: (id, url, added, added_by) = cursor.fetchone() timestamp = time.strftime('%I:%M %p, %B %d, %Y', time.localtime(int(added))) s = '#%s: <%s>, added by %s at %s.' % \ (id, url, added_by, timestamp) irc.reply(s) Class = URL # vim:set shiftwidth=4 tabstop=8 expandtab textwidth=78: