#!/usr/bin/env python ### # Copyright (c) 2002, Jeremiah Fincher # All rights reserved. # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions are met: # # * Redistributions of source code must retain the above copyright notice, # this list of conditions, and the following disclaimer. # * Redistributions in binary form must reproduce the above copyright notice, # this list of conditions, and the following disclaimer in the # documentation and/or other materials provided with the distribution. # * Neither the name of the author of this software nor the name of # contributors to this software may be used to endorse or promote products # derived from this software without specific prior written consent. # # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE # POSSIBILITY OF SUCH DAMAGE. ### __revision__ = "$Id$" import supybot.fix as fix import gc import os import re import csv import sys import sets import time import random import urllib2 import UserDict import threading import supybot.cdb as cdb import supybot.log as log import supybot.conf as conf import supybot.utils as utils import supybot.world as world import supybot.ircutils as ircutils import supybot.webutils as webutils try: mxCrap = {} for (name, module) in sys.modules.items(): if name.startswith('mx'): mxCrap[name] = module sys.modules[name] = None import sqlite for (name, module) in mxCrap.items(): sys.modules[name] = module sqlite.have_datetime = False Connection = sqlite.Connection class MyConnection(sqlite.Connection): def commit(self, *args, **kwargs): if self.autocommit: return else: Connection.commit(self, *args, **kwargs) sqlite.Connection = MyConnection except ImportError: pass class DBHandler(object): def __init__(self, name=None, suffix='.db'): if name is None: self.name = self.__class__.__name__ else: self.name = name if suffix and suffix[0] != '.': suffix = '.' + suffix self.suffix = suffix self.cachedDb = None def makeFilename(self): if self.name.endswith(self.suffix): return self.name else: return self.name + self.suffix def makeDb(self, filename): raise NotImplementedError def getDb(self): if self.cachedDb is None or \ threading.currentThread() is not world.mainThread: db = self.makeDb(self.makeFilename()) else: db = self.cachedDb db.autocommit = 1 return db def die(self): if self.cachedDb is not None: self.cachedDb.die() del self.cachedDb # XXX: This shouldn't be a mixin. This should be contained by classes that # want such behavior. But at this point, it wouldn't gain much for us # to refactor it. class ChannelDBHandler(object): """A class to handle database stuff for individual channels transparently. """ suffix = '.db' def __init__(self, suffix='.db'): self.dbCache = ircutils.IrcDict() suffix = self.suffix if self.suffix and self.suffix[0] != '.': suffix = '.' + suffix self.suffix = suffix def makeFilename(self, channel): """Override this to specialize the filenames of your databases.""" channel = ircutils.toLower(channel) prefix = '%s-%s%s' % (channel, self.__class__.__name__, self.suffix) return os.path.join(conf.supybot.directories.data(), prefix) def makeDb(self, filename): """Override this to create your databases.""" return cdb.shelf(filename) def getDb(self, channel): """Use this to get a database for a specific channel.""" currentThread = threading.currentThread() if channel not in self.dbCache and currentThread == world.mainThread: self.dbCache[channel] = self.makeDb(self.makeFilename(channel)) if currentThread != world.mainThread: db = self.makeDb(self.makeFilename(channel)) else: db = self.dbCache[channel] db.autocommit = 1 return db def die(self): for db in self.dbCache.itervalues(): try: db.commit() except AttributeError: # In case it's not an SQLite database. pass try: db.close() except AttributeError: # In case it doesn't have a close method. pass del db gc.collect() class ChannelUserDictionary(UserDict.DictMixin): IdDict = dict def __init__(self): self.channels = ircutils.IrcDict() def __getitem__(self, (channel, id)): return self.channels[channel][id] def __setitem__(self, (channel, id), v): if channel not in self.channels: self.channels[channel] = self.IdDict() self.channels[channel][id] = v def __delitem__(self, (channel, id)): del self.channels[channel][id] def iteritems(self): for (channel, ids) in self.channels.iteritems(): for (id, v) in ids.iteritems(): yield ((channel, id), v) def keys(self): L = [] for (k, _) in self.iteritems(): L.append(k) return L class ChannelUserDB(ChannelUserDictionary): def __init__(self, filename): ChannelUserDictionary.__init__(self) self.filename = filename try: fd = file(self.filename) except EnvironmentError, e: log.warning('Couldn\'t open %s: %s.', self.filename, e) return reader = csv.reader(fd) try: lineno = 0 for t in reader: lineno += 1 try: channel = t.pop(0) id = t.pop(0) try: id = int(id) except ValueError: # We'll skip over this so, say, nicks can be kept here. pass v = self.deserialize(channel, id, t) self[channel, id] = v except Exception, e: log.warning('Invalid line #%s in %s.', lineno, self.__class__.__name__) log.debug('Exception: %s', utils.exnToString(e)) except Exception, e: # This catches exceptions from csv.reader. log.warning('Invalid line #%s in %s.', lineno, self.__class__.__name__) log.debug('Exception: %s', utils.exnToString(e)) def flush(self): fd = utils.AtomicFile(self.filename) writer = csv.writer(fd) items = self.items() if not items: log.warning('%s: Refusing to write blank file.', self.__class__.__name__) fd.rollback() return items.sort() for ((channel, id), v) in items: L = self.serialize(v) L.insert(0, id) L.insert(0, channel) writer.writerow(L) fd.close() def close(self): self.flush() self.clear() def deserialize(self, channel, id, L): """Should take a list of strings and return an object to be accessed via self.get(channel, id).""" raise NotImplementedError def serialize(self, x): """Should take an object (as returned by self.get(channel, id)) and return a list (of any type serializable to csv).""" raise NotImplementedError class PeriodicFileDownloader(object): """A class to periodically download a file/files. A class-level dictionary 'periodicFiles' maps names of files to three-tuples of (url, seconds between downloads, function to run with downloaded file). 'url' should be in some form that urllib2.urlopen can handle (do note that urllib2.urlopen handles file:// links perfectly well.) 'seconds between downloads' is the number of seconds between downloads, obviously. An important point to remember, however, is that it is only engaged when a command is run. I.e., if you say you want the file downloaded every day, but no commands that use it are run in a week, the next time such a command is run, it'll be using a week-old file. If you don't want such behavior, you'll have to give an error mess age to the user and tell him to call you back in the morning. 'function to run with downloaded file' is a function that will be passed a string *filename* of the downloaded file. This will be some random filename probably generated via some mktemp-type-thing. You can do what you want with this; you may want to build a database, take some stats, or simply rename the file. You can pass None as your function and the file with automatically be renamed to match the filename you have it listed under. It'll be in conf.supybot.directories.data, of course. Aside from that dictionary, simply use self.getFile(filename) in any method that makes use of a periodically downloaded file, and you'll be set. """ periodicFiles = None def __init__(self): if self.periodicFiles is None: raise ValueError, 'You must provide files to download' self.lastDownloaded = {} self.downloadedCounter = {} for filename in self.periodicFiles: if self.periodicFiles[filename][-1] is None: fullname = os.path.join(conf.supybot.directories.data(), filename) if os.path.exists(fullname): self.lastDownloaded[filename] = os.stat(fullname).st_ctime else: self.lastDownloaded[filename] = 0 else: self.lastDownloaded[filename] = 0 self.currentlyDownloading = sets.Set() self.downloadedCounter[filename] = 0 self.getFile(filename) def _downloadFile(self, filename, url, f): self.currentlyDownloading.add(filename) try: try: infd = webutils.getUrlFd(url) except IOError, e: self.log.warning('Error downloading %s: %s', url, e) return except webutils.WebError, e: self.log.warning('Error downloading %s: %s', url, e) return confDir = conf.supybot.directories.data() newFilename = os.path.join(confDir, utils.mktemp()) outfd = file(newFilename, 'wb') start = time.time() s = infd.read(4096) while s: outfd.write(s) s = infd.read(4096) infd.close() outfd.close() self.log.info('Downloaded %s in %s seconds', filename, time.time()-start) self.downloadedCounter[filename] += 1 self.lastDownloaded[filename] = time.time() if f is None: toFilename = os.path.join(confDir, filename) if os.name == 'nt': # Windows, grrr... if os.path.exists(toFilename): os.remove(toFilename) os.rename(newFilename, toFilename) else: start = time.time() f(newFilename) total = time.time() - start self.log.info('Function ran on %s in %s seconds', filename, total) finally: self.currentlyDownloading.remove(filename) def getFile(self, filename): if world.documenting: return (url, timeLimit, f) = self.periodicFiles[filename] if time.time() - self.lastDownloaded[filename] > timeLimit and \ filename not in self.currentlyDownloading: self.log.info('Beginning download of %s', url) args = (filename, url, f) name = '%s #%s' % (filename, self.downloadedCounter[filename]) t = threading.Thread(target=self._downloadFile, name=name, args=(filename, url, f)) t.setDaemon(True) t.start() world.threadsSpawned += 1 _randomnickRe = re.compile(r'\$rand(?:om)?nick', re.I) _randomdateRe = re.compile(r'\$rand(?:om)?date', re.I) _randomintRe = re.compile(r'\$rand(?:omint)?', re.I) _channelRe = re.compile(r'\$channel', re.I) _whoRe = re.compile(r'\$(?:who|nick)', re.I) _botnickRe = re.compile(r'\$botnick', re.I) _todayRe = re.compile(r'\$(?:today|date)', re.I) _nowRe = re.compile(r'\$(?:now|time)', re.I) _userRe = re.compile(r'\$user', re.I) _hostRe = re.compile(r'\$host', re.I) def standardSubstitute(irc, msg, text): """Do the standard set of substitutions on text, and return it""" if ircutils.isChannel(msg.args[0]): channel = msg.args[0] else: channel = 'somewhere' def randInt(m): return str(random.randint(-1000, 1000)) def randDate(m): t = pow(2,30)*random.random()+time.time()/4.0 return time.ctime(t) def randNick(m): if channel != 'somewhere': return random.choice(list(irc.state.channels[channel].users)) else: return 'someone' text = _channelRe.sub(channel, text) text = _randomnickRe.sub(randNick, text) text = _randomdateRe.sub(randDate, text) text = _randomintRe.sub(randInt, text) text = _whoRe.sub(msg.nick, text) text = _botnickRe.sub(irc.nick, text) text = _todayRe.sub(time.ctime(), text) text = _nowRe.sub(time.ctime(), text) text = _userRe.sub(msg.user, text) text = _hostRe.sub(msg.host, text) return text # vim:set shiftwidth=4 tabstop=8 expandtab textwidth=78: