2 import string, cPickle, random, urllib, sys, time, re, os, twitter, subprocess, datetime, urlparse
3 from collections import defaultdict
4 from irclib import irc_lower, nm_to_n
# karmaq: answer a karma query.
# The item asked about is the second word of cmd, lower-cased.  Replies go out
# through bot.automsg(public, nick, ...): a count of items, the karma held for
# the item, or a note that the item has no karma set.
# dict.has_key() is Python 2 only.
# NOTE(review): only part of the branching that picks between those replies is
# visible in this excerpt - confirm the conditions against the complete file.
7 def karmaq(bot, cmd, nick, conn, public, karma):
9 item=cmd.split()[1].lower()
13 bot.automsg(public,nick,"I have karma on %s items." %
15 elif karma.has_key(item):
16 bot.automsg(public,nick,"%s has karma %s."
19 bot.automsg(public,nick, "%s has no karma set." % item)
# karmadelq: handle a request to delete one item from the karma dictionary.
# The item is the second word of cmd, lower-cased.  All feedback is sent to the
# requester with conn.notice(): a prompt when nothing was named, a refusal for
# non-owners, and either a confirmation or "no karma stored".
# NOTE(review): the owner test and the statement that actually removes the key
# are not visible in this excerpt - confirm against the complete file.
22 def karmadelq(bot, cmd, nick, conn, public, karma):
24 item=cmd.split()[1].lower()
26 conn.notice(nick, "What should I delete?")
29 conn.notice(nick, "You are not my owner.")
# dict.has_key() is Python 2 only
31 if karma.has_key(item):
33 conn.notice(nick, "Item %s deleted."%item)
35 conn.notice(nick, "There is no karma stored for %s."%item)
# help - tell the requester where the help file lives
def helpq(bot, cmd, nick, conn, public):
    """Send the URL of the online help page back via bot.automsg()."""
    help_text = "For help see http://www.chiark.greenend.org.uk/~matthewv/irc/servus.html"
    bot.automsg(public, nick, help_text)
def infoq(bot, cmd, nick, conn, public, karma):
    """Report the bot's revision, channel, current nick, owner and karma count."""
    template = ("I am Acrobat %s, on %s, as nick %s. "
                "My owner is %s; I have karma on %s items.")
    details = (
        bot.revision.split()[1],  # second word of the revision string
        bot.channel,
        conn.get_nickname(),
        bot.owner,
        len(karma.keys()),
    )
    bot.automsg(public, nick, template % details)
51 # Check on fish stocks
# NOTE(review): the def line of this routine is not visible in this excerpt;
# the visible body operates on an object called pond.
# Nothing below the next line applies until pond.quotatime has been reached.
54 if time.time()>=pond.quotatime:
# When more than fish_time_inc seconds have passed since quotatime, add
# (elapsed / fish_time_inc) * fish_inc to the current stock ...
58 if (time.time()-pond.quotatime)>pond.fish_time_inc:
59 pond.cur_fish+=(((time.time()-pond.quotatime)
60 /pond.fish_time_inc)*pond.fish_inc)
# ... but never let the stock exceed max_fish.
61 if pond.cur_fish>pond.max_fish:
62 pond.cur_fish=pond.max_fish
# Restart the clock from now.
63 pond.quotatime=time.time()
65 # List of things the bot might be called to work round the self-trouting code
# troutq and slashq compare irc_lower(target) against these entries, so the
# entries are written in lower case.
66 synonyms=["itself","the bot","themself"]
68 # trout someone, or flirt with them
# The target is everything in cmd after the first word.  One message is picked
# at random from fishlist, remembered in fishpond.last, and finally sent as a
# channel action with the target substituted in.
# NOTE(review): fishlist and the message templates (quietmsg, nofishmsg,
# notargetmsg, selftrout) are assigned on lines not visible in this excerpt -
# presumably from cfg, like selftroutchance; confirm.
69 def troutq(bot, cmd, nick, conn, public, cfg):
76 selftroutchance=cfg[6]
80 conn.notice(nick, quietmsg%fishpond.Boring_Git)
# No fish left: tell the requester privately.
82 if fishpond.cur_fish<=0:
83 conn.notice(nick, nofishmsg)
85 target = string.join(cmd.split()[1:])
87 conn.notice(nick, notargetmsg)
89 me = bot.connection.get_nickname()
90 trout_msg = random.choice(fishlist)
# Remember the message used (blameq reads fish.last for "#last").
91 fishpond.last=trout_msg
92 # The bot won't trout or flirt with itself;
93 if irc_lower(me) == irc_lower(target) or irc_lower(target) in synonyms:
95 # There's a chance the game may be given away if the request was not
# With probability selftroutchance the requester's nick is appended.
98 if random.random()<=selftroutchance:
99 trout_msg=trout_msg+(selftrout%nick)
101 conn.action(bot.channel, trout_msg % target)
# slashq: pair two names in a random message from fishlist.
# The two names are taken from cmd (after the first word), separated by ' / ';
# the chosen message is remembered in fishpond.last and sent as a channel
# action with both names substituted in.
# NOTE(review): fishlist and the templates quietmsg, nofishmsg and selfslash
# are assigned on lines not visible in this excerpt; several conditions guarding
# the notices below are likewise not visible - confirm against the full file.
105 def slashq(bot, cmd, nick, conn, public, cfg):
112 selfslashchance=cfg[6]
116 conn.notice(nick, quietmsg%fishpond.Boring_Git)
# No fish left: tell the requester privately.
118 if fishpond.cur_fish<=0:
119 conn.notice(nick, nofishmsg)
121 target = string.join(cmd.split()[1:])
122 #who = cmd.split()[1:]
# Re-join the words so that names containing spaces survive, then split on ' / '.
123 who = ' '.join(cmd.split()[1:]).split(' / ')
125 conn.notice(nick, "it takes two to tango!")
128 conn.notice(nick, "we'll have none of that round here")
130 me = bot.connection.get_nickname()
131 slash_msg = random.choice(fishlist)
132 fishpond.last=slash_msg
133 # The bot won't slash people with themselves
134 if irc_lower(who[0]) == irc_lower(who[1]):
135 conn.notice(nick, "oooooh no missus!")
137 # The bot won't slash with itself, instead slashing the requester
# NOTE(review): n is bound on a line not visible here - presumably a loop
# index over the entries of who.
139 if irc_lower(me) == irc_lower(who[n]) or irc_lower(who[n]) in synonyms:
141 # Perhaps someone asked to slash themselves with the bot then we get
142 if irc_lower(who[0]) == irc_lower(who[1]):
143 conn.notice(nick, "you wish!")
145 # There's a chance the game may be given away if the request was not
# With probability selfslashchance the requester's nick is appended.
148 if random.random()<=selfslashchance:
149 slash_msg=slash_msg+(selfslash%nick)
151 conn.action(bot.channel, slash_msg % (who[0], who[1]))
# unitq: unit conversion by running the external "units" program.
# Arguments come from cmd (after the first word), split on ' as ' or ' / '.
# The program is started with an argument list; "--" precedes the user-supplied
# values.  os.popen4 exists only in Python 2.
# NOTE(review): the conditions choosing between the two splits and the two
# popen4 calls, and the lines that read the output into res and collect the
# child status into child, are not visible in this excerpt.
155 def unitq(bot, cmd, nick, conn, public):
156 args = ' '.join(cmd.split()[1:]).split(' as ')
158 args = ' '.join(cmd.split()[1:]).split(' / ')
160 conn.notice(nick, "syntax: units arg1 as arg2")
# One argument only
163 sin,sout=os.popen4(["units","--verbose","--",args[0]],"r")
# Two arguments
165 sin,sout=os.popen4(["units","--verbose","--",args[0],args[1]],"r")
168 #popen2 doesn't clean up the child properly. Do this by hand
# Exit status 0: send the first output line the normal way; otherwise send
# every output line, stripped and joined with '; ', as a private notice.
170 if os.WEXITSTATUS(child[1])==0:
171 bot.automsg(public,nick,res[0].strip())
173 conn.notice(nick,'; '.join(map(lambda x: x.strip(),res)))
175 # Shut up trouting for a minute
# Sets fish.quotatime to the current time plus fish.nofish_time and confirms to
# the requester by notice.
# NOTE(review): original lines between the def and the first assignment are
# not visible in this excerpt - there may be further state changes or a guard.
176 def nofishq(bot, cmd, nick, conn, public, fish):
180 fish.quotatime=time.time()
181 fish.quotatime+=fish.nofish_time
182 conn.notice(nick, "Fish stocks depleted, as you wish.")
# reloadq: reload the bot's configuration on request.
# Only honoured when the request arrives privately (public is false) and the
# nick matches bot.owner, compared case-insensitively via irc_lower.
# NOTE(review): the reload call itself and the construct that selects between
# the success and failure notices are not visible in this excerpt.
185 def reloadq(bot, cmd, nick, conn, public):
186 if not public and irc_lower(nick) == irc_lower(bot.owner):
189 conn.notice(nick, "Config reloaded.")
191 conn.notice(nick, "Config reloading failed!")
193 bot.automsg(public,nick,
194 "Configuration can only be reloaded by my owner, by /msg.")
# quitq: shut the bot down when its owner asks.
# The owner check compares nicks case-insensitively via irc_lower; on a match
# bot.die() is called with a farewell message.
# NOTE(review): the branches selecting between the two refusal notices are not
# visible in this excerpt.
197 def quitq(bot, cmd, nick, conn, public):
198 if irc_lower(nick) == irc_lower(bot.owner):
199 bot.die(msg = "I have been chosen!")
201 conn.notice(nick, "Such aggression in public!")
203 conn.notice(nick, "You're not my owner.")
205 # google for something
# The search terms are everything in cmd after the first word, URL-quoted with
# urllib.quote_plus.  urllib.urlopen / urllib.quote_plus are the Python 2 API.
# NOTE(review): the "try:" matching the "except IOError" below is not visible
# in this excerpt.
206 def googleq(bot, cmd, nick, conn, public):
207 cmdrest = string.join(cmd.split()[1:])
208 # "I'm Feeling Lucky" rather than try and parse the html
209 targ = ("http://www.google.com/search?q=%s&btnI=I'm+Feeling+Lucky"
210 % urllib.quote_plus(cmdrest))
212 # get redirected and grab the resulting url for returning
213 gsearch = urllib.urlopen(targ).geturl()
# A final URL equal to the request URL means no redirect took place.
214 if gsearch != targ: # we've found something
215 bot.automsg(public,nick,str(gsearch))
216 else: # we haven't found anything.
217 bot.automsg(public,nick,"No pages found.")
218 except IOError: # if the connection times out. This blocks. :(
219 bot.automsg(public,nick,"The web's broken. Waah!")
221 # Look up the definition of something using google
# The function first tells the requester that 'define' is broken.
# NOTE(review): an original line right after that message is not visible in
# this excerpt - if it is a return, everything below is dead code kept for
# reference; confirm.  The "try:" and the branches around the two replies
# near the end are also not visible.
222 def defineq(bot, cmd, nick, conn, public):
223 #this doesn't work any more
224 bot.automsg(public,nick,"'define' is broken because google are bastards :(")
226 cmdrest = string.join(cmd.split()[1:])
# %%3A in the template is a literal "%3A", the URL-encoded ':' of "define:".
227 targ = ("http://www.google.co.uk/search?q=define%%3A%s&ie=utf-8&oe=utf-8"
228 % urllib.quote_plus(cmdrest))
230 # Just slurp everything into a string
231 defnpage = urllib.urlopen(targ).read()
232 # For definitions we really do have to parse the HTML, sadly.
233 # This is of course going to be a bit fragile. We first look for
234 # 'Definitions of %s on the Web' -- if this isn't present we
235 # assume we have the 'no definitions found page'.
236 # The first defn starts after the following <p> tag, but as the
237 # first <li> in a <ul type="disc" class=std>
238 # Following that we assume that each definition is all the non-markup
239 # before a <br> tag. Currently we just dump out the first definition.
# Group 1 of the pattern is the text after the first <li>, up to <br> or <li>.
240 match = re.search(r"Definitions of <b>.*?</b> on the Web.*?<li>\s*([^>]*)((<br>)|(<li>))",defnpage,re.MULTILINE)
242 bot.automsg(public,nick,"Some things defy definition.")
244 # We assume google has truncated the definition for us so this
245 # won't flood the channel with text...
# Newlines inside the definition are turned into spaces.
246 defn = " ".join(match.group(1).split("\n"))
247 bot.automsg(public,nick,defn)
248 except IOError: # if the connection times out. This blocks. :(
249 bot.automsg(public,nick,"The web's broken. Waah!")
251 # Look up a currency conversion via xe.com
# Expected command form: "<command> XXX as YYY" with two three-character codes.
# NOTE(review): the line after the syntax notice, the "try:", and the branches
# around the two replies below are not visible in this excerpt.
252 def currencyq(bot, cmd, nick, conn, public):
253 args = ' '.join(cmd.split()[1:]).split(' as ')
# Exactly two arguments, each exactly three characters long, are required.
254 if len(args) != 2 or len(args[0]) != 3 or len(args[1]) != 3:
255 conn.notice(nick, "syntax: currency arg1 as arg2")
257 targ = ("http://www.xe.com/ucc/convert.cgi?From=%s&To=%s" % (args[0], args[1]))
259 currencypage = urllib.urlopen(targ).read()
# Look for "1 XXX = <number> YYY" in the page, with the codes upper-cased.
260 match = re.search(r"(1 %s = [\d\.]+ %s)" % (args[0].upper(),args[1].upper()),currencypage,re.MULTILINE)
262 bot.automsg(public,nick,"Dear Chief Secretary, there is no money.")
264 conversion = match.group(1);
265 conversion = conversion.replace(' ',' ');
266 bot.automsg(public,nick,conversion + " (from xe.com)")
267 except IOError: # if the connection times out. This blocks. :(
268 bot.automsg(public,nick,"The web's broken. Waah!")
271 ### extract the commit message and timestamp for commit
# Runs "git log -n 1" on the given commit with a format of
# "<committer timestamp>|<subject>" and returns (subject, date) on success.
# NOTE(review): original lines between communicate() and the split are not
# visible in this excerpt; __getcommits treats a length-1 result as an error,
# so an error path presumably lives there.
272 def __getcommitinfo(commit):
273 cmd=["git","log","-n","1","--pretty=format:%ct|%s",commit]
274 x=subprocess.Popen(cmd,
275 stdout=subprocess.PIPE,stderr=subprocess.PIPE)
276 out,err=x.communicate()
# NOTE(review): a subject that itself contains '|' yields more than two fields
# and this unpacking raises ValueError; out.split('|', 1) would avoid that.
281 ts,mes=out.split('|')
282 when=datetime.date.fromtimestamp(float(ts))
283 return mes.strip(), when
285 ###Return an array of commit messages and timestamps for lines in db that match what
# Each successful lookup is appended to ans as (k, message, date), where db[k]
# is the commit handed to __getcommitinfo.
# NOTE(review): the loop that binds k and the matching against "what" are not
# visible in this excerpt.
286 def __getcommits(db,keys,what):
290 ret=__getcommitinfo(db[k])
# A length-1 result signals failure; the whole call then returns a one-element
# list holding an error string.
291 if len(ret)==1: #error message
292 return ["Error message from git blame: %s" % ret]
294 ans.append( (k,ret[0],ret[1]) )
297 ###search all three databases for what
# Each database/key-list pair is searched with __getcommits and the three
# result lists are concatenated in the order: tdb, fdb, sdb.
# NOTE(review): original lines between the def and the first search are not
# visible in this excerpt.
298 def __getall(tdb,tdbk,fdb,fdbk,sdb,sdbk,what):
301 tans=__getcommits(tdb,tdbk,what)
302 fans=__getcommits(fdb,fdbk,what)
303 sans=__getcommits(sdb,sdbk,what)
304 return tans+fans+sans
# blameq: report which commit last touched a trout/flirt/slash message.
# The first argument selects the search: "#last" looks up fish.last in all
# three databases; "#trout(s)", "#flirt(s)" and "#slash(es)" search a single
# database for the remaining words; anything else searches all three databases
# for the whole argument string.
# NOTE(review): clist is bound on a line not visible here (presumably
# cmd.split()), as are the conditions choosing between the replies at the end.
306 def blameq(bot,cmd,nick,conn,public,fish,tdb,tdbk,fdb,fdbk,sdb,sdbk):
309 bot.automsg(public,nick,"Who or what do you want to blame?")
# Search text used when the first argument is one of the '#' selectors.
311 cwhat=' '.join(clist[2:])
312 if clist[1]=="#last":
313 ans=__getall(tdb,tdbk,fdb,fdbk,sdb,sdbk,fish.last)
314 elif clist[1]=="#trouts" or clist[1]=="#trout":
315 ans=__getcommits(tdb,tdbk,cwhat)
316 elif clist[1]=="#flirts" or clist[1]=="#flirt":
317 ans=__getcommits(fdb,fdbk,cwhat)
318 elif clist[1]=="#slashes" or clist[1]=="#slash":
319 ans=__getcommits(sdb,sdbk,cwhat)
# No selector: every word after the command is part of the search text.
321 cwhat=' '.join(clist[1:])
322 ans=__getall(tdb,tdbk,fdb,fdbk,sdb,sdbk,cwhat)
324 bot.automsg(public,nick,"No match found")
# An entry of ans is either a plain error string (sent as-is) or a
# (key, message, date) tuple as built by __getcommits.
327 bot.automsg(public,nick,ans[0])
329 bot.automsg(public,nick,"Modified %s: %s" % (ans[0][2].isoformat(),ans[0][1]))
331 bot.automsg(public,nick,"I found %d matches, which is too many. Please be more specific!" % (len(ans)) )
335 bot.automsg(public,nick,a)
337 bot.automsg(public,nick,"'%s' modified on %s: %s" % (a[0],a[2].isoformat(),a[1]))
339 ### say to msg/channel
# When the requester is the owner (case-insensitive nick comparison), the rest
# of cmd after the first word is sent to bot.channel as an ordinary message.
# NOTE(review): original lines between the privmsg and the refusal notice are
# not visible in this excerpt.
340 def sayq(bot, cmd, nick, conn, public):
341 if irc_lower(nick) == irc_lower(bot.owner):
342 conn.privmsg(bot.channel, string.join(cmd.split()[1:]))
345 conn.notice(nick, "You're not my owner!")
347 ### action to msg/channel
# When the requester is the owner (case-insensitive nick comparison), the rest
# of cmd after the first word is sent to bot.channel as an action.
# NOTE(review): the branch line before the refusal notice is not visible in
# this excerpt.
348 def doq(bot, cmd, nick, conn, public):
# The lower-cased owner and requester nicks are written to stderr on every
# call, with no separator or newline - this looks like leftover debugging.
349 sys.stderr.write(irc_lower(bot.owner))
350 sys.stderr.write(irc_lower(nick))
352 if irc_lower(nick) == irc_lower(bot.owner):
353 conn.action(bot.channel, string.join(cmd.split()[1:]))
355 conn.notice(nick, "You're not my owner!")
def disconnq(bot, cmd, nick, conn, public):
    """Disconnect the bot when cmd is exactly "disconnect"; otherwise do nothing."""
    if cmd != "disconnect":
        return
    # hop off for 60s
    bot.disconnect(msg="Be right back.")
362 ### list keys of a dictionary
# The reply is the entries of d joined with single spaces (string.join's
# default separator), sent through bot.automsg.
# The parameter named "dict" shadows the built-in type inside this function.
# NOTE(review): the lines that build d (and apply the sort flag) are not
# visible in this excerpt.
363 def listkeysq(bot, cmd, nick, conn, public, dict, sort=False):
367 bot.automsg(public,nick,string.join(d))
369 ### rot13 text (yes, I could have typed out the letters....)
370 ### also "foo".encode('rot13') would have worked
# The text after the first word of cmd is translated and sent back to the
# requester as a notice.  string.maketrans is the Python 2 API.
371 def rot13q(bot, cmd, nick, conn, public):
# a is the lowercase alphabet "abc...z"
372 a=''.join(map(chr,range((ord('a')),(ord('z')+1))))
# NOTE(review): b is defined on a line not visible in this excerpt -
# presumably a rotated by 13 places.
# The table maps lower- and upper-case letters alike.
374 trans=string.maketrans(a+a.upper(),b+b.upper())
375 conn.notice(nick, string.join(cmd.split()[1:]).translate(trans))
377 ### URL-tracking stuff
379 ### return a easy-to-read approximation of a time period
# tempus is a duration in seconds; the text is expressed in whole seconds,
# minutes (tempus/60) or hours (tempus/3600), truncated with int().
# NOTE(review): the thresholds selecting between the three forms, and the
# return statement, are not visible in this excerpt.
380 def nicetime(tempus):
382 tm="%d seconds ago"%int(tempus)
384 tm="%d minutes ago"%int(tempus/60)
386 tm="%d hours ago"%int(tempus/3600)
389 ### class to store URL data
# NOTE(review): the class statement itself is not visible in this excerpt;
# other code constructs instances as UrlLog(url, nick).
391 "contains meta-data about a URL seen on-channel"
392 def __init__(self,url,nick):
# Three timestamps are kept: first sighting, last sighting on channel, and
# last time somebody asked about the URL.
# NOTE(review): the assignments of url, nick and count are on lines not
# visible in this excerpt.
395 self.first=time.time()
397 self.lastseen=time.time()
398 self.lastasked=time.time()
# Most recent activity of either kind; urlexpire compares this against the
# expiry age.
399 def recenttime(self):
400 return max(self.lastseen,self.lastasked)
# NOTE(review): presumably the body of firstmen() - age of the first sighting
# as human-readable text.
402 return nicetime(time.time()-self.first)
# NOTE(review): presumably the body of urltype() - picks a phrase from
# urlcomplaints by self.count, clamped to the last entry of the list.
404 z=min(len(urlcomplaints)-1, self.count-1)
405 return urlcomplaints[z]
407 #(?:) is a regexp that doesn't group
# urlre: an http/https/nsfw/nsfws URL up to the next space or end of string;
# group 1 is the URL itself.
408 urlre = re.compile(r"((?:(?:http)|(?:nsfw))s?://[^ ]+)( |$)")
# hturlre: http/https only, with the scheme word "http" captured separately
# (group 1) from the rest of the URL (group 2).
409 hturlre= re.compile(r"(http)(s?://[^ ]+)( |$)")
410 #matches \bre\:?\s+ before a regexp; (?i)==case insensitive match
# shibboleth: a URL preceded by "re" or "re:"; dourl does not announce a
# repeated URL when this matches.
411 shibboleth = re.compile(r"(?i)\bre\:?\s+((?:(?:http)|(?:nsfw))s?://[^ ]+)( |$)")
# Phrases indexed by how often a URL has been seen (see the urlcomplaints
# lookup in the URL log class).
# NOTE(review): the rest of this list is not visible in this excerpt.
412 urlcomplaints = ["a new",
417 ### Deal with /msg bot url or ~url in channel
# The URL is pulled out of cmd with urlre, canonicalised, and used as the key
# into urldb.  A known URL earns the requester a private complaint; otherwise
# the URL is recorded and relayed.
# NOTE(review): the lookup that binds T and the conditions separating the
# known/unknown and public/private cases are not visible in this excerpt.
418 def urlq(bot, cmd, nick, conn, public,urldb):
419 if (not urlre.search(cmd)):
420 bot.automsg(False,nick,"Please use 'url' only with http, https, nsfw, or nsfws URLs")
423 urlstring=urlre.search(cmd).group(1)
424 url=canonical_url(urlstring)
427 complaint="That's %s URL that was first mentioned %s by %s" % \
428 (T.urltype(),T.firstmen(),T.nick)
430 complaint=complaint+". Furthermore it defeats the point of this command to use it other than via /msg."
# False as the first argument: always answer privately.
432 bot.automsg(False,nick,complaint)
433 T.lastasked=time.time()
434 #URL suppressed, so mention in #urls
# Two relay formats: "<nick> remarks: ..." when text precedes the URL,
# "(via <nick>) ..." when the URL is the first argument.
435 if urlstring != cmd.split()[1]: #first argument to URL was not the url
436 conn.privmsg("#urls","%s remarks: %s" % (nick," ".join(cmd.split()[1:])))
438 conn.privmsg("#urls","(via %s) %s"%(nick," ".join(cmd.split()[1:])))
441 bot.automsg(False,nick,"That URL was unique. There is little point in using !url out loud; please use it via /msg")
# Same two formats, this time relayed to the bot's own channel.
443 if urlstring != cmd.split()[1]: #first argument to URL was not the url
444 conn.privmsg(bot.channel,"%s remarks: %s" % (nick," ".join(cmd.split()[1:])))
446 conn.privmsg(bot.channel,"(via %s) %s"%(nick," ".join(cmd.split()[1:])))
# Record the URL under its canonical form.
447 urldb[url]=UrlLog(url,nick)
449 ### Deal with URLs spotted in channel
# The first URL in command is canonicalised and looked up in urldb.  A URL
# already present is announced as a channel action unless the line matches
# shibboleth ("re: <url>"); a URL not present is recorded.
# The caller must only pass lines that match urlre: .group(1) is called on the
# search result without a None check.
# NOTE(review): the line that binds T and the else-branch line are not visible
# in this excerpt.
450 def dourl(bot,conn,nick,command,urldb):
451 urlstring=urlre.search(command).group(1)
452 urlstring=canonical_url(urlstring)
454 if urlstring in urldb:
456 message="observes %s URL, first mentioned %s by %s" % \
457 (T.urltype(),T.firstmen(),T.nick)
458 if shibboleth.search(command)==None:
459 conn.action(bot.channel, message)
460 T.lastseen=time.time()
463 urldb[urlstring]=UrlLog(urlstring,nick)
# urlexpire: age out entries of urldb.
# An entry qualifies when more than `expire` seconds have passed since its
# recenttime() (the later of last seen / last asked).
# NOTE(review): the loop binding u and the action taken on qualifying entries
# are not visible in this excerpt - presumably the entry is deleted.
466 def urlexpire(urldb,expire):
469 if time.time() - urldb[u].recenttime() > expire:
# canonicalise BBC URLs (internal use only)
def canonical_url(urlstring):
    """Return the canonical form of *urlstring*, as used for URL-database keys.

    Two rewrites are applied:

    * the pseudo-schemes ``nsfw://`` and ``nsfws://`` become ``http://`` and
      ``https://`` (only the first "nsfw" in the string is replaced);
    * on news.bbc.co.uk URLs the ``/low/`` and ``/mobile/`` path components
      become ``/hi/``, so every edition of a page maps to the same string.

    Any other URL is returned unchanged.
    """
    if "nsfw://" in urlstring or "nsfws://" in urlstring:
        urlstring = urlstring.replace("nsfw", "http", 1)
    if "news.bbc.co.uk" in urlstring:
        for middle in ("/low/", "/mobile/"):
            # str.replace returns a new string and leaves the original alone,
            # so the result has to be assigned back (it used to be discarded,
            # which made this rewrite a no-op).
            urlstring = urlstring.replace(middle, "/hi/")
    return urlstring
483 # automatically make nsfw urls for you and pass them on to url
# Commands without an http/https URL are rejected with a private message;
# otherwise every hturlre match in cmd is rewritten by nsfwify and the
# rewritten command is handed to urlq.
# NOTE(review): nsfwify is defined outside this excerpt, and the line after
# the rejection message (presumably a return) is not visible.
484 def nsfwq(bot,cmd,nick,conn,public,urldb):
485 if (not hturlre.search(cmd)):
486 bot.automsg(False,nick,"Please use 'nsfw' only with http or https URLs")
488 newcmd=hturlre.sub(nsfwify,cmd)
489 urlq(bot,newcmd,nick,conn,public,urldb)
# twitterq: fetch the tweet behind a twitter.com URL and relay it.
# The URL is taken from cmd with urlre; only URLs containing "twitter.com"
# are passed to getTweet, and each returned string is sent via bot.automsg.
# NOTE(review): urlre also accepts nsfw:// URLs although the error text below
# mentions only http/https.  The lines after the error message are not
# visible in this excerpt.
496 def twitterq(bot,cmd,nick,conn,public,twitapi):
498 if (not urlre.search(cmd)):
499 bot.automsg(False,nick,"Please use 'twit' only with http or https URLs")
502 urlstring = urlre.search(cmd).group(1)
503 if (urlstring.find("twitter.com") !=-1):
504 stringsout = getTweet(urlstring,twitapi)
# NOTE(review): getTweet has early exits that return a plain string; iterating
# over such a result here would send it one character at a time.
505 for stringout in stringsout:
506 bot.automsg(public, nick, stringout)
# getTweet: turn a tweet URL into one or more display strings.
# The status is fetched with twitapi.GetStatus; media links and shortened or
# tracked URLs in the text are rewritten, and tweets linked from the text are
# expanded recursively (recurlvl counts the nesting depth).
# NOTE(review): many original lines of this function are not visible in this
# excerpt (try/else/if lines, the tweetID extraction, the shortener test), so
# the comments below describe only the visible statements.
508 def getTweet(urlstring,twitapi,inclusion=False,recurlvl=0):
# Feature switches, fixed to True here.
509 unobfuscate_urls=True
510 expand_included_tweets=True
513 parts = string.split(urlstring,'/')
516 status = twitapi.GetStatus(tweetID)
# NOTE(review): the two early exits below return a plain string, whereas the
# final returns yield a list of strings - callers that iterate the result
# should be checked.
518 return "twitapi.GetStatus returned nothing :-("
519 if status.user == None and status.text == None:
520 return "Empty status object returned :("
# For a retweet, switch to the retweeted status.
521 if status.retweeted_status and status.retweeted_status.text:
522 status = status.retweeted_status
523 if status.user is not None:
524 tweeter_screen = status.user.screen_name #.encode('UTF-8', 'replace')
525 tweeter_name = status.user.name #.encode('UTF-8', 'replace')
527 tweeter_screen = "[not returned]" ; tweeter_name = "[not returned]"
528 tweeter_name = tweeter_name + " RTing " + status.user.name #.encode('UTF-8', 'replace')
529 tweetText = status.full_text
# Group media links by the URL that stands for them in the tweet text.
531 replacements = defaultdict( list )
532 for medium in status.media:
533 replacements[medium.url].append(medium.media_url_https)
535 for k,v in replacements.items():
# Rewrite video thumbnail links (.jpg) into the matching .mp4 video links.
537 v = [re.sub(r"/tweet_video_thumb/([\w\-]+).jpg", r"/tweet_video/\1.mp4", link) for link in v]
# Several links are shown as "[a ; b]"; a single link is shown bare.
539 replacementstring = "[" + " ; ".join(v) +"]"
541 replacementstring = v[0]
542 tweetText = tweetText.replace(k, replacementstring)
544 for url in status.urls:
545 toReplace = url.expanded_url
549 rv = urlparse.urlparse(toReplace)
551 # sourced from http://bit.do/list-of-url-shorteners.php
552 "bit.do", "t.co", "lnkd.in", "db.tt", "qr.ae", "adf.ly",
553 "goo.gl", "bitly.com", "cur.lv", "tinyurl.com", "ow.ly",
554 "bit.ly", "adcrun.ch", "ity.im", "q.gs", "viralurl.com",
555 "is.gd", "po.st", "vur.me", "bc.vc", "twitthis.com", "u.to",
556 "j.mp", "buzurl.com", "cutt.us", "u.bb", "yourls.org",
557 "crisco.com", "x.co", "prettylinkpro.com", "viralurl.biz",
558 "adcraft.co", "virl.ws", "scrnch.me", "filoops.info", "vurl.bz",
559 "vzturl.com", "lemde.fr", "qr.net", "1url.com", "tweez.me",
560 "7vd.cn", "v.gd", "dft.ba", "aka.gr", "tr.im",
564 #expand list as needed.
# The link is looked up at urlex.org, which answers with the expanded URL as
# plain text; this is a blocking network request.
565 response = urllib.urlopen('http://urlex.org/txt/' + toReplace)
566 resptext = response.read()
567 if resptext.startswith('http'): # ie it looks urlish (http or https)
568 if resptext != toReplace:
570 # maybe make a note of the domain of the original URL to compile list of shortenable domains?
572 # remove tracking utm_ query parameters, for privacy and brevity
573 # code snippet from https://gist.github.com/lepture/5997883
574 rv = urlparse.urlparse(toReplace)
576 query = re.sub(r'utm_\w+=[^&]+&?', '', rv.query)
# NOTE(review): the URL is rebuilt from scheme, hostname and path (plus query)
# only, so any port, credentials or fragment in the original is dropped.
578 toReplace = '%s://%s%s?%s' % (rv.scheme, rv.hostname, rv.path, query)
580 toReplace = '%s://%s%s' % (rv.scheme, rv.hostname, rv.path) # leave off the final '?'
582 if expand_included_tweets:
# A link to another tweet (twitter.com/.../status/<digits>) is a quoted tweet.
583 if rv.hostname == 'twitter.com' and re.search(r'status/\d+',rv.path):
585 stringsout = [ "{{ Recursion level too high }}" ] + stringsout
587 quotedtweet = getTweet(toReplace, twitapi, inclusion=True, recurlvl=recurlvl+1) # inclusion parameter limits recursion.
# The quoted tweet's lines are wrapped in "Q{ ... }" and placed before the
# lines collected so far.
590 quotedtweet[0] = "Q{ " + quotedtweet[0]
591 quotedtweet[-1] += " }"
592 stringsout = quotedtweet + stringsout
594 tweetText = tweetText.replace(url.url, toReplace)
596 tweetText = tweetText.replace(">",">")
597 tweetText = tweetText.replace("<","<")
598 tweetText = tweetText.replace("&","&")
# Flatten the tweet onto one line.
599 tweetText = tweetText.replace("\n"," ")
600 stringout = "tweet by %s (%s): %s" %(tweeter_screen,tweeter_name,tweetText)
# Errors are reported in place of the tweet text.
601 except twitter.TwitterError:
602 terror = sys.exc_info()
603 stringout = "Twitter error: %s" % terror[1].__str__()
605 terror = sys.exc_info()
606 stringout = "Error: %s" % terror[1].__str__()
607 stringsout = [stringout] + stringsout
# NOTE(review): two returns follow; the condition between them is not visible
# in this excerpt - presumably nested (inclusion) calls return unencoded text
# and the outermost call encodes every line to UTF-8.
609 return stringsout # don't want to double-encode it, so just pass it on for now and encode later
611 return map(lambda x: x.encode('UTF-8', 'replace'), stringsout)