h/plugins/urlhistory.py

import time
import re

from util import hook, urlnorm

# Matches a URL-like token: either an explicit scheme ("letters://") or a
# bare "www." prefix, followed by every character up to the next space.
url_re = re.compile(r'([a-zA-Z]+://|www\.)[^ ]*')

# How long a posted URL is remembered, in seconds. get_history() deletes
# rows whose timestamp is older than this.
expiration_period = 60 * 60 * 24 # 1 day
# Human-readable form of expiration_period, used in the reply text built by
# urlinput(). Keep the two values in sync when changing either.
expiration_period_text = "24 hours"

# Normalized URLs that urlinput() neither records nor reports.
ignored_urls = [urlnorm.normalize("http://google.com")]

def db_connect(bot, server):
    """Return a db connection for *server* with the urlhistory table present.

    The connection is obtained from ``bot.get_db_connection(server)``.  The
    ``urlhistory(chan, url, nick, time)`` table is created if it does not
    exist yet, and that change is committed before the connection is
    handed back to the caller.
    """
    db = bot.get_db_connection(server)
    create_stmt = "create table if not exists urlhistory(chan, url, nick, time)"
    db.execute(create_stmt)
    db.commit()
    return db

def insert_history(conn, chan, url, nick):
    """Record that *nick* posted *url* in *chan*, stamped with the current time.

    conn -- open database connection that already has the urlhistory table
    chan -- channel the URL was posted in
    url  -- URL string to store (callers pass the normalized form)
    nick -- nick of the poster

    The row is committed before returning.
    """
    # Capture the timestamp once and store exactly that value.
    now = time.time()
    conn.execute("insert into urlhistory(chan, url, nick, time) "
                 "values(?,?,?,?)", (chan, url, nick, now))
    conn.commit()

def get_history(conn, chan, url):
    """Return the nicks recorded as having posted *url* in *chan*.

    Before querying, every urlhistory row (in any channel) whose timestamp
    is older than ``expiration_period`` seconds is deleted.  The delete is
    not committed in this function.

    The result is a list with one entry per stored row, so a nick appears
    once for each time it posted the URL.
    """
    cutoff = time.time() - expiration_period
    conn.execute("delete from urlhistory where time < ?", (cutoff,))

    cursor = conn.execute(
        "select nick from urlhistory where chan=? and url=?",
        (chan, url))
    rows = cursor.fetchall()
    return [row[0] for row in rows]
    
def get_nicklist(nicks):
    """Format *nicks* as an English list, e.g. "a", "a and b", "a, b, and c".

    Duplicates are removed and the remaining nicks are sorted
    case-insensitively.  An empty input yields an empty string.
    """
    # Call .lower() on each nick instead of using unicode.lower, so both
    # byte and unicode strings are accepted.  The nick itself is the
    # secondary key so that names differing only in case get a stable order
    # instead of whatever order the set happens to yield.
    unique = sorted(set(nicks), key=lambda nick: (nick.lower(), nick))
    if len(unique) <= 2:
        return ' and '.join(unique)
    return ', and '.join((', '.join(unique[:-1]), unique[-1]))

def ordinal(count):
    """Return an English frequency phrase for *count*.

    1 gives "once", 2 gives "twice", and any other value gives "N times".
    """
    # Explicit branches instead of indexing a three-element list: the index
    # form wrapped around for negative counts and could return "once" or
    # "twice", or raise IndexError.
    if count == 1:
        return "once"
    if count == 2:
        return "twice"
    return "%d times" % count
       
@hook.command(hook=r'(.*)', prefix=False)
def urlinput(bot, input):
    # Looks for a URL in the incoming message.  If one is found and it is
    # not in ignored_urls, the post is recorded, and the channel is told who
    # posted the same link before, unless the current poster is already
    # among them.
    match = url_re.search(input.msg.encode('utf8'))
    if match is None:
        return

    # URL detected
    db = db_connect(bot, input.server)
    try:
        normalized = urlnorm.normalize(match.group(0))
        if normalized in ignored_urls:
            return

        # Fetch the earlier posters before inserting, so the current post
        # is not counted among them.
        earlier_posters = get_history(db, input.chan, normalized)
        insert_history(db, input.chan, normalized, input.nick)

        if not earlier_posters or input.nick in earlier_posters:
            return

        how_often = ordinal(len(earlier_posters))
        who = get_nicklist(earlier_posters)
        input.reply("That link has been posted " + how_often
                    + " in the past " + expiration_period_text + " by "
                    + who)
    finally:
        # Runs on every path out of the try block, including early returns.
        db.commit()
        db.close()
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`import time`
			`import re`

			`from util import hook, urlnorm`

			`url_re = re.compile(r'([a-zA-Z]+://\|www\.)[^ ]*')`

			`expiration_period = 60 * 60 * 24 # 1 day`
			`expiration_period_text = "24 hours"`

			`ignored_urls = [urlnorm.normalize("http://google.com")]`

rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`def db_connect(bot, server):`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`"check to see that our db has the the seen table and return a connection."`
rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`conn = bot.get_db_connection(server)`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`conn.execute("create table if not exists urlhistory"`
rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`"(chan, url, nick, time)")`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`conn.commit()`
			`return conn`

rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`def insert_history(conn, chan, url, nick):`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`now = time.time()`
rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`conn.execute("insert into urlhistory(chan, url, nick, time) "`
			`"values(?,?,?,?)", (chan, url, nick, time.time()))`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`conn.commit()`

rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`def get_history(conn, chan, url):`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`conn.execute("delete from urlhistory where time < ?",`
			`(time.time() - expiration_period,))`
rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`nicks = conn.execute("select nick from urlhistory where "`
			`"chan=? and url=?", (chan, url)).fetchall()`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`return [x[0] for x in nicks]`

			`def get_nicklist(nicks):`
make urlhistory nick sorting case-insensitive, simplify a few decorator calls 2010-01-19 05:14:49 +00:00			`nicks = sorted(set(nicks), key=unicode.lower)`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`if len(nicks) <= 2:`
			`return ' and '.join(nicks)`
			`else:`
			`return ', and '.join((', '.join(nicks[:-1]), nicks[-1]))`

			`def ordinal(count):`
			`return ["once", "twice", "%d times" % count][min(count, 3) - 1]`

			`@hook.command(hook=r'(.*)', prefix=False)`
			`def urlinput(bot, input):`
			`m = url_re.search(input.msg.encode('utf8'))`
			`if not m:`
			`return`

			`# URL detected`
rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`conn = db_connect(bot, input.server)`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`try:`
			`url = urlnorm.normalize(m.group(0))`
			`if url not in ignored_urls:`
rewrite tell, simplify db access in quote, seen, urlhistory. fix wolframalpha for the last time 2010-02-01 07:29:50 +00:00			`dupes = get_history(conn, input.chan, url)`
			`insert_history(conn, input.chan, url, input.nick)`
make urlhistory.py record irc servers as well 2010-01-19 03:16:40 +00:00			`if dupes and input.nick not in dupes:`
			`input.reply("That link has been posted " + ordinal(len(dupes))`
			`+ " in the past " + expiration_period_text + " by " +`
			`get_nicklist(dupes))`
			`finally:`
			`conn.commit()`
			`conn.close()`