# Source code for modules.qdb

import re
import difflib
from event import Event

try:
    import imgurpython
except (ImportError, SystemError):
    print("Warning: QDB module requires imgurpython.")
    imgurpython = object

try:
    import requests
except (ImportError, SystemError):
    print("Warning: QDB module requires requests.")
    requests = object


class QDB:
    def __init__(self, events=None, printer_handle=None, bot=None, say=None):
        """Store the bot handles, load imgur credentials and hook into every line.

        events, printer_handle, bot and say are kept on the instance as
        self.events, self.printer, self.bot and self.say. The bot must expose
        a mem_store mapping and a register_event() method.
        """
        self.events = events
        self.printer = printer_handle
        self.bot = bot
        self.say = say

        # credentials live in an optional module; fall back to placeholder
        # values so the module still loads without them
        try:
            from imgur_credentials import ImgurCredentials as credentials
        except (ImportError, SystemError):
            print(
                "Warning: imgur module requires credentials in modules/imgur_credentials.py")

            class _PlaceholderCredentials:
                imgur_client_id = "None"
                imgur_client_secret = "None"
            credentials = _PlaceholderCredentials()
        self.imgur_client_id = credentials.imgur_client_id
        self.imgur_client_secret = credentials.imgur_client_secret

        # keep an existing mem_store['qdb'] dict (and its channel buffers)
        # instead of replacing it
        store = self.bot.mem_store
        if "qdb" not in store:
            store['qdb'] = {}
        # '_recent' cannot collide with a channel name, so it is safe to use
        # as the key for the recent-submission history
        store['qdb']['_recent'] = []

        # one catch-all event is enough: it also matches ".qdb ..." lines, so
        # no dedicated command event is needed
        line_event = Event('1__all_lines__')
        line_event.define('.*')
        line_event.subscribe(self)
        self.bot.register_event(line_event, self)

        self.help = ".qdb <search string of first line> | <search string of last line>"
        self.MAX_BUFFER_SIZE = 500
        self.MAX_HISTORY_SIZE = 10

    def _imgurify(self, url):
        """Upload one or more image URLs to imgur.

        url may be a single URL string or a list of URL strings.

        Returns a list holding whatever client.upload_from_url() returned for
        each upload that succeeded, in input order. An upload that fails is
        logged through self.bot.debug_print and skipped, so the list can be
        shorter than the input, or empty.
        """
        client = imgurpython.ImgurClient(
            self.imgur_client_id, self.imgur_client_secret)

        # treat the single-URL and list cases the same way so both get the
        # same error handling
        urls = url if isinstance(url, list) else [url]

        replacement_values = []
        for u in urls:
            try:
                replacement_values.append(client.upload_from_url(u))
            except imgurpython.helpers.error.ImgurClientError as e:
                self.bot.debug_print("ImgurClientError: ")
                self.bot.debug_print(str(e))
            except UnboundLocalError as e:
                self.bot.debug_print("UnboundLocalError: ")
                self.bot.debug_print(str(e))
            except requests.exceptions.ConnectionError as e:
                self.bot.debug_print("ConnectionError: ")
                self.bot.debug_print(str(e))
        return replacement_values

    def _detect_url(self, quote):
        """
        for tsd printouts and imgflip (.meme)
        follows this format:
        http://irc.teamschoolyd.org/printouts/8xnK5DmfMz
        http://i.imgflip.com/zs1e6.jpg
        """
        tsd_regex = "(?P<url>http://irc\\.teamschoolyd\\.org/printouts/\\w+)"
        if_regex = "(?P<url>http://i\\.imgflip\\.com/\\w+.jpg)"

        # to allow us to check both variables at the end
        tsd_url, if_url = None, None

        try:
            tsd_url = re.search(tsd_regex, quote).group("url")
        except AttributeError:
            pass
        try:
            if_url = re.search(if_regex, quote).group("url")
        except AttributeError:
            pass

        if not tsd_url and not if_url:
            return quote

        if tsd_url:
            url = tsd_url
        if if_url:
            url = if_url

        repl = self._imgurify(url)

        if tsd_url:
            new_quote = re.sub(tsd_regex, repl[0]['link'], quote)
        if if_url:
            new_quote = re.sub(if_regex, repl[0]['link'], quote)
        return new_quote

[docs]    def strip_formatting(self, msg):
        """Uses regex to replace any special formatting in IRC (bold, colors) with nothing"""
        return re.sub('([\x02\x1D\x1F\x16\x0F]|\x03([0-9]{2})?)', '', msg)

[docs]    def add_buffer(self, event=None, debug=False):
        """Takes a channel name and line passed to it and stores them in the bot's mem_store dict
        for future access. The dict will have channel as key. The value to that key will be a list
        of formatted lines of activity.
        If the buffer size is not yet exceeded, lines are just added. If the buffer
        is maxed out, the oldest line is removed and newest one inserted at the beginning.
        """
        if debug:
            print("Line: " + event.line)
            print("Verb: " + event.verb)
            print("Channel: " + event.channel)
            print("")
        if not event:
            return
        # there are certain things we want to record in history, like nick changes and quits
        # these often add to the humor of a quote. however, these are not specific to a channel
        # in IRC and our bot does not maintain a userlist per channel. Therefore, when nick
        # changes and quits occur, we will add them to every buffer. This is not technically
        # correct behavior and could very well lead to quits/nick changes that are not visible
        # showing up in a quote, but it's the best we can do at the moment
        if not event.channel:
            # discard events with unwanted verbs
            if event.verb not in ["QUIT", "NICK"]:
                return
            try:
                for chan in list(self.bot.mem_store['qdb'].keys()):
                    if chan != '_recent':
                        if len(self.bot.mem_store['qdb']
                               [chan]) >= self.MAX_BUFFER_SIZE:
                            self.bot.mem_store['qdb'][chan].pop()
                        line = self.format_line(event)
                        if line:
                            self.bot.mem_store['qdb'][chan].insert(0, line)
            except (KeyError, IndexError):
                print("QDB add_buffer() error when no event channel")
        # now we continue with normal, per channel line addition
        # create a dictionary associating the channel with an empty list if it
        # doesn't exist yet
        else:
            if event.channel not in self.bot.mem_store['qdb']:
                self.bot.mem_store['qdb'][event.channel] = []
            try:
                # check for the length of the buffer. if it's too long, pop the
                # last item
                if len(self.bot.mem_store['qdb']
                       [event.channel]) >= self.MAX_BUFFER_SIZE:
                    self.bot.mem_store['qdb'][event.channel].pop()
                # get a line by passing event to format_line
                # insert the line into the first position in the list
                line = self.format_line(event)
                if line:
                    self.bot.mem_store['qdb'][event.channel].insert(0, line)
            except IndexError:
                print("QDB add_buffer() error. Couldn't access the list index.")

[docs]    def format_line(self, event):
        """Takes an event and formats a string appropriate for quotation from it"""

        # first strip out printout urls and replace them with imgur mirrors
        # commenting out for now to avoid uploading to imgur so often
        #event.msg = self._detect_url(event.msg)

        # format all strings based on the verb
        if event.verb == "":
            return ''
        elif event.verb == "PRIVMSG":
            # special formatting for ACTION strings
            if event.msg.startswith('\001ACTION'):
                # strip out the word ACTION from the msg
                return ' * %s %s\n' % (event.user, event.msg[7:])
            else:
                return '<%s> %s\n' % (
                    event.user, self.strip_formatting(event.msg))
        elif event.verb == "JOIN":
            return ' --> %s has joined channel %s\n' % (
                event.user, event.channel)
        elif event.verb == "PART":
            return ' <-- %s has left channel %s\n' % (
                event.user, event.channel)
        elif event.verb == "NICK":
            return ' -- %s has changed their nick to %s\n' % (
                event.user, event.msg)
        elif event.verb == "TOPIC":
            return ' -- %s has changed the topic for %s to "%s"\n' % (
                event.user, event.channel, event.msg)
        elif event.verb == "QUIT":
            return ' <-- %s has quit (%s)\n' % (event.user, event.msg)
        elif event.verb == "KICK":
            # this little bit of code finds the kick target by getting the last
            # thing before the event message begins
            target = event.line.split(":", 2)[1].split()[-1]
            return ' <--- %s has kicked %s from %s (%s)\n' % (
                event.user, target, event.channel, event.msg)
        elif event.verb == "NOTICE":
            return ' --NOTICE from %s: %s\n' % (event.user, event.msg)
        else:
            # no matching verbs found. just ignore the line
            return ''

[docs]    def get_qdb_submission(
            self, channel=None, start_msg='', end_msg='', strict=False):
        """Given two strings, start_msg and end_msg, this function will assemble a submission for the QDB.
        start_msg is a substring to search for and identify a starting line. end_msg similarly is used
        to search for the last desired line in the submission. This function returns a string ready
        for submission to the QDB if it finds the desired selection. If not, it returns None.
        """
        if not channel:
            return None
        # must have at least one msg to search for and channel to look it up in
        if len(start_msg) == 0 or not channel:
            return None
        # first, check to see if we are doing a single string submission.
        if end_msg == '':
            for line in self.bot.mem_store['qdb'][channel]:
                if start_msg.lower() in line.lower():
                    # removing temporary printout urls and replacing with imgur
                    return self._detect_url(line)
            # making sure we get out of the function if no matching strings were found
            # don't want to search for a nonexistent second string later
            return None
        # search for a matching start and end string and get the buffer index
        # for the start and end message
        start_index = -1
        end_index = -1
        """Finds matching string for beginning line. Buffer is traversed in reverse-chronological order
        .qdb -> strict = False -> earliest occurence
        .qdbs -> strict = True -> latest occurence
        """
        for index, line in enumerate(self.bot.mem_store['qdb'][channel]):
            # print "evaluating line for beginning: {}".format(line)
            if start_msg.encode(
                    'utf-8', 'ignore').lower() in line.encode('utf-8', 'ignore').lower():
                # print "found match, start_index={}".format(index)
                start_index = index
                if strict:
                    break
        # finds newest matching string for ending line
        for index, line in enumerate(self.bot.mem_store['qdb'][channel]):
            # print "evaluating line for end: {}".format(line)
            if end_msg.lower() in line.lower():
                # print "found match, end_index={}".format(index)
                end_index = index
                break
        # check to see if index values are positive. if not, string was not
        # found and we're done
        if start_index == -1 or end_index == -1 or start_index < end_index:
            return None
        # now we generate the string to be returned for submission
        submission = ''
        try:
            for i in reversed(list(range(end_index, start_index + 1))):
                # print 'Index number is ' + str(i) + ' and current submission
                # is ' + submission
                # detect temporary printout urls and replace with imgur
                submission += self._detect_url(
                    self.bot.mem_store['qdb'][channel][i])
        except IndexError:
            print("QDB get_qdb_submission() error when accessing list index")

        return submission

[docs]    def submit(self, qdb_submission, debug=False):
        """Given a string, qdb_submission, this function will upload the string to hlmtre's qdb
        server. Returns a string with status of submission. If it worked, includes a link to new quote.
        """
        if debug:
            print("Submission is:")
            print(qdb_submission)
            print("Current buffer is:")
            print(self.bot.mem_store['qdb'])
            print("")
            return ''
        # accessing hlmtre's qdb api
        url = 'https://qdb.zero9f9.com/api.php'
        payload = {'q': 'new', 'quote': qdb_submission.rstrip('\n')}
        try:
            qdb = requests.post(url, payload)
        except requests.exceptions.ConnectionError as e:
            self.bot.debug_print("ConnectionError: ")
            self.bot.debug_print(str(e))
        # check for any HTTP errors and return False if there were any
        try:
            qdb.raise_for_status()
        except requests.exceptions.HTTPError as e:
            self.bot.debug_print('HTTPError: ')
            self.bot.debug_print(str(e))
            self.bot.debug_print("Perhaps informative:")
            self.bot.debug_print(url)
            self.bot.debug_print(str(payload))
            return "HTTPError encountered when submitting to QDB"
        try:
            q_url = qdb.json()
            self.add_recently_submitted(q_url['id'], qdb_submission)
            if q_url['status'] == "success":
                return "QDB submission successful! https://qdb.zero9f9.com/quote.php?id=" + \
                    str(q_url['id'])
            else:
                self.bot.debug_print("QDB error:")
                print(q_url)
                return "QDB submission unsuccessful :(. Check console output."
        except (KeyError, UnicodeDecodeError):
            return "Error getting status of quote submission."
        return "That was probably successful since no errors came up, but no status available."

[docs]    def delete(self, user, post_id='', passcode=''):
        """A special function that allows certain users to delete posts"""
        # accessing hlmtre's qdb api
        url = 'http://qdb.zero9f9.com/api.php'
        payload = {
            'q': 'delete',
            'user': user,
            'id': post_id,
            'code': passcode}
        deletion = requests.get(url, params=payload)
        # check for any HTTP errors and return False if there were any
        try:
            deletion.raise_for_status()
        except requests.exceptions.HTTPError as e:
            self.bot.debug_print('HTTPError: ')
            self.bot.debug_print(str(e))
            return "HTTPError encountered when accessing QDB"
        try:
            del_status = deletion.json()
            if del_status['success'] == "true":
                # they're a list of dicts
                for quote in self.bot.mem_store['qdb']['_recent']:
                    if int(post_id) in quote:
                        self.bot.mem_store['qdb']['_recent'].remove(quote)
                return "QDB deletion succeeded."
            return "QDB deletion failed."
        except (KeyError, UnicodeDecodeError):
            return "Error getting status of quote deletion."

[docs]    def recently_submitted(self, submission):
        """Checks to see if the given submission is string is at least 75% similar to the strings
        in the list of recently submitted quotes.
        Returns the id of the quote if it was recently submitted. If not, returns -1.
        """
        # set up a difflib SequenceMatcher with the first string to test
        comparer = difflib.SequenceMatcher()
        comparer.set_seq1(submission)
        # if we find that it has 75% similarity or greater to a recent
        # submission, return True
        try:
            for recent_quote in self.bot.mem_store['qdb']['_recent']:
                comparer.set_seq2(list(recent_quote.values())[0])
                if comparer.ratio() >= .75:
                    return list(recent_quote.keys())[0]
        except TypeError:
            return -1
        except KeyError:
            return -1
        except IndexError:
            return -1
        return -1

[docs]    def add_recently_submitted(self, q_id, submission):
        """Takes a string, submission, and adds it to the list of recent submissions.
        Also we do length checking, only keep record of the previous MAX_HISTORY_SIZE quotes.
        """
        # first, see if we have reached the maximum history size. if so, remove
        # last item
        if len(self.bot.mem_store['qdb']['_recent']) >= self.MAX_HISTORY_SIZE:
            self.bot.mem_store['qdb']['_recent'].pop()
        # inserting a dict with the qdb id of the submission and the submission
        # content
        self.bot.mem_store['qdb']['_recent'].insert(0, {q_id: submission})

[docs]    def handle(self, event):
        # first check to see if there is a special deletion going on
        if event.msg.startswith(".qdbdelete") and event.is_pm:
            deletion = event.msg.split(' ', 2)
            try:
                # requires the format ".qdbdelete <post_id> <password>"
                self.say(
                    event.user,
                    self.delete(
                        event.user,
                        deletion[1],
                        deletion[2]))
            except IndexError:
                self.say(
                    event.user,
                    "Not enough parameters provided for deletion.")
            return
        """
        See if we're going to generate a qdb submission, or just add the line to the buffer.
        .qdb is the standard, generous implementation selected after hours of testing and ideal for a significant number of situations where lines are repeated. Use specific search strings. the start_index of the submission will be the EARLIEST occurrence of the substring in the buffer.
        .qdbs is the strict implementation. The start_index will be the LATEST occurrence of the substring.
        """

        if event.msg.startswith(".qdb ") or event.msg.startswith(".qdbs "):
            # split the msg with '.qdb[s] ' stripped off beginning and divide into 1 or 2 search strings
            # e.g. ".qdb string1|string2" -> [".qdb", "string1|string2"]
            cmd_parts = event.msg.split(None, 1)
            if len(cmd_parts) < 2:
                # do something here to handle '.qdb[s]'
                return
            # determine if using strict mode
            strict_mode = cmd_parts[0] == ".qdbs"
            # split the search parameter(s)
            # e.g. "string1|string2" -> ["string1", "string2"]
            string_token = cmd_parts[1].split('|', 1)
            start_msg = string_token[0].rstrip()
            # see if we only have a one line submission
            if len(string_token) == 1:
                # s is the string to submit
                s = self.get_qdb_submission(event.channel, start_msg)
                recent = self.recently_submitted(s)
                if recent > 0:
                    q_url = "http://qdb.zero9f9.com/quote.php?id=" + \
                        str(recent)
                    self.printer(
                        "PRIVMSG " +
                        event.channel +
                        " :QDB Error: A quote of >75% similarity has already been posted here: " +
                        q_url +
                        "\n")
                    return
                if not s:
                    self.printer(
                        "PRIVMSG " +
                        event.channel +
                        ' :QDB Error: Could not find requested string.\n')
                    return
                # Print the link to the newly submitted quote
                self.printer(
                    "PRIVMSG " +
                    event.channel +
                    ' :' +
                    self.submit(s) +
                    '\n')
                return
            # We should only get here if there are two items in string_token
            end_msg = string_token[1].lstrip()
            s = self.get_qdb_submission(
                event.channel, start_msg, end_msg, strict_mode)
            recent = self.recently_submitted(s)
            if recent > 0:
                q_url = "http://qdb.zero9f9.com/quote.php?id=" + str(recent)
                self.printer(
                    "PRIVMSG " +
                    event.channel +
                    " :QDB Error: A quote of >75% similarity has already been posted here: " +
                    q_url +
                    "\n")
                return
            # if there's nothing found for the submission, then we alert the
            # channel and gtfo
            if not s:
                self.printer(
                    "PRIVMSG " +
                    event.channel +
                    ' :QDB Error: Could not find requested quotes or parameters were not specific enough.\n')
                return
            # print the link to the new submission
            self.printer(
                "PRIVMSG " +
                event.channel +
                ' :' +
                self.submit(s) +
                '\n')
            return
        self.add_buffer(event)