Poodletooth-iLand/otp/chat/WhiteList.py

from bisect import bisect_left
import re

class WhiteList:
    """
    Chat filter that flags words and multi-word sequences.

    A word is accepted when, after cleanText(), it is found in the word
    list given to setWords().  Rejected words are replaced by the result
    of getReplacement(): either the word wrapped in the WLRed markup, or,
    when a garbler object is supplied, whatever garbler.garble() returns.

    The word list must be a sorted sequence of lower-case strings, because
    isPrefix() performs a binary search on it.
    """

    # Class-level fallbacks so an instance whose setWords() has not been
    # called yet behaves as "no whitelist loaded" instead of raising
    # AttributeError.  They are never mutated; setWords() rebinds them on
    # the instance.
    words = ()
    numWords = 0

    def __init__(self):
        # Maps a lower-case first word to a list of strings, each holding
        # the remaining words of a disallowed phrase (see getSequenceList).
        self.sequenceList = {}

    def setWords(self, words):
        """Install the sorted sequence of allowed (lower-case) words."""
        self.words = words
        self.numWords = len(self.words)

    def setSequenceList(self, sequences):
        """Install the mapping of first word -> list of follow-up phrases."""
        self.sequenceList = sequences

    def getSequenceList(self, word):
        """
        Return the follow-up phrases registered for word, or None when the
        word is empty or has no entry in the sequence list.
        """
        return self.sequenceList[word] if word and word in self.sequenceList else None

    def cleanText(self, text):
        """Strip leading/trailing '.', ',', '?' and '!' and lower-case text."""
        return text.strip('.,?!').lower()

    def isWord(self, text):
        """Return True if the cleaned text is in the word list."""
        return self.cleanText(text) in self.words

    def isPrefix(self, text):
        """
        Return True if the cleaned text is a prefix of some whitelisted
        word.  Relies on the word list being sorted.
        """
        text = self.cleanText(text)
        i = bisect_left(self.words, text)

        # Use the live length rather than the cached numWords so the bounds
        # check stays correct even if self.words was assigned directly.
        return i != len(self.words) and self.words[i].startswith(text)

    def getReplacement(self, text, av=None, garbler=None):
        """
        Return the replacement for a rejected piece of text.

        Without a garbler the text is wrapped in the WLRed markup.  With a
        garbler, garbler.garble(av, n) is returned, where n is the number
        of space-separated words in text.
        """
        return '\x01WLRed\x01%s\x02' % text if not garbler else garbler.garble(av, len(text.split(' ')))

    def processText(self, text, av=None, garbler=None):
        """
        Replace every space-separated word of text that is not whitelisted.

        Empty words (from leading/trailing spaces) are kept as they are.
        When no garbler is given, the last word only has to be a prefix of
        a whitelisted word, not a complete one.  If no word list is loaded
        the text is returned unchanged.
        """
        if not self.words:
            return text

        words = text.split(' ')
        newWords = []

        for word in words:
            if (not word) or self.isWord(word):
                newWords.append(word)
            else:
                newWords.append(self.getReplacement(word, av, garbler))

        if not garbler:
            # The last word is re-evaluated with the more lenient prefix
            # test, overriding whatever the loop above decided for it.
            lastWord = words[-1]

            if (not lastWord) or self.isPrefix(lastWord):
                newWords[-1] = lastWord
            else:
                newWords[-1] = self.getReplacement(lastWord, av, garbler)

        return ' '.join(newWords)

    def processSequences(self, text, av=None, garbler=None):
        """
        Replace disallowed multi-word phrases in text.

        For each word, the sequence list is consulted (case-insensitively)
        for phrases that start with it.  The first registered phrase whose
        remaining words follow in the text is replaced as a whole via
        getReplacement(), and scanning resumes after the replacement.  If
        no sequence list is loaded the text is returned unchanged.
        """
        if not self.sequenceList:
            return text

        words = text.split(' ')
        wordNum = 0

        # A while loop is used because a replacement may change the length
        # of the list (a garbler is free to return fewer or more words);
        # a precomputed index range would go stale and overrun the list.
        while wordNum < len(words):
            sequences = self.getSequenceList(words[wordNum].lower())
            advance = 1

            for sequence in sequences or ():
                tail = sequence.split()
                total = wordNum + len(tail) + 1

                if total <= len(words) and tail == [follower.lower() for follower in words[wordNum + 1:total]]:
                    replacement = self.getReplacement(' '.join(words[wordNum:total]), av, garbler).split()
                    words[wordNum:total] = replacement
                    # Skip past the replacement and stop checking further
                    # sequences, so an already replaced phrase is never
                    # matched and wrapped a second time.
                    advance = len(replacement)
                    break

            wordNum += advance

        return ' '.join(words)

    def processThroughAll(self, text, av=None, garbler=None):
        """
        Run text through the word filter and then the sequence filter.

        Runs of spaces are collapsed to a single space first.  Text that
        starts with '~' is returned untouched when no garbler is given.
        """
        if (text.startswith('~') and not garbler):
            return text

        return self.processSequences(self.processText(re.sub(' +', ' ', text), av, garbler), av, garbler)
Initial commit 2015-03-03 16:10:12 -06:00			`from bisect import bisect_left`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`import re`
Added staff chat channels. 2015-03-31 06:59:36 -05:00
Made it not crash uberdog lel 2015-04-01 06:39:59 -05:00			`class WhiteList:`
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`def __init__(self):`
			`self.sequenceList = []`

DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`def setWords(self, words):`
Revert "Added staff chat channels." This reverts commit c72e45fbc469b22937009d4d371109185a1147bf. 2015-04-01 15:30:08 -05:00			`self.words = words`
Initial commit 2015-03-03 16:10:12 -06:00			`self.numWords = len(self.words)`

Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`def setSequenceList(self, sequences):`
			`self.sequenceList = sequences`

			`def getSequenceList(self, word):`
Fix upper case sequence list 2015-06-12 06:21:20 -05:00			`return self.sequenceList[word] if word and word in self.sequenceList else None`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00
Initial commit 2015-03-03 16:10:12 -06:00			`def cleanText(self, text):`
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`return text.strip('.,?!').lower()`
Initial commit 2015-03-03 16:10:12 -06:00
			`def isWord(self, text):`
Revert "Added staff chat channels." This reverts commit c72e45fbc469b22937009d4d371109185a1147bf. 2015-04-01 15:30:08 -05:00			`return self.cleanText(text) in self.words`
Initial commit 2015-03-03 16:10:12 -06:00
			`def isPrefix(self, text):`
			`text = self.cleanText(text)`
			`i = bisect_left(self.words, text)`
Revert "Added staff chat channels." This reverts commit c72e45fbc469b22937009d4d371109185a1147bf. 2015-04-01 15:30:08 -05:00
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`return i != self.numWords and self.words[i].startswith(text)`

			`def getReplacement(self, text, av=None, garbler=None):`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`return '\x01WLRed\x01%s\x02' % text if not garbler else garbler.garble(av, len(text.split(' ')))`
Initial commit 2015-03-03 16:10:12 -06:00
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`def processText(self, text, av=None, garbler=None):`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`if not self.words:`
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`return text`
sequence asslist and chathoes 2015-04-02 07:23:24 -05:00
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`words = text.split(' ')`
			`newWords = []`
sequence asslist and chathoes 2015-04-02 07:23:24 -05:00
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`for word in words:`
			`if (not word) or self.isWord(word):`
			`newWords.append(word)`
			`else:`
			`newWords.append(self.getReplacement(word, av, garbler))`
sequence asslist and chathoes 2015-04-02 07:23:24 -05:00
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`lastWord = words[-1]`

Fix whitelist 2015-06-18 11:07:51 -05:00			`if not garbler:`
			`if (not lastWord) or self.isPrefix(lastWord):`
			`newWords[-1] = lastWord`
			`else:`
			`newWords[-1] = self.getReplacement(lastWord, av, garbler)`
sequence asslist and chathoes 2015-04-02 07:23:24 -05:00
DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`return ' '.join(newWords)`

Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`def processSequences(self, text, av=None, garbler=None):`
			`if not self.sequenceList:`
			`return text`

			`words = text.split(' ')`

			`for wordNum in xrange(len(words)):`
			`word = words[wordNum].lower()`
			`sequences = self.getSequenceList(word)`

			`if not sequences:`
			`continue`

			`for sequenceNum in xrange(len(sequences)):`
			`sequence = sequences[sequenceNum].split()`
			`total = wordNum + len(sequence) + 1`

Fix upper case sequence list 2015-06-12 06:21:20 -05:00			`if total <= len(words) and sequence == [word.lower() for word in words[wordNum + 1:total]]:`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`words[wordNum:total] = self.getReplacement(' '.join(words[wordNum:total]), av, garbler).split()`

			`return ' '.join(words)`

DANIEL: Work on whitelist 2015-05-30 13:50:36 -05:00			`def processThroughAll(self, text, av=None, garbler=None):`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 09:52:42 -05:00			`if (text.startswith('~') and not garbler):`
			`return text`

			`return self.processSequences(self.processText(re.sub(' +', ' ', text), av, garbler), av, garbler)`