Poodletooth-iLand/otp/chat/WhiteList.py

from bisect import bisect_left
import re

class WhiteList:
    """Chat filter built from a word whitelist and a table of word sequences.

    Two independent passes are offered:

    * processText() checks every space-separated word against the
      whitelist installed with setWords().
    * processSequences() looks for multi-word sequences registered with
      setSequenceList() and replaces each matching run of words.

    processThroughAll() chains both passes. Rejected text is either wrapped
    in the "WLRed" marker (see getReplacement()) or, when a garbler object is
    supplied, replaced by whatever ``garbler.garble(av, wordCount)`` returns.
    """

    def __init__(self):
        # Start with empty tables so every process*/is* method is safe to
        # call before setWords() / setSequenceList() have been invoked.
        self.words = []
        self.numWords = 0
        # Mapping: lower-case first word -> list of "rest of sequence" strings
        # (getSequenceList() indexes it by word).
        self.sequenceList = {}

    def setWords(self, words):
        """Install the whitelist and cache its length.

        isPrefix() runs a binary search over ``words``, so the container has
        to be an indexable sequence sorted in ascending order. Entries are
        compared against lower-cased input (see cleanText()).
        """
        self.words = words
        self.numWords = len(self.words)

    def setSequenceList(self, sequences):
        """Install the sequence table.

        ``sequences`` is looked up by lower-cased first word; each value is
        iterated as a list of strings holding the remaining words of a
        sequence, separated by whitespace.
        """
        self.sequenceList = sequences

    def getSequenceList(self, word):
        """Return the sequences registered for ``word``, or None.

        None is returned both for an empty ``word`` and for a word that has
        no entry in the table.
        """
        if word and word in self.sequenceList:
            return self.sequenceList[word]

        return None

    def cleanText(self, text):
        """Normalise a word: strip leading/trailing '.,?!' and lower-case it."""
        return text.strip('.,?!').lower()

    def isWord(self, text):
        """Return True when the normalised ``text`` is in the whitelist."""
        return self.cleanText(text) in self.words

    def isPrefix(self, text):
        """Return True when the normalised ``text`` begins a whitelisted word.

        Relies on the whitelist being sorted: the first entry that is not
        smaller than ``text`` is the only candidate that can start with it.
        """
        text = self.cleanText(text)
        i = bisect_left(self.words, text)

        return i != self.numWords and self.words[i].startswith(text)

    def getReplacement(self, text, av=None, garbler=None):
        """Return the substitute for rejected ``text``.

        Without a garbler the text is kept but wrapped in the WLRed marker
        (presumably a text-property tag understood by the chat renderer --
        not verifiable from this file). With a garbler, the result of
        ``garbler.garble(av, n)`` is returned, ``n`` being the number of
        space-separated words in ``text``.
        """
        if garbler:
            return garbler.garble(av, len(text.split(' ')))

        return '\x01WLRed\x01%s\x02' % text

    def processText(self, text, av=None, garbler=None):
        """Filter ``text`` word by word against the whitelist.

        Every word except the last must be a whitelisted word; the last one
        only needs to be a prefix of a whitelisted word. Empty words
        (produced by consecutive spaces) are passed through untouched. When
        no whitelist is installed the text is returned unchanged.
        """
        if not self.words:
            return text

        words = text.split(' ')
        # str.split(' ') always yields at least one element, so pop() is safe.
        # The last word is judged by isPrefix() only; handling it separately
        # avoids computing (and discarding) a replacement for it in the loop.
        lastWord = words.pop()
        newWords = []

        for word in words:
            if (not word) or self.isWord(word):
                newWords.append(word)
            else:
                newWords.append(self.getReplacement(word, av, garbler))

        if (not lastWord) or self.isPrefix(lastWord):
            newWords.append(lastWord)
        else:
            newWords.append(self.getReplacement(lastWord, av, garbler))

        return ' '.join(newWords)

    def processSequences(self, text, av=None, garbler=None):
        """Replace every registered word sequence found in ``text``.

        A sequence matches when a word (lower-cased) has an entry in the
        sequence table and the words following it (lower-cased) equal one of
        that entry's sequences. The whole run, first word included, is then
        handed to getReplacement(). When no table is installed the text is
        returned unchanged.
        """
        if not self.sequenceList:
            return text

        words = text.split(' ')
        index = 0

        # The list is edited in place and a replacement may contain a
        # different number of words than the run it replaces, so the bound is
        # re-evaluated on every iteration instead of being fixed up front.
        while index < len(words):
            sequences = self.getSequenceList(words[index].lower())
            replacement = None

            for entry in sequences or ():
                sequence = entry.split()
                end = index + len(sequence) + 1

                if end > len(words):
                    continue

                following = [item.lower() for item in words[index + 1:end]]

                if sequence == following:
                    replacement = self.getReplacement(' '.join(words[index:end]), av, garbler).split()
                    words[index:end] = replacement
                    # Stop at the first hit: the words this entry was keyed
                    # on no longer exist in their original form.
                    break

            if replacement is None:
                index += 1
            else:
                # Skip the freshly inserted words so replaced text is never
                # re-scanned (prevents nested markers). An empty replacement
                # shrinks the list, so progress is still guaranteed.
                index += len(replacement)

        return ' '.join(words)

    def processThroughAll(self, text, av=None, garbler=None):
        """Run the complete filter: whitelist pass, then sequence pass.

        Text starting with '~' is returned untouched when no garbler is
        given. Otherwise runs of spaces are collapsed to a single space
        before filtering.
        """
        if text.startswith('~') and not garbler:
            return text

        collapsed = re.sub(' +', ' ', text)
        filtered = self.processText(collapsed, av, garbler)

        return self.processSequences(filtered, av, garbler)
Initial commit 2015-03-03 22:10:12 +00:00			`from bisect import bisect_left`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`import re`
Added staff chat channels. 2015-03-31 11:59:36 +00:00
Made it not crash uberdog lel 2015-04-01 11:39:59 +00:00			`class WhiteList:`
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`def __init__(self):`
			`self.sequenceList = []`

DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`def setWords(self, words):`
Revert "Added staff chat channels." This reverts commit c72e45fbc469b22937009d4d371109185a1147bf. 2015-04-01 20:30:08 +00:00			`self.words = words`
Initial commit 2015-03-03 22:10:12 +00:00			`self.numWords = len(self.words)`

Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`def setSequenceList(self, sequences):`
			`self.sequenceList = sequences`

			`def getSequenceList(self, word):`
Fix upper case sequence list 2015-06-12 11:21:20 +00:00			`return self.sequenceList[word] if word and word in self.sequenceList else None`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00
Initial commit 2015-03-03 22:10:12 +00:00			`def cleanText(self, text):`
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`return text.strip('.,?!').lower()`
Initial commit 2015-03-03 22:10:12 +00:00
			`def isWord(self, text):`
Revert "Added staff chat channels." This reverts commit c72e45fbc469b22937009d4d371109185a1147bf. 2015-04-01 20:30:08 +00:00			`return self.cleanText(text) in self.words`
Initial commit 2015-03-03 22:10:12 +00:00
			`def isPrefix(self, text):`
			`text = self.cleanText(text)`
			`i = bisect_left(self.words, text)`
Revert "Added staff chat channels." This reverts commit c72e45fbc469b22937009d4d371109185a1147bf. 2015-04-01 20:30:08 +00:00
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`return i != self.numWords and self.words[i].startswith(text)`

			`def getReplacement(self, text, av=None, garbler=None):`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`return '\x01WLRed\x01%s\x02' % text if not garbler else garbler.garble(av, len(text.split(' ')))`
Initial commit 2015-03-03 22:10:12 +00:00
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`def processText(self, text, av=None, garbler=None):`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`if not self.words:`
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`return text`
sequence asslist and chathoes 2015-04-02 12:23:24 +00:00
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`words = text.split(' ')`
			`newWords = []`
sequence asslist and chathoes 2015-04-02 12:23:24 +00:00
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`for word in words:`
			`if (not word) or self.isWord(word):`
			`newWords.append(word)`
			`else:`
			`newWords.append(self.getReplacement(word, av, garbler))`
sequence asslist and chathoes 2015-04-02 12:23:24 +00:00
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`lastWord = words[-1]`

			`if (not lastWord) or self.isPrefix(lastWord):`
			`newWords[-1] = lastWord`
			`else:`
			`newWords[-1] = self.getReplacement(lastWord, av, garbler)`
sequence asslist and chathoes 2015-04-02 12:23:24 +00:00
DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`return ' '.join(newWords)`

Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`def processSequences(self, text, av=None, garbler=None):`
			`if not self.sequenceList:`
			`return text`

			`words = text.split(' ')`

			`for wordNum in xrange(len(words)):`
			`word = words[wordNum].lower()`
			`sequences = self.getSequenceList(word)`

			`if not sequences:`
			`continue`

			`for sequenceNum in xrange(len(sequences)):`
			`sequence = sequences[sequenceNum].split()`
			`total = wordNum + len(sequence) + 1`

Fix upper case sequence list 2015-06-12 11:21:20 +00:00			`if total <= len(words) and sequence == [word.lower() for word in words[wordNum + 1:total]]:`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`words[wordNum:total] = self.getReplacement(' '.join(words[wordNum:total]), av, garbler).split()`

			`return ' '.join(words)`

DANIEL: Work on whitelist 2015-05-30 18:50:36 +00:00			`def processThroughAll(self, text, av=None, garbler=None):`
Add sequence list + prevent multiple spaces in the chat 2015-06-11 14:52:42 +00:00			`if (text.startswith('~') and not garbler):`
			`return text`

			`return self.processSequences(self.processText(re.sub(' +', ' ', text), av, garbler), av, garbler)`