### # Copyright (c) 2003-2005, Jeremiah Fincher # Copyright (c) 2008-2009, James McCoy # Copyright (c) 2010-2021, Valentin Lorentz # All rights reserved. # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions are met: # # * Redistributions of source code must retain the above copyright notice, # this list of conditions, and the following disclaimer. # * Redistributions in binary form must reproduce the above copyright notice, # this list of conditions, and the following disclaimer in the # documentation and/or other materials provided with the distribution. # * Neither the name of the author of this software nor the name of # contributors to this software may be used to endorse or promote products # derived from this software without specific prior written consent. # # THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" # AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE # IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE # ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE # LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR # CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF # SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS # INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN # CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) # ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE # POSSIBILITY OF SUCH DAMAGE. ### import re import sys import types import codecs import base64 import binascii import unicodedata import supybot.utils as utils from supybot.commands import * import supybot.utils.minisix as minisix import supybot.plugins as plugins import supybot.commands as commands import supybot.ircutils as ircutils import supybot.callbacks as callbacks from supybot.i18n import PluginInternationalization _ = PluginInternationalization('String') import multiprocessing class String(callbacks.Plugin): """Provides useful commands for manipulating characters and strings.""" def ord(self, irc, msg, args, s): """ Returns the unicode codepoint of characters in . """ irc.replies([str(ord(char)) for char in s]) ord = wrap(ord, ['text']) def chr(self, irc, msg, args, i): """ Returns the unicode character associated with codepoint """ try: irc.reply(chr(i), stripCtcp=False) except ValueError: irc.error(_('That number doesn\'t map to a unicode character.')) chr = wrap(chr, ['int']) def unicodename(self, irc, msg, args, s): """ Returns the name of characters in . This will error if any character is not a valid Unicode character.""" replies = [] for idx, char in enumerate(s): try: replies.append(unicodedata.name(char)) except ValueError: irc.error(_('No name found for character %r at position %d.') % (char, idx), Raise=True) irc.replies(replies) unicodename = wrap(unicodename, ['text']) def unicodesearch(self, irc, msg, args, name): """ Searches for a unicode character from its .""" try: irc.reply(unicodedata.lookup(name)) except KeyError: irc.error(_('No character found with this name.')) unicodesearch = wrap(unicodesearch, ['text']) def encode(self, irc, msg, args, encoding, text): """ Returns an encoded form of the given text; the valid encodings are available in the documentation of the Python codecs module: . """ # Binary codecs are prefixed with _codec in Python 3 if encoding in 'base64 bz2 hex quopri uu zlib': encoding += '_codec' if encoding.endswith('_codec'): text = text.encode() # Do the encoding try: encoder = codecs.getencoder(encoding) except LookupError: irc.errorInvalid(_('encoding'), encoding) text = encoder(text)[0] # If this is a binary codec, re-encode it with base64 if encoding.endswith('_codec') and encoding != 'base64_codec': text = codecs.getencoder('base64_codec')(text)[0].decode() # Change result into a string if minisix.PY2 and isinstance(text, unicode): text = text.encode('utf-8') elif minisix.PY3 and isinstance(text, bytes): text = text.decode() if encoding in ('base64', 'base64_codec'): text = text.replace('\n', '') # Reply irc.reply(text.rstrip('\n')) encode = wrap(encode, ['something', 'text']) def decode(self, irc, msg, args, encoding, text): """ Returns an un-encoded form of the given text; the valid encodings are available in the documentation of the Python codecs module: . """ # Binary codecs are prefixed with _codec in Python 3 if encoding in 'base64 bz2 hex quopri uu zlib': encoding += '_codec' # If this is a binary codec, pre-decode it with base64 if encoding.endswith('_codec') and encoding != 'base64_codec': text = codecs.getdecoder('base64_codec')(text.encode())[0] # Do the decoding try: decoder = codecs.getdecoder(encoding) except LookupError: irc.errorInvalid(_('encoding'), encoding) if minisix.PY3 and not isinstance(text, bytes): text = text.encode() try: text = decoder(text)[0] except binascii.Error: irc.errorInvalid(_('base64 string'), s=_('Base64 strings must be a multiple of 4 in ' 'length, padded with \'=\' if necessary.')) return # Change result into a string if minisix.PY2 and isinstance(text, unicode): text = text.encode('utf-8') elif minisix.PY3 and isinstance(text, bytes): try: text = text.decode() except UnicodeDecodeError: pass # Reply irc.reply(text) decode = wrap(decode, ['something', 'text']) def levenshtein(self, irc, msg, args, s1, s2): """ Returns the levenshtein distance (also known as the "edit distance" between and ) """ max = self.registryValue('levenshtein.max') if len(s1) > max or len(s2) > max: irc.error(_('Levenshtein distance is a complicated algorithm, try ' 'it with some smaller inputs.')) else: irc.reply(str(utils.str.distance(s1, s2))) levenshtein = thread(wrap(levenshtein, ['something', 'text'])) def soundex(self, irc, msg, args, text, length): """ [] Returns the Soundex hash to a given length. The length defaults to 4, since that's the standard length for a soundex hash. For unlimited length, use 0. Maximum length 1024. """ if length > 1024: irc.error("Maximum allowed length is 1024.") return irc.reply(utils.str.soundex(text, length)) soundex = wrap(soundex, ['somethingWithoutSpaces', additional('int', 4)]) def len(self, irc, msg, args, text): """ Returns the length of . """ irc.reply(str(len(text))) len = wrap(len, ['text']) def re(self, irc, msg, args, f, text): """ If is of the form m/regexp/flags, returns the portion of that matches the regexp. If is of the form s/regexp/replacement/flags, returns the result of applying such a regexp to . """ if f('') and len(f(' ')) > len(f(''))+1: # Matches the empty string. s = _('You probably don\'t want to match the empty string.') irc.error(s) else: t = self.registryValue('re.timeout') try: v = process(f, text, timeout=t, pn=self.name(), cn='re') if isinstance(v, list): v = format('%L', v) irc.reply(v) except commands.ProcessTimeoutError as e: irc.error("ProcessTimeoutError: %s" % (e,)) except re.error as e: irc.error(e.args[0]) re = thread(wrap(re, [first('regexpMatcherMany', 'regexpReplacer'), 'text'])) def xor(self, irc, msg, args, password, text): """ Returns XOR-encrypted with . """ chars = utils.iter.cycle(password) ret = [chr(ord(c) ^ ord(next(chars))) for c in text] irc.reply(''.join(ret)) xor = wrap(xor, ['something', 'text']) def md5(self, irc, msg, args, text): """ Returns the md5 hash of a given string. """ irc.reply(utils.crypt.md5(text.encode('utf8')).hexdigest()) md5 = wrap(md5, ['text']) def sha(self, irc, msg, args, text): """ Returns the SHA1 hash of a given string. """ irc.reply(utils.crypt.sha(text.encode('utf8')).hexdigest()) sha = wrap(sha, ['text']) Class = String # vim:set shiftwidth=4 softtabstop=4 expandtab textwidth=79: