SublimeStringEncode/string_encode.py at master · manafire/SublimeStringEncode

180 lines (143 loc) · 9.44 KB
# coding: utf8
import sublime_plugin
import urllib
import base64
class StringEncode(sublime_plugin.TextCommand):
    def run(self, edit):
        e = self.view.begin_edit('encode')
        regions = [region for region in self.view.sel()]
        # sort by region.end() DESC
        def compare(region_a, region_b):
            return cmp(region_b.end(), region_a.end())
        regions.sort(compare)
        for region in regions:
            if region.empty():
                continue
            text = self.view.substr(region)
            replacement = self.encode(text)
            self.view.replace(edit, region, replacement)
        self.view.end_edit(e)
html_escape_table = {
    u"\"": "&quot;", u"'": "&#039;", u"<": "&lt;", u">": "&gt;", u"¡": "&iexcl;", u"¢": "&cent;", u"£": "&pound;", u"¤": "&curren;", u"¥": "&yen;", u"¦": "&brvbar;", u"§": "&sect;", u"¨": "&uml;", u"©": "&copy;", u"ª": "&ordf;", u"«": "&laquo;", u"¬": "&not;", u"®": "&reg;", u"¯": "&macr;", u"°": "&deg;", u"±": "&plusmn;", u"²": "&sup2;", u"³": "&sup3;", u"´": "&acute;", u"µ": "&micro;", u"¶": "&para;", u"·": "&middot;", u"¸": "&cedil;", u"¹": "&sup1;", u"º": "&ordm;", u"»": "&raquo;", u"¼": "&frac14;", u"½": "&frac12;", u"¾": "&frac34;", u"¿": "&iquest;", u"À": "&Agrave;", u"Á": "&Aacute;", u"Â": "&Acirc;", u"Ã": "&Atilde;", u"Ä": "&Auml;", u"Å": "&Aring;", u"Æ": "&AElig;", u"Ç": "&Ccedil;", u"È": "&Egrave;", u"É": "&Eacute;", u"Ê": "&Ecirc;", u"Ë": "&Euml;", u"Ì": "&Igrave;", u"Í": "&Iacute;", u"Î": "&Icirc;", u"Ï": "&Iuml;", u"Ð": "&ETH;", u"Ñ": "&Ntilde;", u"Ò": "&Ograve;", u"Ó": "&Oacute;", u"Ô": "&Ocirc;", u"Õ": "&Otilde;", u"Ö": "&Ouml;", u"×": "&times;", u"Ø": "&Oslash;", u"Ù": "&Ugrave;", u"Ú": "&Uacute;", u"Û": "&Ucirc;", u"Ü": "&Uuml;", u"Ý": "&Yacute;", u"Þ": "&THORN;", u"ß": "&szlig;", u"à": "&agrave;", u"á": "&aacute;", u"â": "&acirc;", u"ã": "&atilde;", u"ä": "&auml;", u"å": "&aring;", u"æ": "&aelig;", u"ç": "&ccedil;", u"è": "&egrave;", u"é": "&eacute;", u"ê": "&ecirc;", u"ë": "&euml;", u"ì": "&igrave;", u"í": "&iacute;", u"î": "&icirc;", u"ï": "&iuml;", u"ð": "&eth;", u"ñ": "&ntilde;", u"ò": "&ograve;", u"ó": "&oacute;", u"ô": "&ocirc;", u"õ": "&otilde;", u"ö": "&ouml;", u"÷": "&divide;", u"ø": "&oslash;", u"ù": "&ugrave;", u"ú": "&uacute;", u"û": "&ucirc;", u"ü": "&uuml;", u"ý": "&yacute;", u"þ": "&thorn;", u"ÿ": "&yuml;", u"Œ": "&OElig;", u"œ": "&oelig;", u"Š": "&Scaron;", u"š": "&scaron;", u"Ÿ": "&Yuml;", u"ƒ": "&fnof;", u"ˆ": "&circ;", u"˜": "&tilde;", u"Α": "&Alpha;", u"Β": "&Beta;", u"Γ": "&Gamma;", u"Δ": "&Delta;", u"Ε": "&Epsilon;", u"Ζ": "&Zeta;", u"Η": "&Eta;", u"Θ": "&Theta;", u"Ι": "&Iota;", u"Κ": "&Kappa;", u"Λ": "&Lambda;", u"Μ": "&Mu;", u"Ν": "&Nu;", u"Ξ": "&Xi;", u"Ο": "&Omicron;", u"Π": "&Pi;", u"Ρ": "&Rho;", u"Σ": "&Sigma;", u"Τ": "&Tau;", u"Υ": "&Upsilon;", u"Φ": "&Phi;", u"Χ": "&Chi;", u"Ψ": "&Psi;", u"Ω": "&Omega;", u"α": "&alpha;", u"β": "&beta;", u"γ": "&gamma;", u"δ": "&delta;", u"ε": "&epsilon;", u"ζ": "&zeta;", u"η": "&eta;", u"θ": "&theta;", u"ι": "&iota;", u"κ": "&kappa;", u"λ": "&lambda;", u"μ": "&mu;", u"ν": "&nu;", u"ξ": "&xi;", u"ο": "&omicron;", u"π": "&pi;", u"ρ": "&rho;", u"ς": "&sigmaf;", u"σ": "&sigma;", u"τ": "&tau;", u"υ": "&upsilon;", u"φ": "&phi;", u"χ": "&chi;", u"ψ": "&psi;", u"ω": "&omega;", u"ϑ": "&thetasym;", u"ϒ": "&upsih;", u"ϖ": "&piv;", u"–": "&ndash;", u"—": "&mdash;", u"‘": "&lsquo;", u"’": "&rsquo;", u"‚": "&sbquo;", u"“": "&ldquo;", u"”": "&rdquo;", u"„": "&bdquo;", u"†": "&dagger;", u"‡": "&Dagger;", u"•": "&bull;", u"…": "&hellip;", u"‰": "&permil;", u"′": "&prime;", u"″": "&Prime;", u"‹": "&lsaquo;", u"›": "&rsaquo;", u"‾": "&oline;", u"⁄": "&frasl;", u"€": "&euro;", u"ℑ": "&image;", u"℘": "&weierp;", u"ℜ": "&real;", u"™": "&trade;", u"ℵ": "&alefsym;", u"←": "&larr;", u"↑": "&uarr;", u"→": "&rarr;", u"↓": "&darr;", u"↔": "&harr;", u"↵": "&crarr;", u"⇐": "&lArr;", u"⇑": "&uArr;", u"⇒": "&rArr;", u"⇓": "&dArr;", u"⇔": "&hArr;", u"∀": "&forall;", u"∂": "&part;", u"∃": "&exist;", u"∅": "&empty;", u"∇": "&nabla;", u"∈": "&isin;", u"∉": "&notin;", u"∋": "&ni;", u"∏": "&prod;", u"∑": "&sum;", u"−": "&minus;", u"∗": "&lowast;", u"√": "&radic;", u"∝": "&prop;", u"∞": "&infin;", u"∠": "&ang;", u"∧": "&and;", u"∨": "&or;", u"∩": "&cap;", u"∪": "&cup;", u"∫": "&int;", u"∴": "&there4;", u"∼": "&sim;", u"≅": "&cong;", u"≈": "&asymp;", u"≠": "&ne;", u"≡": "&equiv;", u"≤": "&le;", u"≥": "&ge;", u"⊂": "&sub;", u"⊃": "&sup;", u"⊄": "&nsub;", u"⊆": "&sube;", u"⊇": "&supe;", u"⊕": "&oplus;", u"⊗": "&otimes;", u"⊥": "&perp;", u"⋅": "&sdot;", u"⌈": "&lceil;", u"⌉": "&rceil;", u"⌊": "&lfloor;", u"⌋": "&rfloor;", u"〈": "&lang;", u"〉": "&rang;", u"◊": "&loz;", u"♠": "&spades;", u"♣": "&clubs;", u"♥": "&hearts;", u"♦": "&diams;",
xml_escape_table = {
    u"\"": "&quot;", u"'": "&#039;", u"<": "&lt;", u">": "&gt;"
french_escape_table = {
  u"À": "&Agrave;",  # Capital A-grave
  u"à": "&agrave;",  # Lowercase a-grave
  u"Â": "&Acirc;", # Capital A-circumflex
  u"â": "&acirc;", # Lowercase a-circumflex
  u"Æ": "&AElig;", # Capital AE Ligature
  u"æ": "&aelig;", # Lowercase AE Ligature
  u"Ç": "&Ccedil;",  # Capital C-cedilla
  u"ç": "&ccedil;",  # Lowercase c-cedilla
  u"È": "&Egrave;",  # Capital E-grave
  u"è": "&egrave;",  # Lowercase e-grave
  u"É": "&Eacute;",  # Capital E-acute
  u"é": "&eacute;",  # Lowercase e-acute
  u"Ê": "&Ecirc;", # Capital E-circumflex
  u"ê": "&ecirc;", # Lowercase e-circumflex
  u"Ë": "&Euml;",  # Capital E-umlaut
  u"ë": "&euml;",  # Lowercase e-umlaut
  u"Î": "&Icirc;", # Capital I-circumflex
  u"î": "&icirc;", # Lowercase i-circumflex
  u"Ï": "&Iuml;",  # Capital I-umlaut
  u"ï": "&iuml;",  # Lowercase i-umlaut
  u"Ô": "&Ocirc;", # Capital O-circumflex
  u"ô": "&ocirc;", # Lowercase o-circumflex
  u"Œ": "&OElig;", # Capital OE ligature
  u"œ": "&oelig;", # Lowercase oe ligature
  u"Ù": "&Ugrave;",  # Capital U-grave
  u"ù": "&ugrave;",  # Lowercase u-grave
  u"Û": "&Ucirc;", # Capital U-circumflex
  u"û": "&ucirc;", # Lowercase U-circumflex
  u"Ü": "&Uuml;",  # Capital U-umlaut
  u"ü": "&uuml;",  # Lowercase U-umlaut
  u"«": "&laquo;", # Left angle quotes
  u"»": "&raquo;", # Right angle quotes
  u"€": "&euro;"  # Euro
class HtmlEntitizeCommand(StringEncode):
    def encode(self, text):
        text = text.replace('&', '&amp;')
        for k in html_escape_table:
            v = html_escape_table[k]
            text = text.replace(k, v)
        ret = ''
        for i, c in enumerate(text):
            if ord(c) > 127:
                ret += hex(ord(c)).replace('0x', '&#x') + ';'
            else:
                ret += c
        return ret
class HtmlDeentitizeCommand(StringEncode):
    def encode(self, text):
        for k in html_escape_table:
            v = html_escape_table[k]
            text = text.replace(v, k)
        while re.search('&#[xX][a-fA-F0-9]+;', text):
            match = re.search('&#[xX]([a-fA-F0-9]+);', text)
            text = text.replace(match.group(0), unichr(int('0x' + match.group(1), 16)))
        text = text.replace('&amp;', '&')
        return text
class FrenchEntitizeCommand(StringEncode):
  def encode(self, text):
      for k in french_escape_table:
          v = french_escape_table[k]
          text = text.replace(k, v)
      while re.search('&#[xX][a-fA-F0-9]+;', text):
          match = re.search('&#[xX]([a-fA-F0-9]+);', text)
          text = text.replace(match.group(0), unichr(int('0x' + match.group(1), 16)))
      text = text.replace('&amp;', '&')
      return text
class FrenchDeentitizeCommand(StringEncode):
  def encode(self, text):
      for k in french_escape_table:
          v = french_escape_table[k]
          text = text.replace(v, k)
      while re.search('&#[xX][a-fA-F0-9]+;', text):
          match = re.search('&#[xX]([a-fA-F0-9]+);', text)
          text = text.replace(match.group(0), unichr(int('0x' + match.group(1), 16)))
      text = text.replace('&amp;', '&')
      return text
class XmlEntitizeCommand(StringEncode):
    def encode(self, text):
        text = text.replace('&', '&amp;')
        for k in xml_escape_table:
            v = xml_escape_table[k]
            text = text.replace(k, v)
        return text
class XmlDeentitizeCommand(StringEncode):
    def encode(self, text):
        for k in xml_escape_table:
            v = xml_escape_table[k]
            text = text.replace(v, k)
        text = text.replace('&amp;', '&')
        return text
class UrlEncodeCommand(StringEncode):
    def encode(self, text):
        return urllib.quote(text)
class UrlDecodeCommand(StringEncode):
    def encode(self, text):
        return urllib.unquote(text)
class Base64EncodeCommand(StringEncode):
    def encode(self, text):
        return base64.b64encode(text)
class Base64DecodeCommand(StringEncode):
    def encode(self, text):
        return base64.b64decode(text)
class Escaper(StringEncode):
    def encode(self, text):
        return re.sub(r'(?<!\\)(%s)' % self.meta, r'\\\1', text)
class EscapeRegexCommand(Escaper):
    meta = r'[\\*.+^$()\[\]\{\}]'
class EscapeLikeCommand(Escaper):
    meta = r'[%_]'
class HexDecCommand(StringEncode):
    def encode(self, text):
        return str(int(text, 16))
class DecHexCommand(StringEncode):
    def encode(self, text):
        return hex(int(text))
Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

string_encode.py

Latest commit

History

string_encode.py

File metadata and controls