#!/usr/bin/env python3
# -*- coding: utf-8 -*-

from arjun.core.colors import green, end, info, bad, good, run, res

import argparse
import json

from urllib.parse import urlparse

import arjun.core.config as mem
from arjun.core.exporter import exporter
from arjun.core.anomaly import define, compare
from arjun.core.utils import fetch_params, stable_request, random_str, slicer, confirm, populate, reader, nullify, prepare_requests, compatible_path
from arjun.plugins.heuristic import heuristic

arjun_dir = compatible_path(mem.__file__.replace(compatible_path('/core/config.py'), ''))

parser = argparse.ArgumentParser()  # defines the parser
# Arguments that can be supplied
parser.add_argument('-u', help='Target URL', dest='url')
parser.add_argument('-o', '-oJ', help='Path for JSON output file.', dest='json_file')
parser.add_argument('-oT', help='Path for text output file.', dest='text_file')
parser.add_argument('-oB', help='Output to Burp Suite Proxy. Default is 127.0.0.1:8080.', dest='burp_proxy', nargs='?', const='127.0.0.1:8080')
parser.add_argument('-d', help='Delay between requests in seconds. (default: 0)', dest='delay', type=float, default=0)
parser.add_argument('-t', help='Number of concurrent threads. (default: 5)', dest='threads', type=int, default=5)
parser.add_argument('-w', help='Wordlist file path. (default: {arjundir}/db/large.txt)', dest='wordlist', default=arjun_dir+'/db/large.txt')
parser.add_argument('-m', help='Request method to use: GET/POST/XML/JSON/HEADERS. (default: GET)', dest='method', default='GET')
parser.add_argument('-i', help='Import target URLs from file.', dest='import_file', nargs='?', const=True)
parser.add_argument('-T', help='HTTP request timeout in seconds. (default: 15)', dest='timeout', type=float, default=15)
parser.add_argument('-c', help='Chunk size: the number of parameters to be sent at once. (default: 250)', type=int, dest='chunks', default=250)
parser.add_argument('-q', help='Quiet mode. No output.', dest='quiet', action='store_true')
parser.add_argument('--rate-limit', help='Max number of requests to be sent out per second. (default: 9999)', dest='rate_limit', type=int, default=9999)
parser.add_argument('--headers', help='Add headers. Separate multiple headers with a new line.', dest='headers', nargs='?', const=True)
parser.add_argument('--passive', help='Collect parameter names from passive sources like wayback, commoncrawl and otx.', dest='passive', nargs='?', const='-')
parser.add_argument('--stable', help='Prefer stability over speed.', dest='stable', action='store_true')
parser.add_argument('--include', help='Include this data in every request.', dest='include', default={})
parser.add_argument('--disable-redirects', help='Disable redirects.', dest='disable_redirects', action='store_true')
args = parser.parse_args()  # arguments to be parsed

if args.quiet:
    print = nullify  # suppress all output in quiet mode

print('''%s    _
   /_| _ '
  (  |/ /(//) v%s
      _/      %s
''' % (green, __import__('arjun').__version__, end))

try:
    from concurrent.futures import ThreadPoolExecutor, as_completed
except ImportError:
    print('%s Please use Python 3.2 or later to run Arjun.' % bad)
    quit()
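# A few illustrative invocations (hypothetical targets; all flags come from the
# parser defined above, and `arjun` here assumes the package's console script
# is installed):
#
#   arjun -u https://api.example.com/endpoint
#   arjun -u https://api.example.com/endpoint -m JSON -oJ result.json
#   arjun -i targets.txt -t 10 --rate-limit 50 --stable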
mem.var = vars(args)
mem.var['method'] = mem.var['method'].upper()

if mem.var['method'] != 'GET':
    mem.var['chunks'] = 500
if mem.var['stable'] or mem.var['delay']:
    mem.var['threads'] = 1
if mem.var['wordlist'] in ('large', 'medium', 'small'):
    mem.var['wordlist'] = f'{arjun_dir}/db/{mem.var["wordlist"]}.txt'

try:
    wordlist_file = arjun_dir + '/db/small.txt' if args.wordlist == 'small' else args.wordlist
    wordlist_file = compatible_path(wordlist_file)
    wordlist = set(reader(wordlist_file, mode='lines'))
    if mem.var['passive']:
        host = mem.var['passive']
        if host == '-':
            host = urlparse(args.url).netloc
        print('%s Collecting parameter names from passive sources for %s, it may take a while' % (run, host))
        passive_params = fetch_params(host)
        wordlist.update(passive_params)
        print('%s Collected %s parameters, added to the wordlist' % (info, len(passive_params)))
    wordlist = list(wordlist)
except FileNotFoundError:
    exit("%s The specified file for parameters doesn't exist" % bad)

if len(wordlist) < mem.var['chunks']:
    mem.var['chunks'] = int(len(wordlist)/2)

if not args.url and not args.import_file:
    exit('%s No target(s) specified' % bad)

from arjun.core.requester import requester
from arjun.core.bruter import bruter


def narrower(request, factors, param_groups):
    """
    takes a list of parameter groups and narrows it down to the parameters that cause anomalies
    returns list
    """
    anomalous_params = []
    threadpool = ThreadPoolExecutor(max_workers=mem.var['threads'])
    futures = (threadpool.submit(bruter, request, factors, params) for params in param_groups)
    for i, result in enumerate(as_completed(futures)):
        if result.result():
            anomalous_params.extend(slicer(result.result()))
        if mem.var['kill']:
            return anomalous_params
        print('%s Processing chunks: %i/%-6i' % (info, i + 1, len(param_groups)), end='\r')
    return anomalous_params


def initialize(request, wordlist, single_url=False):
    """
    handles the parameter finding process for a single request object
    returns 'skipped' on error, a list of params on success
    """
    url = request['url']
    if not url.startswith('http'):
        print('%s %s is not a valid URL' % (bad, url))
        return 'skipped'
    print('%s Probing the target for stability' % run)
    request['url'] = stable_request(url, request['headers'])
    if not request['url']:
        return 'skipped'
    else:
        fuzz = 'z' + random_str(6)
        response_1 = requester(request, {fuzz[:-1]: fuzz[::-1][:-1]})
        if single_url:
            print('%s Analysing HTTP response for anomalies' % run)
        response_2 = requester(request, {fuzz[:-1]: fuzz[::-1][:-1]})
        if isinstance(response_1, str) or isinstance(response_2, str):
            return 'skipped'
        # params from response must be extracted before factors but displayed later
        found, words_exist = heuristic(response_1, wordlist)
        factors = define(response_1, response_2, fuzz, fuzz[::-1], wordlist)
        zzuf = 'z' + random_str(6)
        response_3 = requester(request, {zzuf[:-1]: zzuf[::-1][:-1]})
        while True:
            reason = compare(response_3, factors, {zzuf[:-1]: zzuf[::-1][:-1]})[2]
            if not reason:
                break
            factors[reason] = False  # disable factors that aren't stable across identical requests
        if single_url:
            print('%s Analysing HTTP response for potential parameter names' % run)
        if found:
            num = len(found)
            if words_exist:
                print('%s Heuristic scanner found %i parameters' % (good, num))
            else:
                s = 's' if num > 1 else ''
                print('%s Heuristic scanner found %i parameter%s: %s' % (good, num, s, ', '.join(found)))
        if single_url:
            print('%s Logicforcing the URL endpoint' % run)
        populated = populate(wordlist)
        with open(f'{arjun_dir}/db/special.json', 'r') as f:
            populated.update(json.load(f))
        param_groups = slicer(populated, int(len(wordlist)/mem.var['chunks']))
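        # The loop below narrows the candidates by group testing: bruter() sends
        # a whole chunk of parameters in one request, narrower() keeps only the
        # chunks whose responses deviate from the recorded factors and bisects
        # them via slicer(), and confirm() moves fully isolated single-parameter
        # groups into last_params for individual verification.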
        prev_chunk_count = len(param_groups)
        last_params = []
        while True:
            param_groups = narrower(request, factors, param_groups)
            if len(param_groups) > prev_chunk_count:
                response_3 = requester(request, {zzuf[:-1]: zzuf[::-1][:-1]})
                if compare(response_3, factors, {zzuf[:-1]: zzuf[::-1][:-1]})[0] != '':
                    print('%s Webpage is returning different content on each request. Skipping.' % bad)
                    return []
            if mem.var['kill']:
                return 'skipped'
            param_groups = confirm(param_groups, last_params)
            prev_chunk_count = len(param_groups)
            if not param_groups:
                break
        confirmed_params = []
        for param in last_params:
            reason = bruter(request, factors, param, mode='verify')
            if reason:
                name = list(param.keys())[0]
                confirmed_params.append(name)
                if single_url:
                    print('%s parameter detected: %s, based on: %s' % (res, name, reason))
        return confirmed_params


def main():
    requests = prepare_requests(args)
    final_result = {}
    is_single = not args.import_file
    try:
        mem.var['kill'] = False
        count = 0
        for request in requests:
            url = request['url']
            these_params = initialize(request, wordlist, single_url=is_single)
            count += 1
            mem.var['kill'] = False
            mem.var['bad_req_count'] = 0
            print('%s Scanning %d/%d: %s' % (run, count, len(requests), url))
            if these_params == 'skipped':
                print('%s Skipped %s due to errors' % (bad, url))
            elif these_params:
                final_result[url] = {}
                final_result[url]['params'] = these_params
                final_result[url]['method'] = request['method']
                final_result[url]['headers'] = request['headers']
                exporter(final_result)
                print('%s Parameters found: %s\n' % (good, ', '.join(final_result[url]['params'])))
                if not mem.var['json_file']:
                    final_result = {}
                continue
            else:
                print('%s No parameters were discovered.\n' % info)
    except KeyboardInterrupt:
        exit()


if __name__ == '__main__':
    main()
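# For reference, final_result above maps each URL to its findings; assuming the
# exporter writes that dict out as-is, a -oJ file would look roughly like this
# (illustrative values):
#
#   {
#       "https://api.example.com/endpoint": {
#           "params": ["id", "token"],
#           "method": "GET",
#           "headers": {"User-Agent": "..."}
#       }
#   }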