From 8be8216521a68ed400e78134a1aca9a5c1de25db Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 1 May 2023 16:42:32 -0400 Subject: [PATCH 001/387] massdns improvements, added module sequence --- bbot/core/event/base.py | 14 ++++ bbot/modules/httpx.py | 4 +- bbot/modules/massdns.py | 140 +++++++++++++++++++---------------- bbot/modules/output/csv.py | 2 +- bbot/modules/output/human.py | 2 +- 5 files changed, 95 insertions(+), 67 deletions(-) diff --git a/bbot/core/event/base.py b/bbot/core/event/base.py index cd16574dac..a88c5314fc 100644 --- a/bbot/core/event/base.py +++ b/bbot/core/event/base.py @@ -447,6 +447,8 @@ def json(self, mode="json"): j.update({"tags": list(self.tags)}) if self.module: j.update({"module": str(self.module)}) + if self.module_sequence: + j.update({"module_sequence": str(self.module_sequence)}) # normalize non-primitive python objects for k, v in list(j.items()): @@ -463,6 +465,18 @@ def json(self, mode="json"): def from_json(j): return event_from_json(j) + @property + def module_sequence(self): + """ + A human-friendly representation of the module name that includes modules from omitted source events + + Helpful in identifying where a URL came from + """ + module_name = getattr(self.module, "name", "") + if getattr(self.source, "_omit", False): + module_name = f"{self.source.module_sequence}->{module_name}" + return module_name + @property def module_priority(self): if self._module_priority is None: diff --git a/bbot/modules/httpx.py b/bbot/modules/httpx.py index d367951ac9..6641b38301 100644 --- a/bbot/modules/httpx.py +++ b/bbot/modules/httpx.py @@ -136,14 +136,14 @@ def handle_batch(self, *events): title = self.helpers.tagify(j.get("title", "")) if title: tags.append(f"http-title-{title}") - url_event = self.make_event(url, "URL", source_event, module=source_event.module, tags=tags) + url_event = self.make_event(url, "URL", source_event, tags=tags) if url_event: if url_event != source_event: self.emit_event(url_event) else: url_event._resolved.set() # HTTP response - self.emit_event(j, "HTTP_RESPONSE", url_event, module=source_event.module, internal=True) + self.emit_event(j, "HTTP_RESPONSE", url_event, internal=True) def cleanup(self): resume_file = self.helpers.current_dir / "resume.cfg" diff --git a/bbot/modules/massdns.py b/bbot/modules/massdns.py index fd8b58bc85..10b69aa0cd 100644 --- a/bbot/modules/massdns.py +++ b/bbot/modules/massdns.py @@ -233,80 +233,94 @@ def _massdns(self, domain, subdomains): def finish(self): found = sorted(self.found.items(), key=lambda x: len(x[-1]), reverse=True) + # if we have a lot of rounds to make, don't try mutations on less-populated domains + avg_subdomains = sum([len(subdomains) for domain, subdomains in found[:50]]) / len(found[:50]) + trimmed_found = [] + for i, (domain, subdomains) in enumerate(found): + # accept domains that are in the top 50 or have more than 5 percent of the average number of subdomains + if i < 50 or (len(subdomains) > 1 and len(subdomains) >= (avg_subdomains * 0.05)): + trimmed_found.append((domain, subdomains)) + else: + self.verbose( + f"Skipping mutations on {domain} because it only has {len(subdomains):,} subdomain(s) (avg: {avg_subdomains:,})" + ) base_mutations = set() - for i, (domain, subdomains) in enumerate(found): - # keep looping as long as we're finding things - while 1: - max_mem_percent = 90 - mem_status = self.helpers.memory_status() - # abort if we don't have the memory - mem_percent = mem_status.percent - if mem_percent > max_mem_percent: - free_memory = 
mem_status.available - free_memory_human = self.helpers.bytes_to_human(free_memory) - self.hugewarning( - f"Cannot proceed with DNS mutations because system memory is at {mem_percent:.1f}% ({free_memory_human} remaining)" - ) - break + try: + for i, (domain, subdomains) in enumerate(trimmed_found): + self.verbose(f"{domain} has {len(subdomains):,} subdomains") + # keep looping as long as we're finding things + while 1: + max_mem_percent = 90 + mem_status = self.helpers.memory_status() + # abort if we don't have the memory + mem_percent = mem_status.percent + if mem_percent > max_mem_percent: + free_memory = mem_status.available + free_memory_human = self.helpers.bytes_to_human(free_memory) + assert ( + False + ), f"Cannot proceed with DNS mutations because system memory is at {mem_percent:.1f}% ({free_memory_human} remaining)" - query = domain - domain_hash = hash(domain) - if self.scan.stopping: - return + query = domain + domain_hash = hash(domain) + if self.scan.stopping: + return - mutations = set(base_mutations) + mutations = set(base_mutations) - def add_mutation(_domain_hash, m): - h = hash((_domain_hash, m)) - if h not in self.mutations_tried: - self.mutations_tried.add(h) - mutations.add(m) + def add_mutation(_domain_hash, m): + h = hash((_domain_hash, m)) + if h not in self.mutations_tried: + self.mutations_tried.add(h) + mutations.add(m) - # try every subdomain everywhere else - for _domain, _subdomains in found: - if _domain == domain: - continue - for s in _subdomains: - first_segment = s.split(".")[0] - # skip stuff with lots of numbers (e.g. PTRs) - digits = self.digit_regex.findall(first_segment) - excessive_digits = len(digits) > 2 - long_digits = any(len(d) > 3 for d in digits) - if excessive_digits or long_digits: + # try every subdomain everywhere else + for _domain, _subdomains in found: + if _domain == domain: continue - add_mutation(domain_hash, first_segment) - for word in self.helpers.extract_words( - first_segment, word_regexes=self.helpers.word_cloud.dns_mutator.extract_word_regexes - ): - add_mutation(domain_hash, word) + for s in _subdomains: + first_segment = s.split(".")[0] + # skip stuff with lots of numbers (e.g. 
PTRs) + digits = self.digit_regex.findall(first_segment) + excessive_digits = len(digits) > 2 + long_digits = any(len(d) > 3 for d in digits) + if excessive_digits or long_digits: + continue + add_mutation(domain_hash, first_segment) + for word in self.helpers.extract_words( + first_segment, word_regexes=self.helpers.word_cloud.dns_mutator.extract_word_regexes + ): + add_mutation(domain_hash, word) - # word cloud - for mutation in self.helpers.word_cloud.mutations( - subdomains, cloud=False, numbers=3, number_padding=1 - ): - for delimiter in ("", ".", "-"): - m = delimiter.join(mutation).lower() - add_mutation(domain_hash, m) + # numbers + devops mutations + for mutation in self.helpers.word_cloud.mutations( + subdomains, cloud=False, numbers=3, number_padding=1 + ): + for delimiter in ("", ".", "-"): + m = delimiter.join(mutation).lower() + add_mutation(domain_hash, m) - # special dns mutator - for subdomain in self.helpers.word_cloud.dns_mutator.mutations( - subdomains, max_mutations=self.max_mutations - ): - add_mutation(domain_hash, subdomain) + # special dns mutator + for subdomain in self.helpers.word_cloud.dns_mutator.mutations( + subdomains, max_mutations=self.max_mutations + ): + add_mutation(domain_hash, subdomain) - if mutations: - self.info(f"Trying {len(mutations):,} mutations against {domain} ({i+1}/{len(found)})") - results = list(self.massdns(query, mutations)) - for hostname in results: - source_event = self.get_source_event(hostname) - if source_event is None: - self.warning(f"Could not correlate source event from: {hostname}") + if mutations: + self.info(f"Trying {len(mutations):,} mutations against {domain} ({i+1}/{len(found)})") + results = list(self.massdns(query, mutations)) + for hostname in results: + source_event = self.get_source_event(hostname) + if source_event is None: + self.warning(f"Could not correlate source event from: {hostname}") + continue + self.emit_result(hostname, source_event, query) + if results: continue - self.emit_result(hostname, source_event, query) - if results: - continue - break + break + except AssertionError as e: + self.warning(e) def add_found(self, host): if not isinstance(host, str): diff --git a/bbot/modules/output/csv.py b/bbot/modules/output/csv.py index aa18483ae9..81ecc8ca8c 100644 --- a/bbot/modules/output/csv.py +++ b/bbot/modules/output/csv.py @@ -52,7 +52,7 @@ def handle_event(self, event): "IP Address": ",".join( str(x) for x in getattr(event, "resolved_hosts", set()) if self.helpers.is_ip(x) ), - "Source Module": str(getattr(event, "module", "")), + "Source Module": str(getattr(event, "module_sequence", "")), "Scope Distance": str(getattr(event, "scope_distance", "")), "Event Tags": ",".join(sorted(list(getattr(event, "tags", [])))), } diff --git a/bbot/modules/output/human.py b/bbot/modules/output/human.py index b9eef9402e..61f403c095 100644 --- a/bbot/modules/output/human.py +++ b/bbot/modules/output/human.py @@ -20,7 +20,7 @@ def handle_event(self, event): event_tags = "" if getattr(event, "tags", []): event_tags = f'\t({", ".join(sorted(getattr(event, "tags", [])))})' - event_str = f"{event_type:<20}\t{event.data_human}\t{event.module}{event_tags}" + event_str = f"{event_type:<20}\t{event.data_human}\t{event.module_sequence}{event_tags}" # log vulnerabilities in vivid colors if event.type == "VULNERABILITY": severity = event.data.get("severity", "INFO") From 839ef0a8de33b8a41da0b979fd44baa5c3d787b3 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 1 May 2023 16:59:59 -0400 Subject: [PATCH 002/387] division by 
zero --- bbot/modules/massdns.py | 19 ++++++++++--------- 1 file changed, 10 insertions(+), 9 deletions(-) diff --git a/bbot/modules/massdns.py b/bbot/modules/massdns.py index 10b69aa0cd..718dc0eb58 100644 --- a/bbot/modules/massdns.py +++ b/bbot/modules/massdns.py @@ -234,16 +234,17 @@ def _massdns(self, domain, subdomains): def finish(self): found = sorted(self.found.items(), key=lambda x: len(x[-1]), reverse=True) # if we have a lot of rounds to make, don't try mutations on less-populated domains - avg_subdomains = sum([len(subdomains) for domain, subdomains in found[:50]]) / len(found[:50]) trimmed_found = [] - for i, (domain, subdomains) in enumerate(found): - # accept domains that are in the top 50 or have more than 5 percent of the average number of subdomains - if i < 50 or (len(subdomains) > 1 and len(subdomains) >= (avg_subdomains * 0.05)): - trimmed_found.append((domain, subdomains)) - else: - self.verbose( - f"Skipping mutations on {domain} because it only has {len(subdomains):,} subdomain(s) (avg: {avg_subdomains:,})" - ) + if found: + avg_subdomains = sum([len(subdomains) for domain, subdomains in found[:50]]) / len(found[:50]) + for i, (domain, subdomains) in enumerate(found): + # accept domains that are in the top 50 or have more than 5 percent of the average number of subdomains + if i < 50 or (len(subdomains) > 1 and len(subdomains) >= (avg_subdomains * 0.05)): + trimmed_found.append((domain, subdomains)) + else: + self.verbose( + f"Skipping mutations on {domain} because it only has {len(subdomains):,} subdomain(s) (avg: {avg_subdomains:,})" + ) base_mutations = set() try: From 1400e6c94cc6098a7fbe5c227cba6b8dde60f712 Mon Sep 17 00:00:00 2001 From: liquidsec Date: Fri, 5 May 2023 19:26:08 -0400 Subject: [PATCH 003/387] set status frequency default to 15 and made configurable --- bbot/defaults.yml | 2 ++ bbot/scanner/manager.py | 10 ++++++---- 2 files changed, 8 insertions(+), 4 deletions(-) diff --git a/bbot/defaults.yml b/bbot/defaults.yml index a22c296cc8..6de4c44c48 100644 --- a/bbot/defaults.yml +++ b/bbot/defaults.yml @@ -75,6 +75,8 @@ dns_filter_ptrs: true dns_debug: false # Whether to verify SSL certificates ssl_verify: false +# Interval for displaying status messages +status_frequency: 15 # How many scan results to keep before cleaning up the older ones keep_scans: 20 # Completely ignore URLs with these extensions diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 913c24f5e8..fd7d585daf 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -34,6 +34,8 @@ def __init__(self, scan): self.events_resolved = dict() self.dns_resolution = self.scan.config.get("dns_resolution", False) + self.status_frequency = self.scan.config.get("status_frequency", 15) + self.last_log_time = datetime.now() def init_events(self): @@ -407,7 +409,7 @@ def loop_until_finished(self): yield from events try: - self.log_status() + self.log_status(self.status_frequency) event, kwargs = self.incoming_event_queue.get_nowait() while not self.scan.aborting: try: @@ -416,7 +418,7 @@ def loop_until_finished(self): activity = True break except queue.Full: - self.log_status() + self.log_status(self.status_frequency) with self.event_emitted: self.event_emitted.wait(timeout=0.1) except queue.Empty: @@ -451,8 +453,8 @@ def loop_until_finished(self): for mod in self.scan.modules.values(): self.catch(mod._register_running, mod.report, _force=True) - def log_status(self, frequency=10): - # print status every 10 seconds + def log_status(self, frequency=15): + # print status 
every 15 seconds (or status_frequency setting) timedelta_secs = timedelta(seconds=frequency) now = datetime.now() time_since_last_log = now - self.last_log_time From 91b4f988358d04da591f491edd22409e75db4bbd Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 5 May 2023 09:44:37 -0400 Subject: [PATCH 004/387] basic scan working (no modules) --- bbot/cli.py | 33 ++- bbot/core/event/base.py | 6 +- bbot/core/helpers/async_helpers.py | 46 ++++ bbot/core/helpers/dns.py | 239 +++++++----------- bbot/core/helpers/helper.py | 5 - bbot/core/helpers/misc.py | 4 + bbot/core/helpers/threadpool.py | 266 -------------------- bbot/modules/base.py | 166 +++++-------- bbot/modules/internal/aggregate.py | 2 +- bbot/modules/internal/excavate.py | 4 +- bbot/modules/internal/speculate.py | 4 +- bbot/modules/output/asset_inventory.py | 4 +- bbot/modules/output/csv.py | 11 +- bbot/modules/output/http.py | 2 +- bbot/modules/output/human.py | 11 +- bbot/modules/output/json.py | 11 +- bbot/modules/output/neo4j.py | 2 +- bbot/modules/output/web_report.py | 2 +- bbot/modules/output/websocket.py | 2 +- bbot/modules/report/asn.py | 2 +- bbot/scanner/manager.py | 324 ++++++++++--------------- bbot/scanner/scanner.py | 192 +++++++-------- bbot/test/test.conf | 2 +- bbot/test/test_step_2/test_helpers.py | 104 +------- bbot/test/test_step_2/test_manager.py | 20 ++ poetry.lock | 21 +- pyproject.toml | 1 + 27 files changed, 506 insertions(+), 980 deletions(-) create mode 100644 bbot/core/helpers/async_helpers.py delete mode 100644 bbot/core/helpers/threadpool.py diff --git a/bbot/cli.py b/bbot/cli.py index ea8f305690..55ee624f3d 100755 --- a/bbot/cli.py +++ b/bbot/cli.py @@ -2,6 +2,7 @@ import os import sys +import asyncio import logging import threading import traceback @@ -31,9 +32,12 @@ from . 
import config -def main(): +scan_name = "" + + +async def _main(): err = False - scan_name = "" + global scan_name ensure_config_files() @@ -258,7 +262,7 @@ def main(): scanner.helpers.word_cloud.load(options.load_wordcloud) - scanner.prep() + await scanner.prep() if not options.dry_run: if not options.agent_mode and not options.yes and sys.stdin.isatty(): @@ -282,7 +286,7 @@ def keyboard_listen(): keyboard_listen_thread = threading.Thread(target=keyboard_listen, daemon=True) keyboard_listen_thread.start() - scanner.start_without_generator() + await scanner.start_without_generator() except bbot.core.errors.ScanError as e: log_to_stderr(str(e), level="ERROR") @@ -290,7 +294,7 @@ def keyboard_listen(): raise finally: with suppress(NameError): - scanner.cleanup() + await scanner.cleanup() except bbot.core.errors.BBOTError as e: log_to_stderr(f"{e} (--debug for details)", level="ERROR") @@ -302,13 +306,6 @@ def keyboard_listen(): log_to_stderr(f"Encountered unknown error: {traceback.format_exc()}", level="ERROR") err = True - except KeyboardInterrupt: - msg = "Interrupted" - if scan_name: - msg = f"You killed {scan_name}" - log_to_stderr(msg, level="ERROR") - err = True - finally: # save word cloud with suppress(BaseException): @@ -330,5 +327,17 @@ def keyboard_listen(): """ +def main(): + global scan_name + try: + asyncio.run(_main()) + except KeyboardInterrupt: + msg = "Interrupted" + if scan_name: + msg = f"You killed {scan_name}" + log_to_stderr(msg, level="ERROR") + err = True + + if __name__ == "__main__": main() diff --git a/bbot/core/event/base.py b/bbot/core/event/base.py index a88c5314fc..f96e4a79a2 100644 --- a/bbot/core/event/base.py +++ b/bbot/core/event/base.py @@ -1,4 +1,5 @@ import json +import asyncio import logging import ipaddress import traceback @@ -6,7 +7,6 @@ from datetime import datetime from contextlib import suppress from pydantic import BaseModel, validator -from threading import Event as ThreadingEvent from .helpers import * from bbot.core.errors import * @@ -125,8 +125,8 @@ def __init__( if _internal: # or source._internal: self.make_internal() - # a threading event indicating whether the event has undergone DNS resolution yet - self._resolved = ThreadingEvent() + # an event indicating whether the event has undergone DNS resolution + self._resolved = asyncio.Event() @property def data(self): diff --git a/bbot/core/helpers/async_helpers.py b/bbot/core/helpers/async_helpers.py new file mode 100644 index 0000000000..9a7b7bcde1 --- /dev/null +++ b/bbot/core/helpers/async_helpers.py @@ -0,0 +1,46 @@ +import asyncio +import logging +from contextlib import asynccontextmanager + +log = logging.getLogger("bbot.core.helpers.async_helpers") + +from .cache import CacheDict + + +class _Lock(asyncio.Lock): + def __init__(self, name): + self.name = name + super().__init__() + + +class NamedLock: + """ + Returns a unique asyncio.Lock() based on a provided string + + Useful for preventing multiple operations from occuring on the same data in parallel + E.g. 
simultaneous DNS lookups on the same hostname + """ + + def __init__(self, max_size=1000): + self._cache = CacheDict(max_size=max_size) + + @asynccontextmanager + async def lock(self, name): + try: + lock = self._cache.get(name) + except KeyError: + lock = _Lock(name) + self._cache.put(name, lock) + async with lock: + yield + + +class TaskCounter: + def __init__(self): + self.value = 0 + + def __enter__(self): + self.value += 1 + + def __exit__(self, exc_type, exc_val, exc_tb): + self.value -= 1 diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index cd3686e23e..1089206a61 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -1,15 +1,15 @@ import json +import asyncio import logging import ipaddress import traceback -import dns.resolver import dns.exception -from threading import Lock +import dns.asyncresolver from contextlib import suppress from .regexes import dns_name_regex +from bbot.core.helpers.async_helpers import NamedLock from bbot.core.errors import ValidationError, DNSError -from .threadpool import NamedLock, PatchedThreadPoolExecutor from .misc import is_ip, is_domain, domain_parents, parent_domain, rand_string, cloudcheck log = logging.getLogger("bbot.core.helpers.dns") @@ -20,13 +20,12 @@ class DNSHelper: For automatic wildcard detection, nameserver validation, etc. """ - nameservers_url = "https://public-dns.info/nameserver/nameservers.json" all_rdtypes = ["A", "AAAA", "SRV", "MX", "NS", "SOA", "CNAME", "TXT"] def __init__(self, parent_helper): self.parent_helper = parent_helper try: - self.resolver = dns.resolver.Resolver() + self.resolver = dns.asyncresolver.Resolver() except Exception as e: raise DNSError(f"Failed to create BBOT DNS resolver: {e}") self.timeout = self.parent_helper.config.get("dns_timeout", 5) @@ -48,25 +47,13 @@ def __init__(self, parent_helper): self._wildcard_lock = NamedLock() # keeps track of warnings issued for wildcard detection to prevent duplicate warnings self._dns_warnings = set() - self._errors = dict() - self._error_lock = Lock() - self.fallback_nameservers_file = self.parent_helper.wordlist_dir / "nameservers.txt" - - # we need our own threadpool because using the shared one can lead to deadlocks - max_workers = self.parent_helper.config.get("max_dns_threads", 100) - self._thread_pool = PatchedThreadPoolExecutor(max_workers=max_workers) - + self.max_threads = self.parent_helper.config.get("max_dns_threads", 100) self._debug = self.parent_helper.config.get("dns_debug", False) - self._dummy_modules = dict() - self._dummy_modules_lock = Lock() - self._dns_cache = self.parent_helper.CacheDict(max_size=100000) - self._event_cache = self.parent_helper.CacheDict(max_size=10000) - self._event_cache_lock = Lock() self._event_cache_locks = NamedLock() # copy the system's current resolvers to a text file for tool use @@ -75,7 +62,7 @@ def __init__(self, parent_helper): self.filter_bad_ptrs = self.parent_helper.config.get("dns_filter_ptrs", True) - def resolve(self, query, **kwargs): + async def resolve(self, query, **kwargs): """ "1.2.3.4" --> { "evilcorp.com", @@ -86,14 +73,14 @@ def resolve(self, query, **kwargs): } """ results = set() - raw_results, errors = self.resolve_raw(query, **kwargs) + raw_results, errors = await self.resolve_raw(query, **kwargs) for rdtype, answers in raw_results: for answer in answers: for _, t in self.extract_targets(answer): results.add(t) return results - def resolve_raw(self, query, **kwargs): + async def resolve_raw(self, query, **kwargs): # DNS over TCP is more reliable # But setting 
this breaks DNS resolution on Ubuntu because systemd-resolve doesn't support TCP # kwargs["tcp"] = True @@ -101,7 +88,7 @@ def resolve_raw(self, query, **kwargs): if is_ip(query): kwargs.pop("type", None) kwargs.pop("rdtype", None) - results, errors = self._resolve_ip(query, **kwargs) + results, errors = await self._resolve_ip(query, **kwargs) return [("PTR", results)], [("PTR", e) for e in errors] else: results = [] @@ -118,7 +105,7 @@ def resolve_raw(self, query, **kwargs): elif any([isinstance(t, x) for x in (list, tuple)]): types = [str(_).strip().upper() for _ in t] for t in types: - r, e = self._resolve_hostname(query, rdtype=t, **kwargs) + r, e = await self._resolve_hostname(query, rdtype=t, **kwargs) if r: results.append((t, r)) for error in e: @@ -126,13 +113,7 @@ def resolve_raw(self, query, **kwargs): return (results, errors) - def submit_task(self, *args, **kwargs): - try: - return self._thread_pool.submit(*args, **kwargs) - except RuntimeError as e: - log.debug(f"Error submitting DNS thread task: {e}") - - def _resolve_hostname(self, query, **kwargs): + async def _resolve_hostname(self, query, **kwargs): self.debug(f"Resolving {query} with kwargs={kwargs}") results = [] errors = [] @@ -144,8 +125,8 @@ def _resolve_hostname(self, query, **kwargs): parent_hash = hash(f"{parent}:{rdtype}") dns_cache_hash = hash(f"{query}:{rdtype}") while tries_left > 0: - if self.parent_helper.scan_stopping: - break + # if self.parent_helper.scan_stopping: + # break try: try: results = self._dns_cache[dns_cache_hash] @@ -156,19 +137,17 @@ def _resolve_hostname(self, query, **kwargs): f'Aborting query "{query}" because failed {rdtype} queries for "{parent}" ({error_count:,}) exceeded abort threshold ({self.abort_threshold:,})' ) return results, errors - results = list(self._catch(self.resolver.resolve, query, **kwargs)) + results = await self._catch(self.resolver.resolve, query, **kwargs) if cache_result: self._dns_cache[dns_cache_hash] = results - with self._error_lock: - if parent_hash in self._errors: - self._errors[parent_hash] = 0 + if parent_hash in self._errors: + self._errors[parent_hash] = 0 break except (dns.resolver.NoNameservers, dns.exception.Timeout, dns.resolver.LifetimeTimeout) as e: - with self._error_lock: - try: - self._errors[parent_hash] += 1 - except KeyError: - self._errors[parent_hash] = 1 + try: + self._errors[parent_hash] += 1 + except KeyError: + self._errors[parent_hash] = 1 errors.append(e) # don't retry if we get a SERVFAIL if isinstance(e, dns.resolver.NoNameservers): @@ -184,10 +163,9 @@ def _resolve_hostname(self, query, **kwargs): else: log.verbose(err_msg) - self.debug(f"Results for {query} with kwargs={kwargs}: {results}") return results, errors - def _resolve_ip(self, query, **kwargs): + async def _resolve_ip(self, query, **kwargs): self.debug(f"Reverse-resolving {query} with kwargs={kwargs}") retries = kwargs.pop("retries", 0) cache_result = kwargs.pop("cache_result", False) @@ -196,13 +174,13 @@ def _resolve_ip(self, query, **kwargs): errors = [] dns_cache_hash = hash(f"{query}:PTR") while tries_left > 0: - if self.parent_helper.scan_stopping: - break + # if self.parent_helper.scan_stopping: + # break try: if dns_cache_hash in self._dns_cache: result = self._dns_cache[dns_cache_hash] else: - result = list(self._catch(self.resolver.resolve_address, query, **kwargs)) + result = await self._catch(self.resolver.resolve_address, query, **kwargs) if cache_result: self._dns_cache[dns_cache_hash] = result return result, errors @@ -220,21 +198,21 @@ def 
_resolve_ip(self, query, **kwargs): self.debug(f"Results for {query} with kwargs={kwargs}: {results}") return results, errors - def handle_wildcard_event(self, event, children): + async def handle_wildcard_event(self, event, children): event_host = str(event.host) # wildcard checks if not is_ip(event.host): # check if this domain is using wildcard dns event_target = "target" in event.tags - for hostname, wildcard_domain_rdtypes in self.is_wildcard_domain( - event_host, log_info=event_target + for hostname, wildcard_domain_rdtypes in ( + await self.is_wildcard_domain(event_host, log_info=event_target) ).items(): if wildcard_domain_rdtypes: event.add_tag("wildcard-domain") for rdtype, ips in wildcard_domain_rdtypes.items(): event.add_tag(f"{rdtype.lower()}-wildcard-domain") # check if the dns name itself is a wildcard entry - wildcard_rdtypes = self.is_wildcard(event_host) + wildcard_rdtypes = await self.is_wildcard(event_host) for rdtype, (is_wildcard, wildcard_host) in wildcard_rdtypes.items(): wildcard_tag = "error" if is_wildcard == True: @@ -263,7 +241,7 @@ def handle_wildcard_event(self, event, children): log.debug(f'Wildcard detected, changing event.data "{event.data}" --> "{wildcard_data}"') event.data = wildcard_data - def resolve_event(self, event, minimal=False): + async def resolve_event(self, event, minimal=False): """ Tag event with appropriate dns record types Optionally create child events from dns resolutions @@ -279,7 +257,7 @@ def resolve_event(self, event, minimal=False): return event_tags, event_whitelisted, event_blacklisted, dns_children # lock to ensure resolution of the same host doesn't start while we're working here - with self._event_cache_locks.get_lock(event_host): + async with self._event_cache_locks.lock(event_host): # try to get data from cache _event_tags, _event_whitelisted, _event_blacklisted, _dns_children = self.event_cache_get(event_host) event_tags.update(_event_tags) @@ -299,17 +277,9 @@ def resolve_event(self, event, minimal=False): types = ("A", "AAAA") if types: - futures = {} - for t in types: - future = self.submit_task( - self._catch_keyboardinterrupt, self.resolve_raw, event_host, type=t, cache_result=True - ) - if future is None: - break - futures[future] = t - - for future in self.parent_helper.as_completed(futures): - resolved_raw, errors = future.result() + tasks = [self.resolve_raw(event_host, type=t, cache_result=True) for t in types] + for task in asyncio.as_completed(tasks): + resolved_raw, errors = await task for rdtype, e in errors: if rdtype not in resolved_raw: event_tags.add(f"{rdtype.lower()}-error") @@ -380,22 +350,23 @@ def event_cache_get(self, host): except KeyError: return set(), None, None, set() - def resolve_batch(self, queries, **kwargs): + async def resolve_batch(self, queries, **kwargs): """ - resolve_batch("www.evilcorp.com", "evilcorp.com") --> [ + await resolve_batch("www.evilcorp.com", "evilcorp.com") --> [ ("www.evilcorp.com", {"1.1.1.1"}), ("evilcorp.com", {"2.2.2.2"}) ] """ - futures = dict() - for query in queries: - future = self.submit_task(self._catch_keyboardinterrupt, self.resolve, query, **kwargs) - if future is None: - break - futures[future] = query - for future in self.parent_helper.as_completed(futures): - query = futures[future] - yield (query, future.result()) + + async def coro_wrapper(q, **_kwargs): + """ + Helps us correlate task results back to their original arguments + """ + result = await self.resolve(q, **_kwargs) + return (q, result) + + for task in asyncio.as_completed([coro_wrapper(q, 
**kwargs) for q in queries]): + yield await task def extract_targets(self, record): """ @@ -424,44 +395,13 @@ def extract_targets(self, record): @staticmethod def _clean_dns_record(record): - with suppress(Exception): + if not isinstance(record, str): record = str(record.to_text()) return str(record).rstrip(".").lower() - def get_valid_resolvers(self, min_reliability=0.99): - nameservers = set() - nameservers_file = self.parent_helper.download(self.nameservers_url, cache_hrs=72) - if nameservers_file is None: - log.warning(f"Failed to download nameservers from {self.nameservers_url}") - else: - nameservers_json = [] - try: - nameservers_json = json.loads(open(nameservers_file).read()) - except Exception as e: - log.warning(f"Failed to load nameserver list from {nameservers_file}: {e}") - nameservers_file.unlink() - for entry in nameservers_json: - try: - ip = str(entry.get("ip", "")).strip() - except Exception: - continue - try: - reliability = float(entry.get("reliability", 0)) - except ValueError: - continue - if reliability >= min_reliability and is_ip(ip, version=4): - nameservers.add(ip) - log.verbose(f"Loaded {len(nameservers):,} nameservers from {self.nameservers_url}") - if not nameservers: - log.info(f"Loading fallback nameservers from {self.fallback_nameservers_file}") - lines = self.parent_helper.read_file(self.fallback_nameservers_file) - nameservers = set([l for l in lines if not l.startswith("#")]) - resolver_list = self.verify_nameservers(nameservers) - return resolver_list - - def _catch(self, callback, *args, **kwargs): + async def _catch(self, callback, *args, **kwargs): try: - return callback(*args, **kwargs) + return await callback(*args, **kwargs) except dns.resolver.NoNameservers: raise except (dns.exception.Timeout, dns.resolver.LifetimeTimeout): @@ -473,7 +413,7 @@ def _catch(self, callback, *args, **kwargs): log.warning(f"Error in {callback.__qualname__}() with args={args}, kwargs={kwargs}") return list() - def is_wildcard(self, query, ips=None, rdtype=None): + async def is_wildcard(self, query, ips=None, rdtype=None): """ Use this method to check whether a *host* is a wildcard entry @@ -507,31 +447,27 @@ def is_wildcard(self, query, ips=None, rdtype=None): parent = parent_domain(query) parents = list(domain_parents(query)) - futures = [] + wildcard_tasks = {t: [] for t in self.all_rdtypes} base_query_ips = dict() # if the caller hasn't already done the work of resolving the IPs if ips is None: # then resolve the query for all rdtypes for _rdtype in self.all_rdtypes: # resolve the base query - future = self.submit_task( - self._catch_keyboardinterrupt, self.resolve_raw, query, type=_rdtype, cache_result=True - ) - if future is None: - break - futures.append(future) - - for future in self.parent_helper.as_completed(futures): - raw_results, errors = future.result() - if errors and not raw_results: - self.debug(f"Failed to resolve {query} ({_rdtype}) during wildcard detection") - result[_rdtype] = (None, parent) - continue - for _rdtype, answers in raw_results: - base_query_ips[_rdtype] = set() - for answer in answers: - for _, t in self.extract_targets(answer): - base_query_ips[_rdtype].add(t) + wildcard_tasks[_rdtype].append(self.resolve_raw(query, type=_rdtype, cache_result=True)) + + for _rdtype, tasks in wildcard_tasks.items(): + for task in asyncio.as_completed(tasks): + raw_results, errors = await task + if errors and not raw_results: + self.debug(f"Failed to resolve {query} ({_rdtype}) during wildcard detection") + result[_rdtype] = (None, parent) + continue + 
for __rdtype, answers in raw_results: + base_query_ips[__rdtype] = set() + for answer in answers: + for _, t in self.extract_targets(answer): + base_query_ips[__rdtype].add(t) else: # otherwise, we can skip all that base_query_ips[rdtype] = set([self._clean_dns_record(ip) for ip in ips]) @@ -550,7 +486,7 @@ def is_wildcard(self, query, ips=None, rdtype=None): for host in parents[::-1]: host_hash = hash(host) # make sure we've checked that domain for wildcards - self.is_wildcard_domain(host) + await self.is_wildcard_domain(host) if host_hash in self._wildcard_cache: # then get its IPs from our wildcard cache wildcard_rdtypes = self._wildcard_cache[host_hash] @@ -565,7 +501,7 @@ def is_wildcard(self, query, ips=None, rdtype=None): return result - def is_wildcard_domain(self, domain, log_info=False): + async def is_wildcard_domain(self, domain, log_info=False): """ Check whether a domain is using wildcard DNS @@ -581,14 +517,14 @@ def is_wildcard_domain(self, domain, log_info=False): for i, host in enumerate(parents[::-1]): # have we checked this host before? host_hash = hash(host) - with self._wildcard_lock.get_lock(host_hash): + async with self._wildcard_lock.lock(host_hash): # if we've seen this host before if host_hash in self._wildcard_cache: wildcard_domain_results[host] = self._wildcard_cache[host_hash] continue # determine if this is a wildcard domain - wildcard_futures = {} + wildcard_tasks = {t: [] for t in self.all_rdtypes} # resolve a bunch of random subdomains of the same parent for rdtype in self.all_rdtypes: # continue if a wildcard was already found for this rdtype @@ -596,29 +532,19 @@ def is_wildcard_domain(self, domain, log_info=False): # continue for _ in range(self.wildcard_tests): rand_query = f"{rand_string(digits=False, length=10)}.{host}" - future = self.submit_task( - self._catch_keyboardinterrupt, - self.resolve, - rand_query, - type=rdtype, - cache_result=False, - ) - if future is None: - break - wildcard_futures[future] = rdtype + wildcard_tasks[rdtype].append(self.resolve(rand_query, type=rdtype, cache_result=False)) # combine the random results is_wildcard = False wildcard_results = dict() - for future in self.parent_helper.as_completed(wildcard_futures): - results = future.result() - rdtype = wildcard_futures[future] - if results: - is_wildcard = True - if results: - if not rdtype in wildcard_results: - wildcard_results[rdtype] = set() - wildcard_results[rdtype].update(results) + for rdtype, tasks in wildcard_tasks.items(): + for task in asyncio.as_completed(tasks): + results = await task + if results: + is_wildcard = True + if not rdtype in wildcard_results: + wildcard_results[rdtype] = set() + wildcard_results[rdtype].update(results) self._wildcard_cache.update({host_hash: wildcard_results}) wildcard_domain_results.update({host: wildcard_results}) @@ -646,12 +572,11 @@ def debug(self, *args, **kwargs): log.debug(*args, **kwargs) def _get_dummy_module(self, name): - with self._dummy_modules_lock: - try: - dummy_module = self._dummy_modules[name] - except KeyError: - dummy_module = self.parent_helper._make_dummy_module(name=name, _type="DNS") - self._dummy_modules[name] = dummy_module + try: + dummy_module = self._dummy_modules[name] + except KeyError: + dummy_module = self.parent_helper._make_dummy_module(name=name, _type="DNS") + self._dummy_modules[name] = dummy_module return dummy_module def dns_warning(self, msg): diff --git a/bbot/core/helpers/helper.py b/bbot/core/helpers/helper.py index fda18fa745..db6f1b74a8 100644 --- a/bbot/core/helpers/helper.py +++ 
b/bbot/core/helpers/helper.py @@ -9,7 +9,6 @@ from .wordcloud import WordCloud from .cloud import CloudProviders from .interactsh import Interactsh -from .threadpool import as_completed from ...scanner.target import Target from ...modules.base import BaseModule from .depsinstaller import DepsInstaller @@ -88,10 +87,6 @@ def scan_stopping(self): def in_tests(self): return os.environ.get("BBOT_TESTING", "") == "True" - @staticmethod - def as_completed(*args, **kwargs): - return as_completed(*args, **kwargs) - def _make_dummy_module(self, name, _type="scan"): """ Construct a dummy module, for attachment to events diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index e3637d2187..e65766843a 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -1020,3 +1020,7 @@ def cloudcheck(ip): with suppress(KeyError): provider = provider_map[provider.lower()] return provider, provider_type, subnet + + +def is_async_function(f): + return inspect.iscoroutinefunction(f) diff --git a/bbot/core/helpers/threadpool.py b/bbot/core/helpers/threadpool.py deleted file mode 100644 index ef5ca8d4ec..0000000000 --- a/bbot/core/helpers/threadpool.py +++ /dev/null @@ -1,266 +0,0 @@ -import queue -import logging -import threading -import traceback -from datetime import datetime -from queue import SimpleQueue, Full -from concurrent.futures import ThreadPoolExecutor - -log = logging.getLogger("bbot.core.helpers.threadpool") - -from .cache import CacheDict -from ...core.errors import ScanCancelledError - - -def pretty_fn(a): - if callable(a): - return a.__qualname__ - return a - - -class ThreadPoolSimpleQueue(SimpleQueue): - def __init__(self, *args, **kwargs): - self._executor = kwargs.pop("_executor", None) - assert self._executor is not None, "Must specify _executor" - - def get(self, *args, **kwargs): - work_item = super().get(*args, **kwargs) - if work_item is not None: - thread_id = threading.get_ident() - self._executor._current_work_items[thread_id] = (work_item, datetime.now()) - return work_item - - -class PatchedThreadPoolExecutor(ThreadPoolExecutor): - """ - This class exists only because of a bug in cpython where - futures are not properly marked CANCELLED_AND_NOTIFIED: - https://github.com/python/cpython/issues/87893 - """ - - def shutdown(self, wait=True, *, cancel_futures=False): - with self._shutdown_lock: - self._shutdown = True - if cancel_futures: - # Drain all work items from the queue, and then cancel their - # associated futures. - while 1: - try: - work_item = self._work_queue.get_nowait() - except queue.Empty: - break - if work_item is not None: - if work_item.future.cancel(): - work_item.future.set_running_or_notify_cancel() - - # Send a wake-up to prevent threads calling - # _work_queue.get(block=True) from permanently blocking. 
- self._work_queue.put(None) - if wait: - for t in self._threads: - t.join() - - -class BBOTThreadPoolExecutor(PatchedThreadPoolExecutor): - """ - Allows inspection of thread pool to determine which functions are currently executing - """ - - def __init__(self, *args, **kwargs): - super().__init__(*args, **kwargs) - self._current_work_items = {} - self._work_queue = ThreadPoolSimpleQueue(_executor=self) - - @property - def threads_status(self): - work_items = [] - for thread_id, (work_item, start_time) in sorted(self._current_work_items.items()): - func = work_item.fn.__qualname__ - func_index = 0 - if work_item and not work_item.future.done(): - for i, f in enumerate(list(work_item.args)): - if callable(f): - func = f.__qualname__ - func_index = i + 1 - else: - break - running_for = datetime.now() - start_time - wi_args = list(work_item.args)[func_index:] - wi_args = [pretty_fn(a) for a in wi_args] - wi_args = str(wi_args).strip("[]") - wi_kwargs = ", ".join(["{0}={1}".format(k, pretty_fn(v)) for k, v in work_item.kwargs.items()]) - func_with_args = f"{func}({wi_args}" + (f", {wi_kwargs}" if wi_kwargs else "") + ")" - work_items.append( - (running_for, f"running for {int(running_for.total_seconds()):>3} seconds: {func_with_args}") - ) - work_items.sort(key=lambda x: x[0]) - return [x[-1] for x in work_items] - - -class ThreadPoolWrapper: - """ - Layers more granular control overtop of a shared thread pool - Allows setting lower thread limits for modules, etc. - """ - - def __init__(self, executor, max_workers=None, qsize=None): - self.executor = executor - self.max_workers = max_workers - self.max_qsize = qsize - self.futures = set() - - self._num_tasks = 0 - self._task_count_lock = threading.Lock() - - self._lock = threading.RLock() - self.not_full = threading.Condition(self._lock) - - try: - self.executor._thread_pool_wrappers.append(self) - except AttributeError: - self.executor._thread_pool_wrappers = [self] - - def submit_task(self, callback, *args, **kwargs): - """ - A wrapper around threadpool.submit() - """ - block = kwargs.pop("_block", True) - force = kwargs.pop("_force_submit", False) - success = False - with self.not_full: - self.num_tasks_increment() - try: - if not force: - if not block: - if self.is_full or self.underlying_executor_is_full: - raise Full - else: - # wait until there's room - while self.is_full or self.underlying_executor_is_full: - self.not_full.wait() - - try: - # submit the job - future = self.executor.submit(self._execute_callback, callback, *args, **kwargs) - future.add_done_callback(self._on_future_done) - success = True - return future - except RuntimeError as e: - raise ScanCancelledError(e) - finally: - if not success: - self.num_tasks_decrement() - - def _execute_callback(self, callback, *args, **kwargs): - try: - return callback(*args, **kwargs) - finally: - self.num_tasks_decrement() - - def _on_future_done(self, future): - if future.cancelled(): - self.num_tasks_decrement() - - @property - def num_tasks(self): - with self._task_count_lock: - return self._num_tasks - - def num_tasks_increment(self): - with self._task_count_lock: - self._num_tasks += 1 - - def num_tasks_decrement(self): - with self._task_count_lock: - self._num_tasks = max(0, self._num_tasks - 1) - for wrapper in self.executor._thread_pool_wrappers: - try: - with wrapper.not_full: - wrapper.not_full.notify() - except RuntimeError: - continue - except Exception as e: - log.warning(f"Unknown error in num_tasks_decrement(): {e}") - log.trace(traceback.format_exc()) - - @property - def 
is_full(self): - if self.max_workers is None: - return False - return self.num_tasks > self.max_workers - - @property - def underlying_executor_is_full(self): - return self.max_qsize is not None and self.qsize >= self.max_qsize - - @property - def qsize(self): - return self.executor._work_queue.qsize() - - def shutdown(self, *args, **kwargs): - self.executor.shutdown(*args, **kwargs) - - @property - def threads_status(self): - return self.executor.threads_status - - -from concurrent.futures._base import FINISHED -from concurrent.futures._base import as_completed as as_completed_orig - - -def as_completed(*args, **kwargs): - for f in as_completed_orig(*args, **kwargs): - if f._state == FINISHED: - yield f - - -class _Lock: - def __init__(self, name): - self.name = name - self.lock = threading.Lock() - - def __enter__(self): - self.lock.acquire() - - def __exit__(self, exc_type, exc_val, exc_tb): - self.lock.release() - - -class NamedLock: - """ - Returns a unique threading.Lock() based on a provided string - - Useful for preventing multiple operations from occuring on the same data in parallel - E.g. simultaneous DNS lookups on the same hostname - """ - - def __init__(self, max_size=1000): - self._cache = CacheDict(max_size=max_size) - - def get_lock(self, name): - try: - return self._cache.get(name) - except KeyError: - new_lock = _Lock(name) - self._cache.put(name, new_lock) - return new_lock - - -class TaskCounter: - def __init__(self): - self._value = 0 - self.lock = threading.Lock() - - def __enter__(self): - with self.lock: - self._value += 1 - - def __exit__(self, exc_type, exc_val, exc_tb): - with self.lock: - self._value -= 1 - - @property - def value(self): - with self.lock: - return self._value diff --git a/bbot/modules/base.py b/bbot/modules/base.py index 8e1728d6c6..888a56f9a7 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -1,12 +1,12 @@ import queue +import asyncio import logging import threading -import traceback from sys import exc_info from contextlib import suppress from ..core.helpers.misc import get_size -from ..core.helpers.threadpool import ThreadPoolWrapper, TaskCounter +from ..core.helpers.async_helpers import TaskCounter from ..core.errors import ScanCancelledError, ValidationError, WordlistError @@ -76,28 +76,21 @@ class BaseModule: # Type, for differentiating between normal modules and output modules, etc. 
_type = "scan" - _report_lock = threading.Lock() - def __init__(self, scan): self.scan = scan self.errored = False self._log = None self._incoming_event_queue = None # seconds since we've submitted a batch + self._outgoing_event_queue = None + # seconds since we've submitted a batch self._last_submitted_batch = None - # wrapper around shared thread pool to ensure that a single module doesn't hog more than its share - self.thread_pool = ThreadPoolWrapper(self.scan._thread_pool) - self._internal_thread_pool = ThreadPoolWrapper( - self.scan._internal_thread_pool.executor, max_workers=self.max_event_handlers - ) # additional callbacks to be executed alongside self.cleanup() self.cleanup_callbacks = [] self._cleanedup = False self._watched_events = None - self._lock = threading.RLock() - self._running_counter = TaskCounter() - self.event_received = threading.Condition(self._lock) + self._task_counter = TaskCounter() # string constant self._custom_filter_criteria_msg = "it did not meet custom filter criteria" @@ -105,7 +98,7 @@ def __init__(self, scan): # track number of failures (for .request_with_fail_count()) self._request_failures = 0 - def setup(self): + async def setup(self): """ Perform setup functions at the beginning of the scan. Optionally override this method. @@ -114,7 +107,7 @@ def setup(self): """ return True - def handle_event(self, event): + async def handle_event(self, event): """ Override this method if batch_size == 1. """ @@ -135,7 +128,7 @@ def filter_event(self, event): """ return True - def finish(self): + async def finish(self): """ Perform final functions when scan is nearing completion @@ -147,7 +140,7 @@ def finish(self): """ return - def report(self): + async def report(self): """ Perform a final task when the scan is finished, but before cleanup happens @@ -155,7 +148,7 @@ def report(self): """ return - def cleanup(self): + async def cleanup(self): """ Perform final cleanup after the scan has finished This method is called only once, and may not raise events. 
@@ -211,21 +204,21 @@ def submit_task(self, *args, **kwargs): kwargs["_block"] = False return self.thread_pool.submit_task(self.catch, *args, **kwargs) - def catch(self, *args, **kwargs): - return self.scan.manager.catch(*args, **kwargs) + async def catch(self, *args, **kwargs): + return await self.scan.manager.catch(*args, **kwargs) - def _postcheck_and_run(self, callback, event): + async def _postcheck_and_run(self, callback, event): acceptable, reason = self._event_postcheck(event) if not acceptable: if reason: self.debug(f"Not accepting {event} because {reason}") return self.scan.stats.event_consumed(event, self) - return callback(event) + return await callback(event) - def _register_running(self, callback, *args, **kwargs): - with self._running_counter: - return callback(*args, **kwargs) + async def _register_running(self, callback, *args, **kwargs): + with self._task_counter: + return await callback(*args, **kwargs) def _handle_batch(self, force=False): if self.batch_size <= 1: @@ -276,24 +269,7 @@ def emit_event(self, *args, **kwargs): for o in ("on_success_callback", "abort_if", "quick"): event_kwargs.pop(o, None) event = self.make_event(*args, **event_kwargs) - if event is None: - return - # nerf event's priority if it's likely not to be in scope - if event.scope_distance > 0: - event_in_scope = self.scan.whitelisted(event) and not self.scan.blacklisted(event) - if not event_in_scope: - event.module_priority += event.scope_distance - if event: - # Wait for parent event to resolve (in case its scope distance changes) - while 1: - if self.scan.stopping: - return - resolved = event.source._resolved.wait(timeout=0.1) - if resolved: - # update event's scope distance based on its parent - event.scope_distance = event.source.scope_distance + 1 - break - self.scan.manager.incoming_event_queue.put((event, kwargs)) + self.scan.manager.queue_event(event) @property def events_waiting(self): @@ -324,16 +300,15 @@ def num_queued_events(self): return ret def start(self): - self.thread = threading.Thread(target=self._worker, daemon=True) - self.thread.start() + self.tasks = [asyncio.create_task(self._worker()) for _ in range(self.max_event_handlers)] - def _setup(self): + async def _setup(self): status_codes = {False: "hard-fail", None: "soft-fail", True: "success"} status = False self.debug(f"Setting up module {self.name}") try: - result = self.setup() + result = await self.setup() if type(result) == tuple and len(result) == 2: status, msg = result else: @@ -346,7 +321,7 @@ def _setup(self): status = None msg = f"{e}" self.trace() - return status, str(msg) + return self.name, status, str(msg) @property def _force_batch(self): @@ -356,41 +331,36 @@ def _force_batch(self): # if we're below our maximum threading potential return self._internal_thread_pool.num_tasks < self.max_event_handlers - def _worker(self): + async def _worker(self): try: while not self.scan.stopping: # hold the reigns if our outgoing queue is full - if self._qsize and self.outgoing_event_queue_qsize >= self._qsize: - with self.event_received: - self.event_received.wait(timeout=0.1) - continue + # if self._qsize and self.outgoing_event_queue.qsize() >= self._qsize: + # with self.event_received: + # await self.event_received.wait() if self.batch_size > 1: - submitted = self._handle_batch(force=self._force_batch) - if not submitted: - with self.event_received: - self.event_received.wait(timeout=0.1) + pass + # submitted = self._handle_batch(force=self._force_batch) + # if not submitted: + # with self.event_received: + # await 
self.event_received.wait() else: try: if self.incoming_event_queue: - e = self.incoming_event_queue.get(timeout=0.1) + e = await self.incoming_event_queue.get() else: self.debug(f"Event queue is in bad state") return except queue.Empty: continue - self.debug(f"Got {e} from {getattr(e, 'module', e)}") + self.debug(f"Got {e} from {getattr(e, 'module', 'unknown_module')}") # if we receive the special "FINISHED" event if e.type == "FINISHED": - self._internal_thread_pool.submit_task(self.catch, self._register_running, self.finish) + await self.catch(self._register_running, self.finish) else: - if self._type == "output": - self.catch(self._register_running, self._postcheck_and_run, self.handle_event, e) - else: - self._internal_thread_pool.submit_task( - self.catch, self._register_running, self._postcheck_and_run, self.handle_event, e - ) + await self.catch(self._register_running, self._postcheck_and_run, self.handle_event, e) except KeyboardInterrupt: self.debug(f"Interrupted") @@ -486,12 +456,12 @@ def _event_postcheck(self, event): return True, "" - def _cleanup(self): + async def _cleanup(self): if not self._cleanedup: self._cleanedup = True for callback in [self.cleanup] + self.cleanup_callbacks: if callable(callback): - self.catch(self._register_running, callback, _force=True) + await self.catch(self._register_running, callback, _force=True) def queue_event(self, event): if self.incoming_event_queue in (None, False): @@ -503,11 +473,9 @@ def queue_event(self, event): self.debug(f"Not accepting {event} because {reason}") return try: - self.incoming_event_queue.put(event) + self.incoming_event_queue.put_nowait(event) except AttributeError: self.debug(f"Not in an acceptable state to queue event") - with self.event_received: - self.event_received.notify() def set_error_state(self, message=None): if not self.errored: @@ -535,34 +503,27 @@ def helpers(self): @property def status(self): - main_pool = self.thread_pool.num_tasks - internal_pool = self._internal_thread_pool.num_tasks - pool_total = main_pool + internal_pool - incoming_qsize = 0 - if self.incoming_event_queue: - incoming_qsize = self.incoming_event_queue.qsize() status = { - "events": {"incoming": incoming_qsize, "outgoing": self.outgoing_event_queue_qsize}, - "tasks": {"main_pool": main_pool, "internal_pool": internal_pool, "total": pool_total}, + "events": {"incoming": self.num_queued_events, "outgoing": self.outgoing_event_queue.qsize()}, + "tasks": self._task_counter.value, "errored": self.errored, } status["running"] = self.running - status["active"] = self._is_active(status) return status - @staticmethod - def _is_active(status): - if status["running"]: - return True - total = status["tasks"]["total"] + status["events"]["incoming"] + status["events"]["outgoing"] - return total > 0 - @property def running(self): """ Indicates whether the module is currently processing data. 
""" - return self._running_counter.value > 0 + return self._task_counter.value > 0 + + @property + def finished(self): + """ + Indicates whether the module is finished (not running and nothing in queues) + """ + return not self.running and self.num_queued_events <= 0 and self.outgoing_event_queue.qsize() <= 0 def request_with_fail_count(self, *args, **kwargs): r = self.helpers.request(*args, **kwargs) @@ -593,12 +554,14 @@ def config(self): @property def incoming_event_queue(self): if self._incoming_event_queue is None: - self._incoming_event_queue = queue.PriorityQueue() + self._incoming_event_queue = asyncio.PriorityQueue() return self._incoming_event_queue @property - def outgoing_event_queue_qsize(self): - return self.scan.manager.incoming_event_queue.modules.get(str(self), 0) + def outgoing_event_queue(self): + if self._outgoing_event_queue is None: + self._outgoing_event_queue = asyncio.PriorityQueue() + return self._outgoing_event_queue @property def priority(self): @@ -627,18 +590,17 @@ def __str__(self): return self.name def log_table(self, *args, **kwargs): - with self._report_lock: - table_name = kwargs.pop("table_name", None) - table = self.helpers.make_table(*args, **kwargs) - for line in table.splitlines(): - self.info(line) - if table_name is not None: - date = self.helpers.make_date() - filename = self.scan.home / f"{self.helpers.tagify(table_name)}-table-{date}.txt" - with open(filename, "w") as f: - f.write(table) - self.verbose(f"Wrote {table_name} to {filename}") - return table + table_name = kwargs.pop("table_name", None) + table = self.helpers.make_table(*args, **kwargs) + for line in table.splitlines(): + self.info(line) + if table_name is not None: + date = self.helpers.make_date() + filename = self.scan.home / f"{self.helpers.tagify(table_name)}-table-{date}.txt" + with open(filename, "w") as f: + f.write(table) + self.verbose(f"Wrote {table_name} to {filename}") + return table def stdout(self, *args, **kwargs): self.log.stdout(*args, extra={"scan_id": self.scan.id}, **kwargs) diff --git a/bbot/modules/internal/aggregate.py b/bbot/modules/internal/aggregate.py index ddda0b2b3e..b1f11b04e7 100644 --- a/bbot/modules/internal/aggregate.py +++ b/bbot/modules/internal/aggregate.py @@ -5,5 +5,5 @@ class aggregate(BaseReportModule): flags = ["passive", "safe"] meta = {"description": "Summarize statistics at the end of a scan"} - def report(self): + async def report(self): self.log_table(*self.scan.stats._make_table(), table_name="scan-stats") diff --git a/bbot/modules/internal/excavate.py b/bbot/modules/internal/excavate.py index c57d6ffa10..6bf98a8604 100644 --- a/bbot/modules/internal/excavate.py +++ b/bbot/modules/internal/excavate.py @@ -299,7 +299,7 @@ class excavate(BaseInternalModule): deps_pip = ["pyjwt~=2.6.0"] - def setup(self): + async def setup(self): self.hostname = HostnameExtractor(self) self.url = URLExtractor(self) self.email = EmailExtractor(self) @@ -316,7 +316,7 @@ def search(self, source, extractors, event, **kwargs): for e in extractors: e.search(source, event, **kwargs) - def handle_event(self, event): + async def handle_event(self, event): data = event.data # HTTP_RESPONSE is a special case diff --git a/bbot/modules/internal/speculate.py b/bbot/modules/internal/speculate.py index f4f4724268..74e67ef507 100644 --- a/bbot/modules/internal/speculate.py +++ b/bbot/modules/internal/speculate.py @@ -25,7 +25,7 @@ class speculate(BaseInternalModule): _scope_shepherding = False _priority = 4 - def setup(self): + async def setup(self): 
self.open_port_consumers = any(["OPEN_TCP_PORT" in m.watched_events for m in self.scan.modules.values()]) self.portscanner_enabled = any(["portscan" in m.flags for m in self.scan.modules.values()]) self.range_to_ip = True @@ -47,7 +47,7 @@ def setup(self): return True - def handle_event(self, event): + async def handle_event(self, event): # generate individual IP addresses from IP range if event.type == "IP_RANGE" and self.range_to_ip: net = ipaddress.ip_network(event.data) diff --git a/bbot/modules/output/asset_inventory.py b/bbot/modules/output/asset_inventory.py index f4c0e235ad..f904728556 100644 --- a/bbot/modules/output/asset_inventory.py +++ b/bbot/modules/output/asset_inventory.py @@ -33,7 +33,7 @@ class asset_inventory(CSV): header_row = ["Host", "Provider", "IP(s)", "Status", "Open Ports", "Risk Rating", "Findings", "Description"] filename = "asset-inventory.csv" - def setup(self): + async def setup(self): self.assets = {} self.open_port_producers = "httpx" in self.scan.modules or any( ["portscan" in m.flags for m in self.scan.modules.values()] @@ -41,7 +41,7 @@ def setup(self): self.use_previous = self.config.get("use_previous", False) self.summary_netmask = self.config.get("summary_netmask", 16) self.emitted_contents = False - ret = super().setup() + ret = await super().setup() return ret def filter_event(self, event): diff --git a/bbot/modules/output/csv.py b/bbot/modules/output/csv.py index 866cb21497..feed0491db 100644 --- a/bbot/modules/output/csv.py +++ b/bbot/modules/output/csv.py @@ -13,7 +13,7 @@ class CSV(BaseOutputModule): header_row = ["Event type", "Event data", "IP Address", "Source Module", "Scope Distance", "Event Tags"] filename = "output.csv" - def setup(self): + async def setup(self): self.custom_headers = [] self._headers_set = set() self._writer = None @@ -43,7 +43,7 @@ def writerow(self, row): self.writer.writerow(row) self.file.flush() - def handle_event(self, event): + async def handle_event(self, event): # ["Event type", "Event data", "IP Address", "Source Module", "Scope Distance", "Event Tags"] self.writerow( { @@ -58,15 +58,14 @@ def handle_event(self, event): } ) - def cleanup(self): + async def cleanup(self): if getattr(self, "_file", None) is not None: with suppress(Exception): self.file.close() - def report(self): + async def report(self): if self._file is not None: - with self._report_lock: - self.info(f"Saved CSV output to {self.output_file}") + self.info(f"Saved CSV output to {self.output_file}") def add_custom_headers(self, headers): if isinstance(headers, str): diff --git a/bbot/modules/output/http.py b/bbot/modules/output/http.py index 04c8e30101..1e3449df3b 100644 --- a/bbot/modules/output/http.py +++ b/bbot/modules/output/http.py @@ -25,7 +25,7 @@ class HTTP(BaseOutputModule): "timeout": "HTTP timeout", } - def setup(self): + async def setup(self): self.session = requests.Session() if not self.config.get("url", ""): self.warning("Must set URL") diff --git a/bbot/modules/output/human.py b/bbot/modules/output/human.py index de9aa858d9..ac80144bb1 100644 --- a/bbot/modules/output/human.py +++ b/bbot/modules/output/human.py @@ -11,11 +11,11 @@ class Human(BaseOutputModule): options_desc = {"output_file": "Output to file", "console": "Output to console"} vuln_severity_map = {"LOW": "HUGEWARNING", "MEDIUM": "HUGEWARNING", "HIGH": "CRITICAL", "CRITICAL": "CRITICAL"} - def setup(self): + async def setup(self): self._prep_output_dir("output.txt") return True - def handle_event(self, event): + async def handle_event(self, event): event_type = 
f"[{event.type}]" event_tags = "" if getattr(event, "tags", []): @@ -36,12 +36,11 @@ def handle_event(self, event): if self.config.get("console", True): self.stdout(event_str) - def cleanup(self): + async def cleanup(self): if getattr(self, "_file", None) is not None: with suppress(Exception): self.file.close() - def report(self): + async def report(self): if self._file is not None: - with self._report_lock: - self.info(f"Saved TXT output to {self.output_file}") + self.info(f"Saved TXT output to {self.output_file}") diff --git a/bbot/modules/output/json.py b/bbot/modules/output/json.py index 6b1a698bf7..561354c45c 100644 --- a/bbot/modules/output/json.py +++ b/bbot/modules/output/json.py @@ -10,11 +10,11 @@ class JSON(BaseOutputModule): options = {"output_file": "", "console": False} options_desc = {"output_file": "Output to file", "console": "Output to console"} - def setup(self): + async def setup(self): self._prep_output_dir("output.json") return True - def handle_event(self, event): + async def handle_event(self, event): event_str = json.dumps(dict(event)) if self.file is not None: self.file.write(event_str + "\n") @@ -22,12 +22,11 @@ def handle_event(self, event): if self.config.get("console", False) or "human" not in self.scan.modules: self.stdout(event_str) - def cleanup(self): + async def cleanup(self): if getattr(self, "_file", None) is not None: with suppress(Exception): self.file.close() - def report(self): + async def report(self): if self._file is not None: - with self._report_lock: - self.info(f"Saved JSON output to {self.output_file}") + self.info(f"Saved JSON output to {self.output_file}") diff --git a/bbot/modules/output/neo4j.py b/bbot/modules/output/neo4j.py index 55c00acb92..ea7e3ff720 100644 --- a/bbot/modules/output/neo4j.py +++ b/bbot/modules/output/neo4j.py @@ -19,7 +19,7 @@ class neo4j(BaseOutputModule): deps_pip = ["py2neo~=2021.2.3"] batch_size = 50 - def setup(self): + async def setup(self): try: self.neo4j = Neo4j( uri=self.config.get("uri", self.options["uri"]), diff --git a/bbot/modules/output/web_report.py b/bbot/modules/output/web_report.py index 40e8e8e483..da973a6e38 100644 --- a/bbot/modules/output/web_report.py +++ b/bbot/modules/output/web_report.py @@ -13,7 +13,7 @@ class web_report(BaseOutputModule): options_desc = {"output_file": "Output to file", "css_theme_file": "CSS theme URL for HTML output"} deps_pip = ["markdown~=3.4.3"] - def setup(self): + async def setup(self): html_css_file = self.config.get("css_theme_file", "") self.html_header = f""" diff --git a/bbot/modules/output/websocket.py b/bbot/modules/output/websocket.py index 2a7bc625ed..55b06f7adb 100644 --- a/bbot/modules/output/websocket.py +++ b/bbot/modules/output/websocket.py @@ -12,7 +12,7 @@ class Websocket(BaseOutputModule): options = {"url": "", "token": ""} options_desc = {"url": "Web URL", "token": "Authorization Bearer token"} - def setup(self): + async def setup(self): self.url = self.config.get("url", "") if not self.url: return False, "Must set URL" diff --git a/bbot/modules/report/asn.py b/bbot/modules/report/asn.py index 04c36db881..331fddafd1 100644 --- a/bbot/modules/report/asn.py +++ b/bbot/modules/report/asn.py @@ -45,7 +45,7 @@ def handle_event(self, event): for email in emails: self.emit_event(email, "EMAIL_ADDRESS", source=asn_event) - def report(self): + async def report(self): asn_data = sorted(self.asn_cache.items(), key=lambda x: self.asn_counts[x[0]], reverse=True) if not asn_data: return diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 
fd7d585daf..32620faa0d 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -1,12 +1,13 @@ import queue +import asyncio import logging -import threading import traceback from time import sleep from contextlib import suppress from datetime import datetime, timedelta from ..core.helpers.queueing import EventQueue +from ..core.helpers.async_helpers import TaskCounter from ..core.errors import ScanCancelledError, ValidationError log = logging.getLogger("bbot.scanner.manager") @@ -23,77 +24,74 @@ def __init__(self, scan): # tracks duplicate events on a global basis self.events_distributed = set() - # tracks duplicate events on a per-module basis self.events_accepted = set() - self.events_accepted_lock = threading.Lock() - - self._lock = threading.Lock() - self.event_emitted = threading.Condition(self._lock) - - self.events_resolved = dict() self.dns_resolution = self.scan.config.get("dns_resolution", False) - - self.status_frequency = self.scan.config.get("status_frequency", 15) + self._task_counter = TaskCounter() + self._new_activity = True self.last_log_time = datetime.now() - def init_events(self): + async def init_events(self): """ seed scanner with target events """ - self.distribute_event(self.scan.root_event) - sorted_events = sorted(self.scan.target.events, key=lambda e: len(e.data)) - for event in sorted_events: - self.scan.verbose(f"Target: {event}") - self.emit_event(event, _block=False, _force_submit=True) - # force submit batches - for mod in self.scan.modules.values(): - mod._handle_batch(force=True) - - def emit_event(self, event, *args, **kwargs): + with self._task_counter: + self.distribute_event(self.scan.root_event) + sorted_events = sorted(self.scan.target.events, key=lambda e: len(e.data)) + for event in sorted_events: + self.scan.verbose(f"Target: {event}") + self.queue_event(event) + # force submit batches + # for mod in self.scan.modules.values(): + # mod._handle_batch(force=True) + self.scan._finished_init = True + + async def emit_event(self, event, *args, **kwargs): """ TODO: Register + kill duplicate events immediately? 
bbot.scanner: scan._event_thread_pool: running for 0 seconds: ScanManager._emit_event(DNS_NAME("sipfed.online.lync.com")) bbot.scanner: scan._event_thread_pool: running for 0 seconds: ScanManager._emit_event(DNS_NAME("sipfed.online.lync.com")) bbot.scanner: scan._event_thread_pool: running for 0 seconds: ScanManager._emit_event(DNS_NAME("sipfed.online.lync.com")) """ - # skip event if it fails precheck - if not self._event_precheck(event): - event._resolved.set() - return False - - # "quick" queues the event immediately - quick = kwargs.pop("quick", False) - if quick: - log.debug(f'Module "{event.module}" raised {event}') - event._resolved.set() - for kwarg in ["abort_if", "on_success_callback", "_block"]: - kwargs.pop(kwarg, None) - try: - self.distribute_event(event, *args, **kwargs) - return True - except ScanCancelledError: + with self._task_counter: + # skip event if it fails precheck + if not self._event_precheck(event): + event._resolved.set() return False - except Exception as e: - log.error(f"Unexpected error in manager.emit_event(): {e}") - log.trace(traceback.format_exc()) - else: - # don't raise an exception if the thread pool has been shutdown - try: - self.scan._event_thread_pool.submit_task(self.catch, self._emit_event, event, *args, **kwargs) + + # "quick" queues the event immediately + quick = kwargs.pop("quick", False) + if quick: log.debug(f'Module "{event.module}" raised {event}') - return True - except ScanCancelledError: - return False - except queue.Full: - raise - except Exception as e: - log.error(f"Unexpected error in manager.emit_event(): {e}") - log.trace(traceback.format_exc()) - finally: event._resolved.set() - return False + for kwarg in ["abort_if", "on_success_callback", "_block"]: + kwargs.pop(kwarg, None) + try: + self.distribute_event(event, *args, **kwargs) + return True + except ScanCancelledError: + return False + except Exception as e: + log.error(f"Unexpected error in manager.emit_event(): {e}") + log.trace(traceback.format_exc()) + else: + # don't raise an exception if the thread pool has been shutdown + error = True + try: + await self.catch(self._emit_event, event, *args, **kwargs) + error = False + log.debug(f'Module "{event.module}" raised {event}') + return True + except ScanCancelledError: + return False + except Exception as e: + log.error(f"Unexpected error in manager.emit_event(): {e}") + log.trace(traceback.format_exc()) + finally: + if error: + event._resolved.set() + return False def _event_precheck(self, event, exclude=("DNS_NAME",)): """ @@ -110,7 +108,7 @@ def _event_precheck(self, event, exclude=("DNS_NAME",)): return False return True - def _emit_event(self, event, *args, **kwargs): + async def _emit_event(self, event, *args, **kwargs): log.debug(f"Emitting {event}") distribute_event = True event_distributed = False @@ -134,7 +132,7 @@ def _emit_event(self, event, *args, **kwargs): event_whitelisted_dns, event_blacklisted_dns, dns_children, - ) = self.scan.helpers.dns.resolve_event(event, minimal=not self.dns_resolution) + ) = await self.scan.helpers.dns.resolve_event(event, minimal=not self.dns_resolution) resolved_hosts = set() for rdtype, ips in dns_children.items(): if rdtype in ("A", "AAAA", "CNAME"): @@ -193,7 +191,7 @@ def _emit_event(self, event, *args, **kwargs): log.debug(f"Making {event} in-scope") source_trail = event.make_in_scope(set_scope_distance) for s in source_trail: - self.emit_event(s, _block=False, _force_submit=True) + self.queue_event(s) else: if event.scope_distance > self.scan.scope_report_distance: 
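                    # counterpart to the make_in_scope() branch above: events beyond
                    # scope_report_distance are not promoted in-scope, only logged below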
log.debug( @@ -205,7 +203,7 @@ def _emit_event(self, event, *args, **kwargs): if event.scope_distance <= self.scan.scope_search_distance: if not "unresolved" in event.tags: if not self.scan.helpers.is_ip_type(event.host): - self.scan.helpers.dns.handle_wildcard_event(event, dns_children) + await self.scan.helpers.dns.handle_wildcard_event(event, dns_children) # now that the event is properly tagged, we can finally make decisions about it if callable(abort_if): @@ -232,7 +230,7 @@ def _emit_event(self, event, *args, **kwargs): ) source_trail = event.unmake_internal(force_output=True) for s in source_trail: - self.emit_event(s, _block=False, _force_submit=True) + self.queue_event(s) if distribute_event: self.distribute_event(event) @@ -253,17 +251,16 @@ def _emit_event(self, event, *args, **kwargs): source_event.scope_distance = event.scope_distance if "target" in event.tags: source_event.add_tag("target") - self.emit_event(source_event, _block=False, _force_submit=True) + self.queue_event(source_event) ### Emit DNS children ### if self.dns_resolution: emit_children = -1 < event.scope_distance < self.scan.dns_search_distance if emit_children: host_hash = hash(str(event.host)) - with self.events_accepted_lock: - if host_hash in self.events_accepted: - emit_children = False - self.events_accepted.add(host_hash) + if host_hash in self.events_accepted: + emit_children = False + self.events_accepted.add(host_hash) if emit_children: dns_child_events = [] @@ -282,7 +279,7 @@ def _emit_event(self, event, *args, **kwargs): f'Event validation failed for DNS child of {source_event}: "{record}" ({rdtype}): {e}' ) for child_event in dns_child_events: - self.emit_event(child_event, _block=False, _force_submit=True) + self.queue_event(child_event) except ValidationError as e: log.warning(f"Event validation failed with args={args}, kwargs={kwargs}: {e}") @@ -292,8 +289,6 @@ def _emit_event(self, event, *args, **kwargs): event._resolved.set() if event_distributed: self.scan.stats.event_distributed(event) - with self.event_emitted: - self.event_emitted.notify() log.debug(f"{event.module}.emit_event() finished for {event}") def hash_event(self, event): @@ -316,10 +311,9 @@ def is_duplicate_event(self, event, add=False): """ event_hash = self.hash_event(event) suppress_dupes = getattr(event.module, "suppress_dupes", True) - with self.events_accepted_lock: - duplicate_event = suppress_dupes and event_hash in self.events_accepted - if add: - self.events_accepted.add(event_hash) + duplicate_event = suppress_dupes and event_hash in self.events_accepted + if add: + self.events_accepted.add(event_hash) return duplicate_event def accept_event(self, event): @@ -329,7 +323,7 @@ def accept_event(self, event): return False return True - def catch(self, callback, *args, **kwargs): + async def catch(self, callback, *args, **kwargs): """ Wrapper to ensure error messages get surfaced to the user """ @@ -344,7 +338,10 @@ def catch(self, callback, *args, **kwargs): break try: if not self.scan.stopping or force: - ret = callback(*args, **kwargs) + if self.scan.helpers.is_async_function(callback): + ret = await callback(*args, **kwargs) + else: + ret = callback(*args, **kwargs) except ScanCancelledError as e: log.debug(f"ScanCancelledError in {fn.__qualname__}(): {e}") except BrokenPipeError as e: @@ -357,7 +354,10 @@ def catch(self, callback, *args, **kwargs): self.scan.stop() if callable(on_finish_callback): try: - on_finish_callback() + if self.scan.helpers.is_async_function(on_finish_callback): + await on_finish_callback() + 
else:
+                    on_finish_callback()
             except Exception as e:
                 log.error(
                     f"Error in on_finish_callback {on_finish_callback.__qualname__}() after {fn.__qualname__}(): {e}"
@@ -365,6 +365,10 @@ def catch(self, callback, *args, **kwargs):
                 log.trace(traceback.format_exc())
         return ret
 
+    async def _register_running(self, callback, *args, **kwargs):
+        with self._task_counter:
+            return await callback(*args, **kwargs)
+
     def distribute_event(self, *args, **kwargs):
         """
         Queue event with modules
@@ -384,63 +388,16 @@ def distribute_event(self, *args, **kwargs):
             if not dup or mod.accept_dupes:
                 mod.queue_event(event)
 
-    def loop_until_finished(self):
-        modules = list(self.scan.modules.values())
-        activity = True
-
+    async def _worker_loop(self):
         try:
-            self.scan.dispatcher.on_start(self.scan)
-
             while 1:
-                # abort if we're aborting
-                if self.scan.aborting:
-                    # Empty event queues
-                    for module in self.scan.modules.values():
-                        with suppress(queue.Empty):
-                            while 1:
-                                module.incoming_event_queue.get_nowait()
-                    with suppress(queue.Empty):
-                        while 1:
-                            self.incoming_event_queue.get_nowait()
-                    break
-
-                if "python" in self.scan.modules:
-                    events, finish, report = self.scan.modules["python"].events_waiting
-                    yield from events
-
                 try:
-                    self.log_status(self.status_frequency)
                     event, kwargs = self.incoming_event_queue.get_nowait()
-                    while not self.scan.aborting:
-                        try:
-                            acceptable = self.emit_event(event, _block=False, **kwargs)
-                            if acceptable:
-                                activity = True
-                            break
-                        except queue.Full:
-                            self.log_status(self.status_frequency)
-                            with self.event_emitted:
-                                self.event_emitted.wait(timeout=0.1)
+                    acceptable = await self.emit_event(event, **kwargs)
+                    if acceptable:
+                        self._new_activity = True
-                except queue.Empty:
+                except asyncio.QueueEmpty:
-                    # if we're on the last module
-                    modules_status = self.modules_status()
-                    finished = modules_status.get("finished", False)
-                    # And if the scan is finished
-                    if finished:
-                        # And if new events were generated since last time we were here
-                        if activity:
-                            activity = False
-                            self.scan.status = "FINISHING"
-                            # Trigger .finished() on every module and start over
-                            log.info("Finishing scan")
-                            finished_event = self.scan.make_event("FINISHED", "FINISHED", dummy=True)
-                            for module in modules:
-                                module.queue_event(finished_event)
-                        else:
-                            # Otherwise stop the scan if no new events were generated since last time
-                            break
-                    with self.incoming_event_queue.not_empty:
-                        self.incoming_event_queue.not_empty.wait(timeout=0.1)
+                    await asyncio.sleep(0.1)
 
         except KeyboardInterrupt:
             self.scan.stop()
 
@@ -448,52 +405,45 @@ def loop_until_finished(self):
         except Exception:
             log.critical(traceback.format_exc())
 
-        finally:
-            # Run .report() on every module
-            for mod in self.scan.modules.values():
-                self.catch(mod._register_running, mod.report, _force=True)
-
-    def log_status(self, frequency=15):
-        # print status every 15 seconds (or status_frequency setting)
-        timedelta_secs = timedelta(seconds=frequency)
-        now = datetime.now()
-        time_since_last_log = now - self.last_log_time
-        if time_since_last_log > timedelta_secs:
-            self.modules_status(_log=True, passes=1)
-            self.last_log_time = now
-
-    def modules_status(self, _log=False, passes=None):
-        # If scan looks to be finished, check an additional five times to ensure that it really is
-        # There is a tiny chance of a race condition, which this helps to avoid
-        if passes is None:
-            passes = 5
-        else:
-            passes = max(1, int(passes))
-
+    def queue_event(self, event, **kwargs):
+        if event:
+            # nerf event's priority if it's likely not to be in scope
+            if event.scope_distance > 0:
+                event_in_scope = 
self.scan.whitelisted(event) and not self.scan.blacklisted(event) + if not event_in_scope: + event.module_priority += event.scope_distance + # Wait for parent event to resolve (in case its scope distance changes) + # await resolved = event.source._resolved.wait() + # update event's scope distance based on its parent + event.scope_distance = event.source.scope_distance + 1 + self.incoming_event_queue.put_nowait((event, kwargs)) + + @property + def running(self): + return self._task_counter.value > 0 or self.incoming_event_queue.qsize() > 0 + + @property + def modules_finished(self): + return all(m.finished for m in self.scan.modules.values()) + + @property + def active(self): + return self.running or not self.modules_finished + + async def modules_status(self, _log=False): finished = True - while passes > 0: - status = {"modules": {}, "scan": self.scan.status_detailed} - - for num_tasks in status["scan"]["queued_tasks"].values(): - if num_tasks > 0: - finished = False - - for m in self.scan.modules.values(): - mod_status = m.status - if mod_status["active"]: - finished = False - status["modules"][m.name] = mod_status - - for mod in self.scan.modules.values(): - if mod.errored and mod.incoming_event_queue not in [None, False]: - with suppress(Exception): - mod.set_error_state() - - passes -= 1 - if finished and passes > 0: - sleep(0.1) - else: - break + status = {"modules": {}} + + for m in self.scan.modules.values(): + mod_status = m.status + if mod_status["running"]: + finished = False + status["modules"][m.name] = mod_status + + for mod in self.scan.modules.values(): + if mod.errored and mod.incoming_event_queue not in [None, False]: + with suppress(Exception): + mod.set_error_state() status["finished"] = finished @@ -505,7 +455,7 @@ def modules_status(self, _log=False, passes=None): running = s["running"] incoming = s["events"]["incoming"] outgoing = s["events"]["outgoing"] - tasks = s["tasks"]["total"] + tasks = s["tasks"] total = sum([incoming, outgoing, tasks]) if running or total > 0: modules_status.append((m, running, incoming, outgoing, tasks, total)) @@ -528,13 +478,6 @@ def modules_status(self, _log=False, passes=None): else: self.scan.info(f"{self.scan.name}: No events produced yet") - total_tasks = status["scan"]["queued_tasks"]["total"] - event_tasks = status["scan"]["queued_tasks"]["event"] - internal_tasks = status["scan"]["queued_tasks"]["internal"] - self.scan.verbose( - f"{self.scan.name}: Thread pool tasks: {total_tasks:,} (Event: {event_tasks:,}, Internal: {internal_tasks:,})" - ) - if modules_errored: self.scan.verbose( f'{self.scan.name}: Modules errored: {len(modules_errored):,} ({", ".join([m for m in modules_errored])})' @@ -550,29 +493,6 @@ def modules_status(self, _log=False, passes=None): else: self.scan.info(f"{self.scan.name}: No events in queue") - # if debugging is enabled - self.scan.debug(f"THREAD POOL STATUS:") - if self.scan.log_level <= logging.DEBUG: - # log thread pool statuses - threadpool_names = [ - "_internal_thread_pool", - "_event_thread_pool", - "_thread_pool", - ] - for threadpool_name in threadpool_names: - threadpool = getattr(self.scan, threadpool_name) - for thread_status in threadpool.threads_status: - self.scan.debug(f" - {threadpool_name}: {thread_status}") - # log module memory usage - module_memory_usage = [] - for module in self.scan.modules.values(): - memory_usage = module.memory_usage - module_memory_usage.append((module.name, memory_usage)) - module_memory_usage.sort(key=lambda x: x[-1], reverse=True) - self.scan.debug(f"MODULE 
MEMORY USAGE:") - for module_name, usage in module_memory_usage: - self.scan.debug(f" - {module_name}: {self.scan.helpers.bytes_to_human(usage)}") - # Uncomment these lines to enable debugging of event queues # queued_events = self.incoming_event_queue.events diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index 01a7e0831a..0b33903727 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -1,5 +1,5 @@ +import asyncio import logging -import threading import traceback from sys import exc_info from pathlib import Path @@ -22,7 +22,6 @@ from bbot.core.logger import init_logging, get_log_level from bbot.core.helpers.names_generator import random_name from bbot.core.configurator.environ import prepare_environment -from bbot.core.helpers.threadpool import ThreadPoolWrapper, BBOTThreadPoolExecutor from bbot.core.errors import BBOTError, ScanError, ScanCancelledError, ValidationError log = logging.getLogger("bbot.scanner") @@ -84,25 +83,8 @@ def __init__( self._status = "NOT_STARTED" self._status_code = 0 - # Set up thread pools - max_workers = max(1, self.config.get("max_threads", 25)) - # Shared thread pool, for module use - self._thread_pool = BBOTThreadPoolExecutor(max_workers=max_workers) - # Event thread pool, for event emission - self._event_thread_pool = ThreadPoolWrapper( - BBOTThreadPoolExecutor(max_workers=max_workers * 2), qsize=max_workers - ) - # Internal thread pool, for handle_event(), module setup, cleanup callbacks, etc. - self._internal_thread_pool = ThreadPoolWrapper(BBOTThreadPoolExecutor(max_workers=max_workers)) - self.process_pool = ThreadPoolWrapper(concurrent.futures.ProcessPoolExecutor()) + self.max_workers = max(1, self.config.get("max_threads", 25)) self.helpers = ConfigAwareHelper(config=self.config, scan=self) - self.pools = { - "process_pool": self.process_pool, - "internal_thread_pool": self._internal_thread_pool, - "dns_thread_pool": self.helpers.dns._thread_pool, - "event_thread_pool": self._event_thread_pool, - "main_thread_pool": self._thread_pool, - } output_dir = self.config.get("output_dir", "") if name is None: @@ -170,12 +152,14 @@ def __init__( "You have enabled custom HTTP headers. These will be attached to all in-scope requests and all requests made by httpx." 
)
 
+        # how often to print scan status
+        self.status_frequency = self.config.get("status_frequency", 15)
+
         self._prepped = False
-        self._thread_pools_shutdown = False
-        self._thread_pools_shutdown_threads = []
+        self._finished_init = False
         self._cleanedup = False
 
-    def prep(self):
+    async def prep(self):
         self.helpers.mkdir(self.home)
         if not self._prepped:
             start_msg = f"Scan with {len(self._scan_modules):,} modules seeded with {len(self.target):,} targets"
@@ -191,22 +175,26 @@ def prep(self):
             self.load_modules()
 
             self.info(f"Setting up modules...")
-            self.setup_modules()
+            await self.setup_modules()
             self.success(f"Setup succeeded for {len(self.modules):,} modules.")
             self._prepped = True
 
-    def start_without_generator(self):
-        deque(self.start(), maxlen=0)
+    async def start_without_generator(self):
+        async for event in self.start():
+            pass
 
-    def start(self):
-        self.prep()
+    async def start(self):
+        await self.prep()
 
         failed = True
 
         if not self.target:
             self.warning(f"No scan targets specified")
 
+        # start status ticker
+        ticker_task = asyncio.create_task(self._status_ticker(self.status_frequency))
+
         scan_start_time = datetime.now()
         try:
             self.status = "STARTING"
@@ -218,23 +206,59 @@ def start(self):
             else:
                 self.hugesuccess(f"Starting scan {self.name}")
 
-            if self.stopping:
-                return
+            self.dispatcher.on_start(self)
 
-            # distribute seed events
-            self.manager.init_events()
+            # start manager worker loops
+            manager_worker_loop_tasks = [
+                asyncio.create_task(self.manager._worker_loop()) for _ in range(self.max_workers)
+            ]
 
-            if self.stopping:
-                return
+            # distribute seed events
+            init_events_task = asyncio.create_task(self.manager.init_events())
 
             self.status = "RUNNING"
             self.start_modules()
             self.verbose(f"{len(self.modules):,} modules started")
 
-            if self.stopping:
-                return
+            # main scan loop
+            while 1:
+                # abort if we're aborting
+                if self.aborting:
+                    # Empty event queues
+                    for module in self.modules.values():
+                        with suppress(asyncio.QueueEmpty):
+                            while 1:
+                                module.incoming_event_queue.get_nowait()
+                    with suppress(asyncio.QueueEmpty):
+                        while 1:
+                            self.incoming_event_queue.get_nowait()
+                    break
+
+                if "python" in self.modules:
+                    events, finish, report = self.modules["python"].events_waiting
+                    for e in events:
+                        yield e
+
+                if self._finished_init and not self.manager.active:
+                    # And if new events were generated since last time we were here
+                    if self.manager._new_activity:
+                        self.manager._new_activity = False
+                        self.status = "FINISHING"
+                        # Trigger .finished() on every module and start over
+                        log.info("Finishing scan")
+                        finished_event = self.make_event("FINISHED", "FINISHED", dummy=True)
+                        for module in self.modules.values():
+                            module.queue_event(finished_event)
+                    else:
+                        # Otherwise stop the scan if no new events were generated since last time
+                        break
+
+                await asyncio.sleep(0.01)
+
+            # for module in self.modules.values():
+            #     for task in module.tasks:
+            #         await task
 
-            yield from self.manager.loop_until_finished()
             failed = False
 
         except KeyboardInterrupt:
@@ -255,21 +279,8 @@ def start(self):
             self.critical(f"Unexpected error during scan:\n{traceback.format_exc()}")
 
         finally:
-            self.cleanup()
-            self.shutdown_threadpools()
-            while 1:
-                for t in self._thread_pools_shutdown_threads:
-                    t.join(timeout=1)
-                    if t.is_alive():
-                        try:
-                            pool = t._args[0]
-                            for s in pool.threads_status:
-                                self.debug(s)
-                        except AttributeError:
-                            continue
-                if not any(t.is_alive() for t in self._thread_pools_shutdown_threads):
-                    self.debug("Finished shutting down thread pools")
-                    break
+            await self.report()
+            await self.cleanup()
 
             log_fn = self.hugesuccess
            if 
self.status == "ABORTING": @@ -281,6 +292,19 @@ def start(self): else: self.status = "FINISHED" + ticker_task.cancel() + with suppress(asyncio.CancelledError): + await ticker_task + + init_events_task.cancel() + with suppress(asyncio.CancelledError): + await init_events_task + + for t in manager_worker_loop_tasks: + t.cancel() + with suppress(asyncio.CancelledError): + await t + scan_run_time = datetime.now() - scan_start_time scan_run_time = self.helpers.human_timedelta(scan_run_time) log_fn(f"Scan {self.name} completed in {scan_run_time} with status {self.status}") @@ -288,23 +312,19 @@ def start(self): self.dispatcher.on_finish(self) def start_modules(self): - self.verbose(f"Starting module threads") + self.verbose(f"Starting module worker loops") for module_name, module in self.modules.items(): module.start() - def setup_modules(self, remove_failed=True): + async def setup_modules(self, remove_failed=True): self.load_modules() self.verbose(f"Setting up modules") hard_failed = [] soft_failed = [] setup_futures = dict() - for module_name, module in self.modules.items(): - future = self._internal_thread_pool.submit_task(module._setup) - setup_futures[future] = module_name - for future in self.helpers.as_completed(setup_futures): - module_name = setup_futures[future] - status, msg = future.result() + for task in asyncio.as_completed([m._setup() for m in self.modules.values()]): + module_name, status, msg = await task if status == True: self.debug(f"Setup succeeded for {module_name} ({msg})") elif status == False: @@ -332,34 +352,17 @@ def stop(self, wait=False): self.status = "ABORTING" self.hugewarning(f"Aborting scan") self.helpers.kill_children() - self.shutdown_threadpools() self.helpers.kill_children() - def shutdown_threadpools(self): - if not self._thread_pools_shutdown: - self._thread_pools_shutdown = True - - def shutdown_pool(pool, pool_name, **kwargs): - self.debug(f"Shutting down {pool_name} with kwargs={kwargs}") - pool.shutdown(**kwargs) - self.debug(f"Finished shutting down {pool_name} with kwargs={kwargs}") - - self.debug(f"Shutting down thread pools") - for pool_name, pool in self.pools.items(): - t = threading.Thread( - target=shutdown_pool, - args=(pool, pool_name), - kwargs={"wait": True, "cancel_futures": True}, - daemon=True, - ) - t.start() - self._thread_pools_shutdown_threads.append(t) + async def report(self): + for mod in self.modules.values(): + await self.manager.catch(mod._register_running, mod.report) - def cleanup(self): + async def cleanup(self): # clean up modules self.status = "CLEANING_UP" for mod in self.modules.values(): - mod._cleanup() + await mod._cleanup() if not self._cleanedup: self._cleanedup = True with suppress(Exception): @@ -393,6 +396,10 @@ def word_cloud(self): def stopping(self): return not self.running + @property + def stopped(self): + return self._status_code > 5 + @property def running(self): return 0 < self._status_code < 4 @@ -421,22 +428,6 @@ def status(self, status): else: self.debug(f'Attempt to set invalid status "{status}" on scan') - @property - def status_detailed(self): - event_threadpool_tasks = self._event_thread_pool.num_tasks - internal_tasks = self._internal_thread_pool.num_tasks - process_tasks = self.process_pool.num_tasks - total_tasks = event_threadpool_tasks + internal_tasks + process_tasks - status = { - "queued_tasks": { - "internal": internal_tasks, - "process": process_tasks, - "event": event_threadpool_tasks, - "total": total_tasks, - }, - } - return status - def make_event(self, *args, **kwargs): 
kwargs["scan"] = self event = make_event(*args, **kwargs) @@ -614,3 +605,8 @@ def _load_modules(self, modules): self.warning(f'Failed to load unknown module "{module_name}"') failed.add(module_name) return loaded_modules, failed + + async def _status_ticker(self, interval=15): + while not self.stopped: + await asyncio.sleep(interval) + await self.manager.modules_status(_log=True) diff --git a/bbot/test/test.conf b/bbot/test/test.conf index 52ee009ba6..597d313fc4 100644 --- a/bbot/test/test.conf +++ b/bbot/test/test.conf @@ -29,7 +29,7 @@ scope_search_distance: 0 scope_report_distance: 0 scope_dns_search_distance: 1 plumbus: asdf -dns_debug: false +dns_debug: true http_debug: false keep_scans: 1 agent_url: test diff --git a/bbot/test/test_step_2/test_helpers.py b/bbot/test/test_step_2/test_helpers.py index d10273d4ee..5ea38e8ff6 100644 --- a/bbot/test/test_step_2/test_helpers.py +++ b/bbot/test/test_step_2/test_helpers.py @@ -483,113 +483,11 @@ def plumbus_generator(): helpers.wordlist("/tmp/a9pseoysadf/asdkgjaosidf") test_file.unlink() - ### DNS ### - # resolution - assert all([helpers.is_ip(i) for i in helpers.resolve("scanme.nmap.org")]) - assert "dns.google" in helpers.resolve("8.8.8.8") - assert "dns.google" in helpers.resolve("2001:4860:4860::8888") - resolved_ips = helpers.resolve("dns.google") - assert "2001:4860:4860::8888" in resolved_ips - assert "8.8.8.8" in resolved_ips - assert any([helpers.is_subdomain(h) for h in helpers.resolve("google.com", type="mx")]) - v6_ips = helpers.resolve("www.google.com", type="AAAA") - assert all([i.version == 6 for i in [ipaddress.ip_address(_) for _ in v6_ips]]) - assert not helpers.resolve(f"{helpers.rand_string(length=30)}.com") - # batch resolution - batch_results = list(helpers.resolve_batch(["8.8.8.8", "dns.google"])) - assert len(batch_results) == 2 - batch_results = dict(batch_results) - assert any([x in batch_results["dns.google"] for x in ("8.8.8.8", "8.8.4.4")]) - assert "dns.google" in batch_results["8.8.8.8"] - # "any" type - resolved = helpers.resolve("google.com", type="any") - assert any([helpers.is_subdomain(h) for h in resolved]) - # dns cache - assert hash(f"8.8.8.8:PTR") not in helpers.dns._dns_cache - assert hash(f"scanme.nmap.org:A") not in helpers.dns._dns_cache - assert hash(f"scanme.nmap.org:AAAA") not in helpers.dns._dns_cache - helpers.resolve("8.8.8.8", cache_result=True) - assert hash(f"8.8.8.8:PTR") in helpers.dns._dns_cache - helpers.resolve("scanme.nmap.org", cache_result=True) - assert hash(f"scanme.nmap.org:A") in helpers.dns._dns_cache - assert hash(f"scanme.nmap.org:AAAA") in helpers.dns._dns_cache - # wildcards - wildcard_domains = helpers.is_wildcard_domain("asdf.github.io") - assert "github.io" in wildcard_domains - assert "A" in wildcard_domains["github.io"] - assert "SRV" not in wildcard_domains["github.io"] - assert wildcard_domains["github.io"]["A"] and all(helpers.is_ip(r) for r in wildcard_domains["github.io"]["A"]) - wildcard_rdtypes = helpers.is_wildcard("blacklanternsecurity.github.io") - assert "A" in wildcard_rdtypes - assert "SRV" not in wildcard_rdtypes - assert wildcard_rdtypes["A"] == (True, "github.io") - assert hash("github.io") in helpers.dns._wildcard_cache - assert len(helpers.dns._wildcard_cache[hash("github.io")]) > 0 - helpers.dns._wildcard_cache.clear() - wildcard_rdtypes = helpers.is_wildcard("asdf.asdf.asdf.github.io") - assert "A" in wildcard_rdtypes - assert "SRV" not in wildcard_rdtypes - assert wildcard_rdtypes["A"] == (True, "github.io") - assert hash("github.io") in 
helpers.dns._wildcard_cache - assert len(helpers.dns._wildcard_cache[hash("github.io")]) > 0 - wildcard_event1 = scan.make_event("wat.asdf.fdsa.github.io", "DNS_NAME", dummy=True) - wildcard_event2 = scan.make_event("wats.asd.fdsa.github.io", "DNS_NAME", dummy=True) - wildcard_event3 = scan.make_event("github.io", "DNS_NAME", dummy=True) - event_tags1, event_whitelisted1, event_blacklisted1, children1 = scan.helpers.resolve_event(wildcard_event1) - event_tags2, event_whitelisted2, event_blacklisted2, children2 = scan.helpers.resolve_event(wildcard_event2) - event_tags3, event_whitelisted3, event_blacklisted3, children3 = scan.helpers.resolve_event(wildcard_event3) - helpers.handle_wildcard_event(wildcard_event1, children1) - helpers.handle_wildcard_event(wildcard_event2, children2) - helpers.handle_wildcard_event(wildcard_event3, children3) - assert "wildcard" in wildcard_event1.tags - assert "a-wildcard" in wildcard_event1.tags - assert "srv-wildcard" not in wildcard_event1.tags - assert "wildcard" in wildcard_event2.tags - assert "a-wildcard" in wildcard_event2.tags - assert "srv-wildcard" not in wildcard_event2.tags - assert wildcard_event1.data == "_wildcard.github.io" - assert wildcard_event2.data == "_wildcard.github.io" - assert wildcard_event1.tags == wildcard_event2.tags - assert "wildcard-domain" in wildcard_event3.tags - assert "a-wildcard-domain" in wildcard_event3.tags - assert "srv-wildcard-domain" not in wildcard_event3.tags - # misc dns helpers + # misc DNS helpers assert helpers.is_ptr("wsc-11-22-33-44-wat.evilcorp.com") == True assert helpers.is_ptr("wsc-11-22-33-wat.evilcorp.com") == False assert helpers.is_ptr("11wat.evilcorp.com") == False - # Ensure events with hosts have resolved_hosts attribute populated - - resolved_hosts_event1 = scan.make_event("dns.google", "DNS_NAME", dummy=True) - resolved_hosts_event2 = scan.make_event("http://dns.google/", "URL_UNVERIFIED", dummy=True) - event_tags1, event_whitelisted1, event_blacklisted1, children1 = scan.helpers.resolve_event(resolved_hosts_event1) - event_tags2, event_whitelisted2, event_blacklisted2, children2 = scan.helpers.resolve_event(resolved_hosts_event2) - - assert "8.8.8.8" in [str(x) for x in children1["A"]] - assert "8.8.8.8" in [str(x) for x in children2["A"]] - assert set(children1.keys()) == set(children2.keys()) - - msg = "Ignore this error, it belongs here" - - def raise_e(): - raise Exception(msg) - - def raise_k(): - raise KeyboardInterrupt(msg) - - def raise_s(): - raise ScanCancelledError(msg) - - def raise_b(): - raise BrokenPipeError(msg) - - helpers.dns._catch_keyboardinterrupt(raise_e) - helpers.dns._catch_keyboardinterrupt(raise_k) - scan.manager.catch(raise_e, _on_finish_callback=raise_e) - scan.manager.catch(raise_k) - scan.manager.catch(raise_s) - scan.manager.catch(raise_b) - ## NTLM testheader = "TlRMTVNTUAACAAAAHgAeADgAAAAVgorilwL+bvnVipUAAAAAAAAAAJgAmABWAAAACgBjRQAAAA9XAEkATgAtAFMANAAyAE4ATwBCAEQAVgBUAEsAOAACAB4AVwBJAE4ALQBTADQAMgBOAE8AQgBEAFYAVABLADgAAQAeAFcASQBOAC0AUwA0ADIATgBPAEIARABWAFQASwA4AAQAHgBXAEkATgAtAFMANAAyAE4ATwBCAEQAVgBUAEsAOAADAB4AVwBJAE4ALQBTADQAMgBOAE8AQgBEAFYAVABLADgABwAIAHUwOZlfoNgBAAAAAA==" decoded = helpers.ntlm.ntlmdecode(testheader) diff --git a/bbot/test/test_step_2/test_manager.py b/bbot/test/test_step_2/test_manager.py index ec58276ec4..4a0bcff54a 100644 --- a/bbot/test/test_step_2/test_manager.py +++ b/bbot/test/test_step_2/test_manager.py @@ -87,6 +87,26 @@ class DummyModule3: assert len(event_children) == 0 assert googledns in output + # error catching + msg = 
"Ignore this error, it belongs here" + + def raise_e(): + raise Exception(msg) + + def raise_k(): + raise KeyboardInterrupt(msg) + + def raise_s(): + raise ScanCancelledError(msg) + + def raise_b(): + raise BrokenPipeError(msg) + + manager.catch(raise_e, _on_finish_callback=raise_e) + manager.catch(raise_k) + manager.catch(raise_s) + manager.catch(raise_b) + def test_scope_distance(bbot_scanner, bbot_config): # event filtering based on scope_distance diff --git a/poetry.lock b/poetry.lock index ec3eeedca2..d563198a5a 100644 --- a/poetry.lock +++ b/poetry.lock @@ -1057,6 +1057,25 @@ tomli = {version = ">=1.0.0", markers = "python_version < \"3.11\""} [package.extras] testing = ["argcomplete", "hypothesis (>=3.56)", "mock", "nose", "pygments (>=2.7.2)", "requests", "xmlschema"] +[[package]] +name = "pytest-asyncio" +version = "0.21.0" +description = "Pytest support for asyncio" +category = "dev" +optional = false +python-versions = ">=3.7" +files = [ + {file = "pytest-asyncio-0.21.0.tar.gz", hash = "sha256:2b38a496aef56f56b0e87557ec313e11e1ab9276fc3863f6a7be0f1d0e415e1b"}, + {file = "pytest_asyncio-0.21.0-py3-none-any.whl", hash = "sha256:f2b3366b7cd501a4056858bd39349d5af19742aed2d81660b7998b6341c7eb9c"}, +] + +[package.dependencies] +pytest = ">=7.0.0" + +[package.extras] +docs = ["sphinx (>=5.3)", "sphinx-rtd-theme (>=1.0)"] +testing = ["coverage (>=6.2)", "flaky (>=3.5.0)", "hypothesis (>=5.7.1)", "mypy (>=0.931)", "pytest-trio (>=0.7.0)"] + [[package]] name = "pytest-cov" version = "4.0.0" @@ -1491,4 +1510,4 @@ xmltodict = ">=0.12.0,<0.13.0" [metadata] lock-version = "2.0" python-versions = "^3.9" -content-hash = "5154e783b3e49545e75315e8ae36f21d279bd21b3e108ef4bdadd5f3c340f35a" +content-hash = "010faf1151a864dfd8f7d72f16be9457675f1359dcb30393ed2ca8db47b3887c" diff --git a/pyproject.toml b/pyproject.toml index 27b476decc..32b6df29b2 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -39,6 +39,7 @@ requests-mock = "^1.10.0" poetry-dynamic-versioning = "^0.21.4" pytest-httpserver = "^1.0.6" pytest-rerunfailures = "^11.1.2" +pytest-asyncio = "^0.21.0" [build-system] requires = ["poetry-core>=1.0.0", "poetry-dynamic-versioning"] From 0bf518a5ce03967bdf0228a6e349a1ee2f50c02c Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 5 May 2023 10:28:17 -0400 Subject: [PATCH 005/387] websocket --- bbot/modules/output/websocket.py | 68 ++++++++++++------------- bbot/scanner/manager.py | 3 ++ bbot/scanner/scanner.py | 8 +-- poetry.lock | 85 +++++++++++++++++++++++++++----- pyproject.toml | 2 +- 5 files changed, 117 insertions(+), 49 deletions(-) diff --git a/bbot/modules/output/websocket.py b/bbot/modules/output/websocket.py index 55b06f7adb..7e302d0b66 100644 --- a/bbot/modules/output/websocket.py +++ b/bbot/modules/output/websocket.py @@ -1,6 +1,6 @@ import json import threading -import websocket +import websockets from time import sleep from bbot.modules.output.base import BaseOutputModule @@ -16,43 +16,45 @@ async def setup(self): self.url = self.config.get("url", "") if not self.url: return False, "Must set URL" - kwargs = {} self.token = self.config.get("token", "") - if self.token: - kwargs.update({"header": {"Authorization": f"Bearer {self.token}"}}) - self.ws = websocket.WebSocketApp(self.url, **kwargs) - self.started = False + self._ws = None return True - def start_websocket(self): - if not self.started: - self.thread = threading.Thread(target=self._start_websocket, daemon=True) - self.thread.start() - self.started = True - - def _start_websocket(self): - not_keyboardinterrupt = False 
- while not self.scan.stopping: - not_keyboardinterrupt = self.ws.run_forever() - if not not_keyboardinterrupt: - break - sleep(1) - - def handle_event(self, event): - self.start_websocket() + async def handle_event(self, event): event_json = event.json() - self.send(event_json) - - def send(self, message): - while self.ws is not None: + await self.send(event_json) + + async def ws(self, rebuild=False): + if self._ws is None or rebuild: + kwargs = {"close_timeout": 0.5} + if self.token: + kwargs.update({"extra_headers": {"Authorization": f"Bearer {self.token}"}}) + verbs = ("Building", "Built") + if rebuild: + verbs = ("Rebuilding", "Rebuilt") + self.debug(f"{verbs[0]} websocket connection to {self.url}") + self._ws = await websockets.connect(self.url, **kwargs) + self.debug(f"{verbs[1]} websocket connection to {self.url}") + return self._ws + + async def send(self, message): + rebuild = False + while not self.scan.stopped: try: - self.ws.send(json.dumps(message)) + ws = await self.ws(rebuild=rebuild) + message = json.dumps(message) + self.debug(f"Sending message of length {len(message)}") + await ws.send(message) + rebuild = False break except Exception as e: self.warning(f"Error sending message: {e}, retrying") - sleep(1) - continue - - def cleanup(self): - self.ws.close() - self.ws = None + await asyncio.sleep(1) + rebuild = True + + async def cleanup(self): + if self._ws is not None: + self.debug(f"Closing connection to {self.url}") + await self._ws.close() + self.debug(f"Closed connection to {self.url}") + self._ws = None diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 32620faa0d..5a18cdac2f 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -281,6 +281,9 @@ async def _emit_event(self, event, *args, **kwargs): for child_event in dns_child_events: self.queue_event(child_event) + except KeyboardInterrupt: + self.scan.stop() + except ValidationError as e: log.warning(f"Event validation failed with args={args}, kwargs={kwargs}: {e}") log.trace(traceback.format_exc()) diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index 0b33903727..11df8d770d 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -279,6 +279,10 @@ async def start(self): self.critical(f"Unexpected error during scan:\n{traceback.format_exc()}") finally: + init_events_task.cancel() + with suppress(asyncio.CancelledError): + await init_events_task + await self.report() await self.cleanup() @@ -296,10 +300,6 @@ async def start(self): with suppress(asyncio.CancelledError): await ticker_task - init_events_task.cancel() - with suppress(asyncio.CancelledError): - await init_events_task - for t in manager_worker_loop_tasks: t.cancel() with suppress(asyncio.CancelledError): diff --git a/poetry.lock b/poetry.lock index d563198a5a..a032ccadeb 100644 --- a/poetry.lock +++ b/poetry.lock @@ -1435,22 +1435,85 @@ secure = ["certifi", "cryptography (>=1.3.4)", "idna (>=2.0.0)", "ipaddress", "p socks = ["PySocks (>=1.5.6,!=1.5.7,<2.0)"] [[package]] -name = "websocket-client" -version = "1.5.1" -description = "WebSocket client for Python with low level API options" +name = "websockets" +version = "11.0.2" +description = "An implementation of the WebSocket Protocol (RFC 6455 & 7692)" category = "main" optional = false python-versions = ">=3.7" files = [ - {file = "websocket-client-1.5.1.tar.gz", hash = "sha256:3f09e6d8230892547132177f575a4e3e73cfdf06526e20cc02aa1c3b47184d40"}, - {file = "websocket_client-1.5.1-py3-none-any.whl", hash = 
"sha256:cdf5877568b7e83aa7cf2244ab56a3213de587bbe0ce9d8b9600fc77b455d89e"}, + {file = "websockets-11.0.2-cp310-cp310-macosx_10_9_universal2.whl", hash = "sha256:580cc95c58118f8c39106be71e24d0b7e1ad11a155f40a2ee687f99b3e5e432e"}, + {file = "websockets-11.0.2-cp310-cp310-macosx_10_9_x86_64.whl", hash = "sha256:143782041e95b63083b02107f31cda999f392903ae331de1307441f3a4557d51"}, + {file = "websockets-11.0.2-cp310-cp310-macosx_11_0_arm64.whl", hash = "sha256:8df63dcd955eb6b2e371d95aacf8b7c535e482192cff1b6ce927d8f43fb4f552"}, + {file = "websockets-11.0.2-cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:ca9b2dced5cbbc5094678cc1ec62160f7b0fe4defd601cd28a36fde7ee71bbb5"}, + {file = "websockets-11.0.2-cp310-cp310-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:e0eeeea3b01c97fd3b5049a46c908823f68b59bf0e18d79b231d8d6764bc81ee"}, + {file = "websockets-11.0.2-cp310-cp310-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:502683c5dedfc94b9f0f6790efb26aa0591526e8403ad443dce922cd6c0ec83b"}, + {file = "websockets-11.0.2-cp310-cp310-musllinux_1_1_aarch64.whl", hash = "sha256:d3cc3e48b6c9f7df8c3798004b9c4b92abca09eeea5e1b0a39698f05b7a33b9d"}, + {file = "websockets-11.0.2-cp310-cp310-musllinux_1_1_i686.whl", hash = "sha256:808b8a33c961bbd6d33c55908f7c137569b09ea7dd024bce969969aa04ecf07c"}, + {file = "websockets-11.0.2-cp310-cp310-musllinux_1_1_x86_64.whl", hash = "sha256:34a6f8996964ccaa40da42ee36aa1572adcb1e213665e24aa2f1037da6080909"}, + {file = "websockets-11.0.2-cp310-cp310-win32.whl", hash = "sha256:8f24cd758cbe1607a91b720537685b64e4d39415649cac9177cd1257317cf30c"}, + {file = "websockets-11.0.2-cp310-cp310-win_amd64.whl", hash = "sha256:3b87cd302f08ea9e74fdc080470eddbed1e165113c1823fb3ee6328bc40ca1d3"}, + {file = "websockets-11.0.2-cp311-cp311-macosx_10_9_universal2.whl", hash = "sha256:3565a8f8c7bdde7c29ebe46146bd191290413ee6f8e94cf350609720c075b0a1"}, + {file = "websockets-11.0.2-cp311-cp311-macosx_10_9_x86_64.whl", hash = "sha256:f97e03d4d5a4f0dca739ea274be9092822f7430b77d25aa02da6775e490f6846"}, + {file = "websockets-11.0.2-cp311-cp311-macosx_11_0_arm64.whl", hash = "sha256:8f392587eb2767afa8a34e909f2fec779f90b630622adc95d8b5e26ea8823cb8"}, + {file = "websockets-11.0.2-cp311-cp311-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:7742cd4524622cc7aa71734b51294644492a961243c4fe67874971c4d3045982"}, + {file = "websockets-11.0.2-cp311-cp311-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:46dda4bc2030c335abe192b94e98686615f9274f6b56f32f2dd661fb303d9d12"}, + {file = "websockets-11.0.2-cp311-cp311-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d6b2bfa1d884c254b841b0ff79373b6b80779088df6704f034858e4d705a4802"}, + {file = "websockets-11.0.2-cp311-cp311-musllinux_1_1_aarch64.whl", hash = "sha256:1df2413266bf48430ef2a752c49b93086c6bf192d708e4a9920544c74cd2baa6"}, + {file = "websockets-11.0.2-cp311-cp311-musllinux_1_1_i686.whl", hash = "sha256:cf45d273202b0c1cec0f03a7972c655b93611f2e996669667414557230a87b88"}, + {file = "websockets-11.0.2-cp311-cp311-musllinux_1_1_x86_64.whl", hash = "sha256:3a09cce3dacb6ad638fdfa3154d9e54a98efe7c8f68f000e55ca9c716496ca67"}, + {file = "websockets-11.0.2-cp311-cp311-win32.whl", hash = "sha256:2174a75d579d811279855df5824676d851a69f52852edb0e7551e0eeac6f59a4"}, + {file = "websockets-11.0.2-cp311-cp311-win_amd64.whl", hash = 
"sha256:c78ca3037a954a4209b9f900e0eabbc471fb4ebe96914016281df2c974a93e3e"}, + {file = "websockets-11.0.2-cp37-cp37m-macosx_10_9_x86_64.whl", hash = "sha256:3a2100b02d1aaf66dc48ff1b2a72f34f6ebc575a02bc0350cc8e9fbb35940166"}, + {file = "websockets-11.0.2-cp37-cp37m-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:dca9708eea9f9ed300394d4775beb2667288e998eb6f542cdb6c02027430c599"}, + {file = "websockets-11.0.2-cp37-cp37m-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:320ddceefd2364d4afe6576195201a3632a6f2e6d207b0c01333e965b22dbc84"}, + {file = "websockets-11.0.2-cp37-cp37m-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:b2a573c8d71b7af937852b61e7ccb37151d719974146b5dc734aad350ef55a02"}, + {file = "websockets-11.0.2-cp37-cp37m-musllinux_1_1_aarch64.whl", hash = "sha256:13bd5bebcd16a4b5e403061b8b9dcc5c77e7a71e3c57e072d8dff23e33f70fba"}, + {file = "websockets-11.0.2-cp37-cp37m-musllinux_1_1_i686.whl", hash = "sha256:95c09427c1c57206fe04277bf871b396476d5a8857fa1b99703283ee497c7a5d"}, + {file = "websockets-11.0.2-cp37-cp37m-musllinux_1_1_x86_64.whl", hash = "sha256:2eb042734e710d39e9bc58deab23a65bd2750e161436101488f8af92f183c239"}, + {file = "websockets-11.0.2-cp37-cp37m-win32.whl", hash = "sha256:5875f623a10b9ba154cb61967f940ab469039f0b5e61c80dd153a65f024d9fb7"}, + {file = "websockets-11.0.2-cp37-cp37m-win_amd64.whl", hash = "sha256:634239bc844131863762865b75211a913c536817c0da27f691400d49d256df1d"}, + {file = "websockets-11.0.2-cp38-cp38-macosx_10_9_universal2.whl", hash = "sha256:3178d965ec204773ab67985a09f5696ca6c3869afeed0bb51703ea404a24e975"}, + {file = "websockets-11.0.2-cp38-cp38-macosx_10_9_x86_64.whl", hash = "sha256:955fcdb304833df2e172ce2492b7b47b4aab5dcc035a10e093d911a1916f2c87"}, + {file = "websockets-11.0.2-cp38-cp38-macosx_11_0_arm64.whl", hash = "sha256:cb46d2c7631b2e6f10f7c8bac7854f7c5e5288f024f1c137d4633c79ead1e3c0"}, + {file = "websockets-11.0.2-cp38-cp38-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:25aae96c1060e85836552a113495db6d857400288161299d77b7b20f2ac569f2"}, + {file = "websockets-11.0.2-cp38-cp38-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:2abeeae63154b7f63d9f764685b2d299e9141171b8b896688bd8baec6b3e2303"}, + {file = "websockets-11.0.2-cp38-cp38-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:daa1e8ea47507555ed7a34f8b49398d33dff5b8548eae3de1dc0ef0607273a33"}, + {file = "websockets-11.0.2-cp38-cp38-musllinux_1_1_aarch64.whl", hash = "sha256:954eb789c960fa5daaed3cfe336abc066941a5d456ff6be8f0e03dd89886bb4c"}, + {file = "websockets-11.0.2-cp38-cp38-musllinux_1_1_i686.whl", hash = "sha256:3ffe251a31f37e65b9b9aca5d2d67fd091c234e530f13d9dce4a67959d5a3fba"}, + {file = "websockets-11.0.2-cp38-cp38-musllinux_1_1_x86_64.whl", hash = "sha256:adf6385f677ed2e0b021845b36f55c43f171dab3a9ee0ace94da67302f1bc364"}, + {file = "websockets-11.0.2-cp38-cp38-win32.whl", hash = "sha256:aa7b33c1fb2f7b7b9820f93a5d61ffd47f5a91711bc5fa4583bbe0c0601ec0b2"}, + {file = "websockets-11.0.2-cp38-cp38-win_amd64.whl", hash = "sha256:220d5b93764dd70d7617f1663da64256df7e7ea31fc66bc52c0e3750ee134ae3"}, + {file = "websockets-11.0.2-cp39-cp39-macosx_10_9_universal2.whl", hash = "sha256:0fb4480556825e4e6bf2eebdbeb130d9474c62705100c90e59f2f56459ddab42"}, + {file = "websockets-11.0.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = 
"sha256:ec00401846569aaf018700249996143f567d50050c5b7b650148989f956547af"}, + {file = "websockets-11.0.2-cp39-cp39-macosx_11_0_arm64.whl", hash = "sha256:87c69f50281126dcdaccd64d951fb57fbce272578d24efc59bce72cf264725d0"}, + {file = "websockets-11.0.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:232b6ba974f5d09b1b747ac232f3a3d8f86de401d7b565e837cc86988edf37ac"}, + {file = "websockets-11.0.2-cp39-cp39-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:392d409178db1e46d1055e51cc850136d302434e12d412a555e5291ab810f622"}, + {file = "websockets-11.0.2-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:a4fe2442091ff71dee0769a10449420fd5d3b606c590f78dd2b97d94b7455640"}, + {file = "websockets-11.0.2-cp39-cp39-musllinux_1_1_aarch64.whl", hash = "sha256:ede13a6998ba2568b21825809d96e69a38dc43184bdeebbde3699c8baa21d015"}, + {file = "websockets-11.0.2-cp39-cp39-musllinux_1_1_i686.whl", hash = "sha256:4c54086b2d2aec3c3cb887ad97e9c02c6be9f1d48381c7419a4aa932d31661e4"}, + {file = "websockets-11.0.2-cp39-cp39-musllinux_1_1_x86_64.whl", hash = "sha256:e37a76ccd483a6457580077d43bc3dfe1fd784ecb2151fcb9d1c73f424deaeba"}, + {file = "websockets-11.0.2-cp39-cp39-win32.whl", hash = "sha256:d1881518b488a920434a271a6e8a5c9481a67c4f6352ebbdd249b789c0467ddc"}, + {file = "websockets-11.0.2-cp39-cp39-win_amd64.whl", hash = "sha256:25e265686ea385f22a00cc2b719b880797cd1bb53b46dbde969e554fb458bfde"}, + {file = "websockets-11.0.2-pp37-pypy37_pp73-macosx_10_9_x86_64.whl", hash = "sha256:ce69f5c742eefd039dce8622e99d811ef2135b69d10f9aa79fbf2fdcc1e56cd7"}, + {file = "websockets-11.0.2-pp37-pypy37_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:b985ba2b9e972cf99ddffc07df1a314b893095f62c75bc7c5354a9c4647c6503"}, + {file = "websockets-11.0.2-pp37-pypy37_pp73-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:1b52def56d2a26e0e9c464f90cadb7e628e04f67b0ff3a76a4d9a18dfc35e3dd"}, + {file = "websockets-11.0.2-pp37-pypy37_pp73-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:d70a438ef2a22a581d65ad7648e949d4ccd20e3c8ed7a90bbc46df4e60320891"}, + {file = "websockets-11.0.2-pp37-pypy37_pp73-win_amd64.whl", hash = "sha256:752fbf420c71416fb1472fec1b4cb8631c1aa2be7149e0a5ba7e5771d75d2bb9"}, + {file = "websockets-11.0.2-pp38-pypy38_pp73-macosx_10_9_x86_64.whl", hash = "sha256:dd906b0cdc417ea7a5f13bb3c6ca3b5fd563338dc596996cb0fdd7872d691c0a"}, + {file = "websockets-11.0.2-pp38-pypy38_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:3e79065ff6549dd3c765e7916067e12a9c91df2affea0ac51bcd302aaf7ad207"}, + {file = "websockets-11.0.2-pp38-pypy38_pp73-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:46388a050d9e40316e58a3f0838c63caacb72f94129eb621a659a6e49bad27ce"}, + {file = "websockets-11.0.2-pp38-pypy38_pp73-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:5c7de298371d913824f71b30f7685bb07ad13969c79679cca5b1f7f94fec012f"}, + {file = "websockets-11.0.2-pp38-pypy38_pp73-win_amd64.whl", hash = "sha256:6d872c972c87c393e6a49c1afbdc596432df8c06d0ff7cd05aa18e885e7cfb7c"}, + {file = "websockets-11.0.2-pp39-pypy39_pp73-macosx_10_9_x86_64.whl", hash = "sha256:b444366b605d2885f0034dd889faf91b4b47668dd125591e2c64bfde611ac7e1"}, + {file = 
"websockets-11.0.2-pp39-pypy39_pp73-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:e8b967a4849db6b567dec3f7dd5d97b15ce653e3497b8ce0814e470d5e074750"}, + {file = "websockets-11.0.2-pp39-pypy39_pp73-manylinux_2_5_i686.manylinux1_i686.manylinux_2_17_i686.manylinux2014_i686.whl", hash = "sha256:2acdc82099999e44fa7bd8c886f03c70a22b1d53ae74252f389be30d64fd6004"}, + {file = "websockets-11.0.2-pp39-pypy39_pp73-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:518ed6782d9916c5721ebd61bb7651d244178b74399028302c8617d0620af291"}, + {file = "websockets-11.0.2-pp39-pypy39_pp73-win_amd64.whl", hash = "sha256:58477b041099bb504e1a5ddd8aa86302ed1d5c6995bdd3db2b3084ef0135d277"}, + {file = "websockets-11.0.2-py3-none-any.whl", hash = "sha256:5004c087d17251938a52cce21b3dbdabeecbbe432ce3f5bbbf15d8692c36eac9"}, + {file = "websockets-11.0.2.tar.gz", hash = "sha256:b1a69701eb98ed83dd099de4a686dc892c413d974fa31602bc00aca7cb988ac9"}, ] -[package.extras] -docs = ["Sphinx (>=3.4)", "sphinx-rtd-theme (>=0.5)"] -optional = ["python-socks", "wsaccel"] -test = ["websockets"] - [[package]] name = "werkzeug" version = "2.2.3" @@ -1510,4 +1573,4 @@ xmltodict = ">=0.12.0,<0.13.0" [metadata] lock-version = "2.0" python-versions = "^3.9" -content-hash = "010faf1151a864dfd8f7d72f16be9457675f1359dcb30393ed2ca8db47b3887c" +content-hash = "eee5683fb3dcc73b282ac84c49503087af4b618d1c03d9919fb099e0c2395fb0" diff --git a/pyproject.toml b/pyproject.toml index 32b6df29b2..846c307e13 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -26,9 +26,9 @@ xmltojson = "^2.0.2" pycryptodome = "^3.17" idna = "^3.4" ansible = "^7.3.0" -websocket-client = "^1.5.1" tabulate = "0.8.10" cloudcheck = "^2.0.0.34" +websockets = "^11.0.2" [tool.poetry.group.dev.dependencies] pytest = "^7.2.2" From 8c630c7de4a046318f24440a5134babb11b8c845 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 5 May 2023 17:09:23 -0400 Subject: [PATCH 006/387] working http helpers + interactsh --- bbot/cli.py | 5 +- bbot/core/configurator/args.py | 40 ++++--- bbot/core/helpers/dns.py | 56 +++++----- bbot/core/helpers/helper.py | 10 +- bbot/core/helpers/interactsh.py | 46 ++++---- bbot/core/helpers/misc.py | 7 ++ bbot/core/helpers/web.py | 146 +++++++++++++++++++++++++ bbot/modules/base.py | 2 +- bbot/modules/output/asset_inventory.py | 4 +- bbot/modules/output/websocket.py | 3 +- bbot/scanner/manager.py | 16 +-- bbot/scanner/scanner.py | 5 +- bbot/test/test.conf | 1 + bbot/test/test_step_2/test_dns.py | 121 ++++++++++++++++++++ bbot/test/test_step_2/test_http.py | 74 +++++++++++++ poetry.lock | 134 ++++++++++++++++++++++- pyproject.toml | 1 + 17 files changed, 582 insertions(+), 89 deletions(-) create mode 100644 bbot/test/test_step_2/test_dns.py create mode 100644 bbot/test/test_step_2/test_http.py diff --git a/bbot/cli.py b/bbot/cli.py index 55ee624f3d..c1c637839f 100755 --- a/bbot/cli.py +++ b/bbot/cli.py @@ -32,11 +32,12 @@ from . 
import config +err = False scan_name = "" async def _main(): - err = False + global err global scan_name ensure_config_files() @@ -336,7 +337,7 @@ def main(): if scan_name: msg = f"You killed {scan_name}" log_to_stderr(msg, level="ERROR") - err = True + os._exit(1) if __name__ == "__main__": diff --git a/bbot/core/configurator/args.py b/bbot/core/configurator/args.py index 4f9bd7202f..0cb2f1519f 100644 --- a/bbot/core/configurator/args.py +++ b/bbot/core/configurator/args.py @@ -104,8 +104,8 @@ def error(self, message): action="store_true", help="Don't consider subdomains of target/whitelist to be in-scope", ) - p.add_argument("-n", "--name", help="Name of scan (default: random)", metavar="SCAN_NAME") - p.add_argument( + modules = p.add_argument_group(title="Modules") + modules.add_argument( "-m", "--modules", nargs="+", @@ -113,9 +113,11 @@ def error(self, message): help=f'Modules to enable. Choices: {",".join(module_choices)}', metavar="MODULE", ) - p.add_argument("-l", "--list-modules", action="store_true", help=f"List available modules.") - p.add_argument("-em", "--exclude-modules", nargs="+", default=[], help=f"Exclude these modules.", metavar="MODULE") - p.add_argument( + modules.add_argument("-l", "--list-modules", action="store_true", help=f"List available modules.") + modules.add_argument( + "-em", "--exclude-modules", nargs="+", default=[], help=f"Exclude these modules.", metavar="MODULE" + ) + modules.add_argument( "-f", "--flags", nargs="+", @@ -123,7 +125,7 @@ def error(self, message): help=f'Enable modules by flag. Choices: {",".join(sorted(flag_choices))}', metavar="FLAG", ) - p.add_argument( + modules.add_argument( "-rf", "--require-flags", nargs="+", @@ -131,7 +133,7 @@ def error(self, message): help=f"Only enable modules with these flags (e.g. -rf passive)", metavar="FLAG", ) - p.add_argument( + modules.add_argument( "-ef", "--exclude-flags", nargs="+", @@ -139,7 +141,7 @@ def error(self, message): help=f"Disable modules with these flags. (e.g. -ef aggressive)", metavar="FLAG", ) - p.add_argument( + modules.add_argument( "-om", "--output-modules", nargs="+", @@ -147,26 +149,28 @@ def error(self, message): help=f'Output module(s). 
Choices: {",".join(output_module_choices)}', metavar="MODULE", ) - p.add_argument( + modules.add_argument("--allow-deadly", action="store_true", help="Enable the use of highly aggressive modules") + scan = p.add_argument_group(title="Scan") + scan.add_argument("-n", "--name", help="Name of scan (default: random)", metavar="SCAN_NAME") + scan.add_argument( "-o", "--output-dir", metavar="DIR", ) - p.add_argument( + scan.add_argument( "-c", "--config", nargs="*", help="custom config file, or configuration options in key=value format: 'modules.shodan.api_key=1234'", metavar="CONFIG", ) - p.add_argument("--allow-deadly", action="store_true", help="Enable the use of highly aggressive modules") - p.add_argument("-v", "--verbose", action="store_true", help="Be more verbose") - p.add_argument("-d", "--debug", action="store_true", help="Enable debugging") - p.add_argument("-s", "--silent", action="store_true", help="Be quiet") - p.add_argument("--force", action="store_true", help="Run scan even if module setups fail") - p.add_argument("-y", "--yes", action="store_true", help="Skip scan confirmation prompt") - p.add_argument("--dry-run", action="store_true", help=f"Abort before executing scan") - p.add_argument( + scan.add_argument("-v", "--verbose", action="store_true", help="Be more verbose") + scan.add_argument("-d", "--debug", action="store_true", help="Enable debugging") + scan.add_argument("-s", "--silent", action="store_true", help="Be quiet") + scan.add_argument("--force", action="store_true", help="Run scan even if module setups fail") + scan.add_argument("-y", "--yes", action="store_true", help="Skip scan confirmation prompt") + scan.add_argument("--dry-run", action="store_true", help=f"Abort before executing scan") + scan.add_argument( "--current-config", action="store_true", help="Show current config in YAML format", diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 1089206a61..56e24262fd 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -1,4 +1,3 @@ -import json import asyncio import logging import ipaddress @@ -84,32 +83,33 @@ async def resolve_raw(self, query, **kwargs): # DNS over TCP is more reliable # But setting this breaks DNS resolution on Ubuntu because systemd-resolve doesn't support TCP # kwargs["tcp"] = True - query = str(query).strip() - if is_ip(query): - kwargs.pop("type", None) - kwargs.pop("rdtype", None) - results, errors = await self._resolve_ip(query, **kwargs) - return [("PTR", results)], [("PTR", e) for e in errors] - else: + with suppress(asyncio.CancelledError): results = [] errors = [] - types = ["A", "AAAA"] - kwargs.pop("rdtype", None) - if "type" in kwargs: - t = kwargs.pop("type") - if isinstance(t, str): - if t.strip().lower() in ("any", "all", "*"): - types = self.all_rdtypes - else: - types = [t.strip().upper()] - elif any([isinstance(t, x) for x in (list, tuple)]): - types = [str(_).strip().upper() for _ in t] - for t in types: - r, e = await self._resolve_hostname(query, rdtype=t, **kwargs) - if r: - results.append((t, r)) - for error in e: - errors.append((t, error)) + query = str(query).strip() + if is_ip(query): + kwargs.pop("type", None) + kwargs.pop("rdtype", None) + results, errors = await self._resolve_ip(query, **kwargs) + return [("PTR", results)], [("PTR", e) for e in errors] + else: + types = ["A", "AAAA"] + kwargs.pop("rdtype", None) + if "type" in kwargs: + t = kwargs.pop("type") + if isinstance(t, str): + if t.strip().lower() in ("any", "all", "*"): + types = self.all_rdtypes + else: + types = 
[t.strip().upper()] + elif any([isinstance(t, x) for x in (list, tuple)]): + types = [str(_).strip().upper() for _ in t] + for t in types: + r, e = await self._resolve_hostname(query, rdtype=t, **kwargs) + if r: + results.append((t, r)) + for error in e: + errors.append((t, error)) return (results, errors) @@ -277,7 +277,7 @@ async def resolve_event(self, event, minimal=False): types = ("A", "AAAA") if types: - tasks = [self.resolve_raw(event_host, type=t, cache_result=True) for t in types] + tasks = [asyncio.create_task(self.resolve_raw(event_host, type=t, cache_result=True)) for t in types] for task in asyncio.as_completed(tasks): resolved_raw, errors = await task for rdtype, e in errors: @@ -454,7 +454,9 @@ async def is_wildcard(self, query, ips=None, rdtype=None): # then resolve the query for all rdtypes for _rdtype in self.all_rdtypes: # resolve the base query - wildcard_tasks[_rdtype].append(self.resolve_raw(query, type=_rdtype, cache_result=True)) + wildcard_tasks[_rdtype].append( + asyncio.create_task(self.resolve_raw(query, type=_rdtype, cache_result=True)) + ) for _rdtype, tasks in wildcard_tasks.items(): for task in asyncio.as_completed(tasks): diff --git a/bbot/core/helpers/helper.py b/bbot/core/helpers/helper.py index db6f1b74a8..f7c345e544 100644 --- a/bbot/core/helpers/helper.py +++ b/bbot/core/helpers/helper.py @@ -5,6 +5,7 @@ from . import misc from .dns import DNSHelper +from .web import WebHelper from .diff import HttpCompare from .wordcloud import WordCloud from .cloud import CloudProviders @@ -45,6 +46,7 @@ def __init__(self, config, scan=None): self._future_lock = Lock() self.dns = DNSHelper(self) + self.web = WebHelper(self) self.depsinstaller = DepsInstaller(self) self.word_cloud = WordCloud(self) self.dummy_modules = {} @@ -114,8 +116,12 @@ def __getattribute__(self, attr): # then try dns return getattr(self.dns, attr) except AttributeError: - # then die - raise AttributeError(f'Helper has no attribute "{attr}"') + try: + # then try web + return getattr(self.web, attr) + except AttributeError: + # then die + raise AttributeError(f'Helper has no attribute "{attr}"') class DummyModule(BaseModule): diff --git a/bbot/core/helpers/interactsh.py b/bbot/core/helpers/interactsh.py index 42b456c6ee..b79c4cb6a3 100644 --- a/bbot/core/helpers/interactsh.py +++ b/bbot/core/helpers/interactsh.py @@ -2,11 +2,10 @@ import json import base64 import random +import asyncio import logging import traceback -from time import sleep from uuid import uuid4 -from threading import Thread from Crypto.Hash import SHA256 from Crypto.PublicKey import RSA @@ -26,9 +25,9 @@ def __init__(self, parent_helper): self.correlation_id = None self.custom_server = self.parent_helper.config.get("interactsh_server", None) self.token = self.parent_helper.config.get("interactsh_token", None) - self._thread = None + self._poll_task = None - def register(self, callback=None): + async def register(self, callback=None): rsa = RSA.generate(1024) self.public_key = rsa.publickey().exportKey() @@ -57,7 +56,9 @@ def register(self, callback=None): "secret-key": self.secret, "correlation-id": self.correlation_id, } - r = self.parent_helper.request(f"https://{server}/register", headers=headers, json=data, method="POST") + r = await self.parent_helper.request_async( + f"https://{server}/register", headers=headers, json=data, method="POST" + ) if r is None: continue try: @@ -78,12 +79,11 @@ def register(self, callback=None): ) if callable(callback): - self._thread = Thread(target=self.poll_loop, args=(callback,), 
daemon=True) - self._thread.start() + self._poll_task = asyncio.create_task(self.poll_loop(callback)) return self.domain - def deregister(self): + async def deregister(self): if not self.server or not self.correlation_id or not self.secret: raise InteractshError(f"Missing required information to deregister") @@ -93,11 +93,17 @@ def deregister(self): data = {"secret-key": self.secret, "correlation-id": self.correlation_id} - r = self.parent_helper.request(f"https://{self.server}/deregister", headers=headers, json=data, method="POST") + r = await self.parent_helper.request_async( + f"https://{self.server}/deregister", headers=headers, json=data, method="POST" + ) + + if self._poll_task is not None: + self._poll_task.cancel() + if "success" not in getattr(r, "text", ""): raise InteractshError(f"Failed to de-register with interactsh server {self.server}") - def poll(self): + async def poll(self): if not self.server or not self.correlation_id or not self.secret: raise InteractshError(f"Missing required information to poll") @@ -105,38 +111,40 @@ def poll(self): if self.token: headers["Authorization"] = self.token - r = self.parent_helper.request( + r = await self.parent_helper.request_async( f"https://{self.server}/poll?id={self.correlation_id}&secret={self.secret}", headers=headers ) + ret = [] data_list = r.json().get("data", None) if data_list: aes_key = r.json()["aes_key"] for data in data_list: decrypted_data = self.decrypt(aes_key, data) - yield decrypted_data + ret.append(decrypted_data) + return ret - def poll_loop(self, callback): - return self.parent_helper.scan.manager.catch(self._poll_loop, callback, _force=True) + async def poll_loop(self, callback): + return await self.parent_helper.scan.manager.catch(self._poll_loop, callback, _force=True) - def _poll_loop(self, callback): + async def _poll_loop(self, callback): while 1: if self.parent_helper.scan.stopping: - sleep(1) + await asyncio.sleep(1) continue data_list = [] try: - data_list = list(self.poll()) + data_list = await self.poll() except InteractshError as e: log.warning(e) log.trace(traceback.format_exc()) if not data_list: - sleep(10) + await asyncio.sleep(10) continue for data in data_list: if data: - callback(data) + await self.parent_helper.execute_sync_or_async(callback, data) def decrypt(self, aes_key, data): private_key = RSA.importKey(self.private_key) diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index e65766843a..8395d285a0 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -1024,3 +1024,10 @@ def cloudcheck(ip): def is_async_function(f): return inspect.iscoroutinefunction(f) + + +async def execute_sync_or_async(callback, *args, **kwargs): + if is_async_function(callback): + return await callback(*args, **kwargs) + else: + return callback(*args, **kwargs) diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index d59acb0266..60d7b88cdd 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -1,3 +1,4 @@ +import httpx import logging import requests from time import sleep @@ -169,6 +170,151 @@ def request(self, *args, **kwargs): raise e + +class BBOTAsyncClient(httpx.AsyncClient): + def __init__(self, *args, **kwargs): + self._bbot_scan = kwargs.pop("_bbot_scan") + + # timeout + http_timeout = self._bbot_scan.config.get("http_timeout", 20) + if not "timeout" in kwargs: + kwargs["timeout"] = http_timeout + + # headers + headers = kwargs.get("headers", None) + if headers is None: + headers = {} + user_agent = self._bbot_scan.config.get("user_agent", "BBOT")
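+        # NOTE: the config values above act only as fallbacks; a timeout or
+        # User-Agent passed explicitly by the caller is never overwritten.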
+ if "User-Agent" not in headers: + headers["User-Agent"] = user_agent + kwargs["headers"] = headers + + super().__init__(*args, **kwargs) + + def build_request(self, *args, **kwargs): + request = super().build_request(*args, **kwargs) + # add custom headers if the URL is in-scope + if self._bbot_scan.in_scope(str(request.url)): + for hk, hv in self._bbot_scan.config.get("http_headers", {}).items(): + # don't clobber headers + if hk not in request.headers: + request.headers[hk] = hv + return request + + +class WebHelper: + """ + For making HTTP requests + """ + + client_options = ("auth", "params", "headers", "cookies", "timeout", "follow_redirects", "max_redirects") + + def __init__(self, parent_helper): + self.parent_helper = parent_helper + + def AsyncClient(self, *args, **kwargs): + kwargs["_bbot_scan"] = self.parent_helper.scan + retries = kwargs.pop("retries", self.parent_helper.config.get("http_retries", 1)) + kwargs["transport"] = httpx.AsyncHTTPTransport(retries=retries) + return BBOTAsyncClient(*args, **kwargs) + + async def request_async(self, *args, **kwargs): + raise_error = kwargs.pop("raise_error", False) + + # in case of URL only, assume GET request + if len(args) == 1: + kwargs["url"] = args[0] + args = [] + + if not args and "method" not in kwargs: + kwargs["method"] = "GET" + + http_debug = self.parent_helper.config.get("http_debug", False) + + client_kwargs = {} + for k in list(kwargs): + if k in self.client_options: + v = kwargs.pop(k) + client_kwargs[k] = v + async with self.AsyncClient(**client_kwargs) as client: + try: + if http_debug: + logstr = f"Web request: {str(args)}, {str(kwargs)}" + log.debug(logstr) + response = await client.request(*args, **kwargs) + if http_debug: + log.debug( + f"Web response: {response} (Length: {len(response.content)}) headers: {response.headers}" + ) + return response + except httpx.RequestError as e: + log.debug(f"Error with request: {e}") + if raise_error: + raise + + async def download_async(self, url, **kwargs): + """ + Downloads file, returns full path of filename + If download failed, returns None + + Caching supported via "cache_hrs" + """ + success = False + filename = self.parent_helper.cache_filename(url) + cache_hrs = float(kwargs.pop("cache_hrs", -1)) + log.debug(f"Downloading file from {url} with cache_hrs={cache_hrs}") + if cache_hrs > 0 and self.parent_helper.is_cached(url): + log.debug(f"{url} is cached") + success = True + else: + # kwargs["raise_error"] = True + # kwargs["stream"] = True + if not "method" in kwargs: + kwargs["method"] = "GET" + try: + async with self.AsyncClient().stream(url=url, **kwargs) as response: + status_code = getattr(response, "status_code", 0) + log.debug(f"Download result: HTTP {status_code}") + if status_code != 0: + response.raise_for_status() + with open(filename, "wb") as f: + async for chunk in response.aiter_bytes(chunk_size=8192): + f.write(chunk) + success = True + except httpx.HTTPError as e: + log.warning(f"Failed to download {url}: {e}") + return + + if success: + return filename.resolve() + + async def wordlist_async(self, path, lines=None, **kwargs): + if not path: + raise WordlistError(f"Invalid wordlist: {path}") + if not "cache_hrs" in kwargs: + kwargs["cache_hrs"] = 720 + if self.parent_helper.is_url(path): + filename = await self.download_async(str(path), **kwargs) + if filename is None: + raise WordlistError(f"Unable to retrieve wordlist from {path}") + else: + filename = Path(path).resolve() + if not filename.is_file(): + raise WordlistError(f"Unable to find wordlist at 
{path}") + + if lines is None: + return filename + else: + lines = int(lines) + with open(filename) as f: + read_lines = f.readlines() + cache_key = f"{filename}:{lines}" + truncated_filename = self.parent_helper.cache_filename(cache_key) + with open(truncated_filename, "w") as f: + for line in read_lines[:lines]: + f.write(line) + return truncated_filename + + def api_page_iter(self, url, page_size=100, json=True, **requests_kwargs): page = 1 offset = 0 diff --git a/bbot/modules/base.py b/bbot/modules/base.py index 888a56f9a7..e4c23e9d90 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -1,7 +1,7 @@ import queue import asyncio import logging -import threading +import traceback from sys import exc_info from contextlib import suppress diff --git a/bbot/modules/output/asset_inventory.py b/bbot/modules/output/asset_inventory.py index f904728556..5ffb3d86ae 100644 --- a/bbot/modules/output/asset_inventory.py +++ b/bbot/modules/output/asset_inventory.py @@ -55,14 +55,14 @@ def filter_event(self, event): return False, "event is unresolved" return True, "" - def handle_event(self, event): + async def handle_event(self, event): if self.filter_event(event)[0]: hostkey = _make_hostkey(event.host, event.resolved_hosts) if hostkey not in self.assets: self.assets[hostkey] = Asset(event.host) self.assets[hostkey].absorb_event(event) - def report(self): + async def report(self): stats = dict() totals = dict() diff --git a/bbot/modules/output/websocket.py b/bbot/modules/output/websocket.py index 7e302d0b66..9c78e42d10 100644 --- a/bbot/modules/output/websocket.py +++ b/bbot/modules/output/websocket.py @@ -1,7 +1,6 @@ import json -import threading +import asyncio import websockets -from time import sleep from bbot.modules.output.base import BaseOutputModule diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 5a18cdac2f..e2bf595064 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -2,9 +2,7 @@ import asyncio import logging import traceback -from time import sleep from contextlib import suppress -from datetime import datetime, timedelta from ..core.helpers.queueing import EventQueue from ..core.helpers.async_helpers import TaskCounter @@ -30,8 +28,6 @@ def __init__(self, scan): self._task_counter = TaskCounter() self._new_activity = True - self.last_log_time = datetime.now() - async def init_events(self): """ seed scanner with target events @@ -341,10 +337,7 @@ async def catch(self, callback, *args, **kwargs): break try: if not self.scan.stopping or force: - if self.scan.helpers.is_async_function(callback): - ret = await callback(*args, **kwargs) - else: - ret = callback(*args, **kwargs) + ret = await self.scan.helpers.execute_sync_or_async(callback, *args, **kwargs) except ScanCancelledError as e: log.debug(f"ScanCancelledError in {fn.__qualname__}(): {e}") except BrokenPipeError as e: @@ -355,12 +348,11 @@ async def catch(self, callback, *args, **kwargs): except KeyboardInterrupt: log.debug(f"Interrupted") self.scan.stop() + except asyncio.CancelledError as e: + log.debug(f"{e}") if callable(on_finish_callback): try: - if self.scan.helpers.is_async_function(on_finish_callback): - await on_finish_callback() - else: - on_finish_callback() + await self.scan.helpers.execute_sync_or_async(on_finish_callback) except Exception as e: log.error( f"Error in on_finish_callback {on_finish_callback.__qualname__}() after {fn.__qualname__}(): {e}" diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index 11df8d770d..465d2f7a4a 100644 --- 
a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -1,13 +1,13 @@ +import queue import asyncio import logging import traceback from sys import exc_info from pathlib import Path -import concurrent.futures from datetime import datetime from omegaconf import OmegaConf from contextlib import suppress -from collections import OrderedDict, deque +from collections import OrderedDict from bbot import config as bbot_config @@ -321,7 +321,6 @@ async def setup_modules(self, remove_failed=True): self.verbose(f"Setting up modules") hard_failed = [] soft_failed = [] - setup_futures = dict() for task in asyncio.as_completed([m._setup() for m in self.modules.values()]): module_name, status, msg = await task diff --git a/bbot/test/test.conf b/bbot/test/test.conf index 597d313fc4..5e534f5067 100644 --- a/bbot/test/test.conf +++ b/bbot/test/test.conf @@ -30,6 +30,7 @@ scope_report_distance: 0 scope_dns_search_distance: 1 plumbus: asdf dns_debug: true +user_agent: "BBOT Test User-Agent" http_debug: false keep_scans: 1 agent_url: test diff --git a/bbot/test/test_step_2/test_dns.py b/bbot/test/test_step_2/test_dns.py new file mode 100644 index 0000000000..ab1bcecc18 --- /dev/null +++ b/bbot/test/test_step_2/test_dns.py @@ -0,0 +1,121 @@ +from ..bbot_fixtures import * + + +@pytest.mark.asyncio +async def test_dns(bbot_scanner, bbot_config): + scan = bbot_scanner("8.8.8.8") + helpers = scan.helpers + + # lowest level functions + a_responses = await helpers._resolve_hostname("dns.google") + aaaa_responses = await helpers._resolve_hostname("dns.google", rdtype="AAAA") + ip_responses = await helpers._resolve_ip("8.8.8.8") + assert a_responses[0].response.answer[0][0].address in ("8.8.8.8", "8.8.4.4") + assert aaaa_responses[0].response.answer[0][0].address in ("2001:4860:4860::8888", "2001:4860:4860::8844") + assert ip_responses[0].response.answer[0][0].target.to_text() in ("dns.google.",) + + # mid level functions + _responses, errors = await helpers.resolve_raw("dns.google") + responses = [] + for rdtype, response in _responses: + for answers in response: + responses += list(helpers.extract_targets(answers)) + assert ("A", "8.8.8.8") in responses + _responses, errors = await helpers.resolve_raw("dns.google", rdtype="AAAA") + responses = [] + for rdtype, response in _responses: + for answers in response: + responses += list(helpers.extract_targets(answers)) + assert ("AAAA", "2001:4860:4860::8888") in responses + _responses, errors = await helpers.resolve_raw("8.8.8.8") + responses = [] + for rdtype, response in _responses: + for answers in response: + responses += list(helpers.extract_targets(answers)) + assert ("PTR", "dns.google") in responses + + # high level functions + assert "8.8.8.8" in await helpers.resolve("dns.google") + assert "2001:4860:4860::8888" in await helpers.resolve("dns.google", type="AAAA") + assert "dns.google" in await helpers.resolve("8.8.8.8") + for rdtype in ("NS", "SOA", "MX", "TXT"): + assert len(await helpers.resolve("google.com", type=rdtype)) > 0 + + # batch resolution + batch_results = [r async for r in helpers.resolve_batch(["8.8.8.8", "dns.google"])] + assert len(batch_results) == 2 + batch_results = dict(batch_results) + assert any([x in batch_results["dns.google"] for x in ("8.8.8.8", "8.8.4.4")]) + assert "dns.google" in batch_results["8.8.8.8"] + + # "any" type + resolved = await helpers.resolve("google.com", type="any") + assert any([helpers.is_subdomain(h) for h in resolved]) + + # dns cache + assert hash(f"8.8.8.8:PTR") not in helpers.dns._dns_cache + assert 
hash(f"dns.google:A") not in helpers.dns._dns_cache + assert hash(f"dns.google:AAAA") not in helpers.dns._dns_cache + await helpers.resolve("8.8.8.8", cache_result=True) + assert hash(f"8.8.8.8:PTR") in helpers.dns._dns_cache + await helpers.resolve("dns.google", cache_result=True) + assert hash(f"dns.google:A") in helpers.dns._dns_cache + assert hash(f"dns.google:AAAA") in helpers.dns._dns_cache + + # wildcards + wildcard_domains = await helpers.is_wildcard_domain("asdf.github.io") + assert "github.io" in wildcard_domains + assert "A" in wildcard_domains["github.io"] + assert "SRV" not in wildcard_domains["github.io"] + assert wildcard_domains["github.io"]["A"] and all(helpers.is_ip(r) for r in wildcard_domains["github.io"]["A"]) + + wildcard_rdtypes = await helpers.is_wildcard("blacklanternsecurity.github.io") + assert "A" in wildcard_rdtypes + assert "SRV" not in wildcard_rdtypes + assert wildcard_rdtypes["A"] == (True, "github.io") + assert hash("github.io") in helpers.dns._wildcard_cache + assert len(helpers.dns._wildcard_cache[hash("github.io")]) > 0 + helpers.dns._wildcard_cache.clear() + + wildcard_rdtypes = await helpers.is_wildcard("asdf.asdf.asdf.github.io") + assert "A" in wildcard_rdtypes + assert "SRV" not in wildcard_rdtypes + assert wildcard_rdtypes["A"] == (True, "github.io") + assert hash("github.io") in helpers.dns._wildcard_cache + assert len(helpers.dns._wildcard_cache[hash("github.io")]) > 0 + wildcard_event1 = scan.make_event("wat.asdf.fdsa.github.io", "DNS_NAME", dummy=True) + wildcard_event2 = scan.make_event("wats.asd.fdsa.github.io", "DNS_NAME", dummy=True) + wildcard_event3 = scan.make_event("github.io", "DNS_NAME", dummy=True) + + # event resolution + event_tags1, event_whitelisted1, event_blacklisted1, children1 = await scan.helpers.resolve_event(wildcard_event1) + event_tags2, event_whitelisted2, event_blacklisted2, children2 = await scan.helpers.resolve_event(wildcard_event2) + event_tags3, event_whitelisted3, event_blacklisted3, children3 = await scan.helpers.resolve_event(wildcard_event3) + await helpers.handle_wildcard_event(wildcard_event1, children1) + await helpers.handle_wildcard_event(wildcard_event2, children2) + await helpers.handle_wildcard_event(wildcard_event3, children3) + assert "wildcard" in wildcard_event1.tags + assert "a-wildcard" in wildcard_event1.tags + assert "srv-wildcard" not in wildcard_event1.tags + assert "wildcard" in wildcard_event2.tags + assert "a-wildcard" in wildcard_event2.tags + assert "srv-wildcard" not in wildcard_event2.tags + assert wildcard_event1.data == "_wildcard.github.io" + assert wildcard_event2.data == "_wildcard.github.io" + assert wildcard_event1.tags == wildcard_event2.tags + assert "wildcard-domain" in wildcard_event3.tags + assert "a-wildcard-domain" in wildcard_event3.tags + assert "srv-wildcard-domain" not in wildcard_event3.tags + + # Ensure events with hosts have resolved_hosts attribute populated + resolved_hosts_event1 = scan.make_event("dns.google", "DNS_NAME", dummy=True) + resolved_hosts_event2 = scan.make_event("http://dns.google/", "URL_UNVERIFIED", dummy=True) + event_tags1, event_whitelisted1, event_blacklisted1, children1 = await scan.helpers.resolve_event( + resolved_hosts_event1 + ) + event_tags2, event_whitelisted2, event_blacklisted2, children2 = await scan.helpers.resolve_event( + resolved_hosts_event2 + ) + assert "8.8.8.8" in [str(x) for x in children1["A"]] + assert "8.8.8.8" in [str(x) for x in children2["A"]] + assert set(children1.keys()) == set(children2.keys()) diff --git 
a/bbot/test/test_step_2/test_http.py b/bbot/test/test_step_2/test_http.py new file mode 100644 index 0000000000..47b6c584dc --- /dev/null +++ b/bbot/test/test_step_2/test_http.py @@ -0,0 +1,74 @@ +from ..bbot_fixtures import * + + +@pytest.mark.asyncio +async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): + scan1 = bbot_scanner("8.8.8.8", config=bbot_config) + scan2 = bbot_scanner("127.0.0.1", config=bbot_config) + + user_agent = bbot_config.get("user_agent", "") + headers = {"User-Agent": user_agent} + custom_headers = bbot_config.get("http_headers", {}) + headers.update(custom_headers) + assert headers["test"] == "header" + + url = bbot_httpserver.url_for("/test_http_helpers") + # test user agent + custom headers + bbot_httpserver.expect_request(uri="/test_http_helpers", headers=headers).respond_with_data( + "test_http_helpers_yep" + ) + response = await scan1.helpers.request_async(url) + # should fail because URL is not in-scope + assert response.status_code == 500 + response = await scan2.helpers.request_async(url) + # should succeed because URL is in-scope + assert response.status_code == 200 + assert response.text == "test_http_helpers_yep" + + # download file + path = "/test_http_helpers_download" + url = bbot_httpserver.url_for(path) + download_content = "test_http_helpers_download_yep" + bbot_httpserver.expect_request(uri=path).respond_with_data(download_content) + filename = await scan1.helpers.download_async(url) + assert Path(str(filename)).is_file() + assert scan1.helpers.is_cached(url) + with open(filename) as f: + assert f.read() == download_content + # 404 + path = "/test_http_helpers_download_404" + url = bbot_httpserver.url_for(path) + download_content = "404" + bbot_httpserver.expect_request(uri=path).respond_with_data(download_content, status=404) + filename = await scan1.helpers.download_async(url) + assert filename is None + assert not scan1.helpers.is_cached(url) + + # wordlist + path = "/test_http_helpers_wordlist" + url = bbot_httpserver.url_for(path) + download_content = "a\ncool\nword\nlist" + bbot_httpserver.expect_request(uri=path).respond_with_data(download_content) + filename = await scan1.helpers.wordlist_async(url) + assert Path(str(filename)).is_file() + assert scan1.helpers.is_cached(url) + with open(filename) as f: + assert f.read().splitlines() == ["a", "cool", "word", "list"] + + +@pytest.mark.asyncio +async def test_http_interactsh(bbot_scanner, bbot_config, bbot_httpserver): + from bbot.core.helpers.interactsh import server_list + + scan1 = bbot_scanner("8.8.8.8", config=bbot_config) + + interactsh_client = scan1.helpers.interactsh() + + async def async_callback(data): + log.debug(f"interactsh poll: {data}") + + interactsh_domain = await interactsh_client.register(callback=async_callback) + assert any(interactsh_domain.endswith(f"{s}") for s in server_list) + data_list = await interactsh_client.poll() + assert isinstance(data_list, list) + assert await interactsh_client.deregister() is None diff --git a/poetry.lock b/poetry.lock index a032ccadeb..f0fdf18237 100644 --- a/poetry.lock +++ b/poetry.lock @@ -64,6 +64,27 @@ files = [ {file = "antlr4-python3-runtime-4.9.3.tar.gz", hash = "sha256:f224469b4168294902bb1efa80a8bf7855f24c99aef99cbefc1bcd3cce77881b"}, ] +[[package]] +name = "anyio" +version = "3.6.2" +description = "High level compatibility layer for multiple asynchronous event loop implementations" +category = "main" +optional = false +python-versions = ">=3.6.2" +files = [ + {file = "anyio-3.6.2-py3-none-any.whl", hash = 
"sha256:fbbe32bd270d2a2ef3ed1c5d45041250284e31fc0a4df4a5a6071842051a51e3"}, + {file = "anyio-3.6.2.tar.gz", hash = "sha256:25ea0d673ae30af41a0c442f81cf3b38c7e79fdc7b60335a4c14e05eb0947421"}, +] + +[package.dependencies] +idna = ">=2.8" +sniffio = ">=1.1" + +[package.extras] +doc = ["packaging", "sphinx-autodoc-typehints (>=1.2.0)", "sphinx-rtd-theme"] +test = ["contextlib2", "coverage[toml] (>=4.5)", "hypothesis (>=4.0)", "mock (>=4)", "pytest (>=7.0)", "pytest-mock (>=3.6.1)", "trustme", "uvloop (<0.15)", "uvloop (>=0.15)"] +trio = ["trio (>=0.16,<0.22)"] + [[package]] name = "appdirs" version = "1.4.4" @@ -602,6 +623,105 @@ mccabe = ">=0.7.0,<0.8.0" pycodestyle = ">=2.10.0,<2.11.0" pyflakes = ">=3.0.0,<3.1.0" +[[package]] +name = "h11" +version = "0.14.0" +description = "A pure-Python, bring-your-own-I/O implementation of HTTP/1.1" +category = "main" +optional = false +python-versions = ">=3.7" +files = [ + {file = "h11-0.14.0-py3-none-any.whl", hash = "sha256:e3fe4ac4b851c468cc8363d500db52c2ead036020723024a109d37346efaa761"}, + {file = "h11-0.14.0.tar.gz", hash = "sha256:8f19fbbe99e72420ff35c00b27a34cb9937e902a8b810e2c88300c6f0a3b699d"}, +] + +[[package]] +name = "h2" +version = "4.1.0" +description = "HTTP/2 State-Machine based protocol implementation" +category = "main" +optional = false +python-versions = ">=3.6.1" +files = [ + {file = "h2-4.1.0-py3-none-any.whl", hash = "sha256:03a46bcf682256c95b5fd9e9a99c1323584c3eec6440d379b9903d709476bc6d"}, + {file = "h2-4.1.0.tar.gz", hash = "sha256:a83aca08fbe7aacb79fec788c9c0bac936343560ed9ec18b82a13a12c28d2abb"}, +] + +[package.dependencies] +hpack = ">=4.0,<5" +hyperframe = ">=6.0,<7" + +[[package]] +name = "hpack" +version = "4.0.0" +description = "Pure-Python HPACK header compression" +category = "main" +optional = false +python-versions = ">=3.6.1" +files = [ + {file = "hpack-4.0.0-py3-none-any.whl", hash = "sha256:84a076fad3dc9a9f8063ccb8041ef100867b1878b25ef0ee63847a5d53818a6c"}, + {file = "hpack-4.0.0.tar.gz", hash = "sha256:fc41de0c63e687ebffde81187a948221294896f6bdc0ae2312708df339430095"}, +] + +[[package]] +name = "httpcore" +version = "0.17.0" +description = "A minimal low-level HTTP client." +category = "main" +optional = false +python-versions = ">=3.7" +files = [ + {file = "httpcore-0.17.0-py3-none-any.whl", hash = "sha256:0fdfea45e94f0c9fd96eab9286077f9ff788dd186635ae61b312693e4d943599"}, + {file = "httpcore-0.17.0.tar.gz", hash = "sha256:cc045a3241afbf60ce056202301b4d8b6af08845e3294055eb26b09913ef903c"}, +] + +[package.dependencies] +anyio = ">=3.0,<5.0" +certifi = "*" +h11 = ">=0.13,<0.15" +sniffio = ">=1.0.0,<2.0.0" + +[package.extras] +http2 = ["h2 (>=3,<5)"] +socks = ["socksio (>=1.0.0,<2.0.0)"] + +[[package]] +name = "httpx" +version = "0.24.0" +description = "The next generation HTTP client." 
+category = "main" +optional = false +python-versions = ">=3.7" +files = [ + {file = "httpx-0.24.0-py3-none-any.whl", hash = "sha256:447556b50c1921c351ea54b4fe79d91b724ed2b027462ab9a329465d147d5a4e"}, + {file = "httpx-0.24.0.tar.gz", hash = "sha256:507d676fc3e26110d41df7d35ebd8b3b8585052450f4097401c9be59d928c63e"}, +] + +[package.dependencies] +certifi = "*" +h2 = {version = ">=3,<5", optional = true, markers = "extra == \"http2\""} +httpcore = ">=0.15.0,<0.18.0" +idna = "*" +sniffio = "*" + +[package.extras] +brotli = ["brotli", "brotlicffi"] +cli = ["click (>=8.0.0,<9.0.0)", "pygments (>=2.0.0,<3.0.0)", "rich (>=10,<14)"] +http2 = ["h2 (>=3,<5)"] +socks = ["socksio (>=1.0.0,<2.0.0)"] + +[[package]] +name = "hyperframe" +version = "6.0.1" +description = "HTTP/2 framing layer for Python" +category = "main" +optional = false +python-versions = ">=3.6.1" +files = [ + {file = "hyperframe-6.0.1-py3-none-any.whl", hash = "sha256:0ec6bafd80d8ad2195c4f03aacba3a8265e57bc4cff261e802bf39970ed02a15"}, + {file = "hyperframe-6.0.1.tar.gz", hash = "sha256:ae510046231dc8e9ecb1a6586f63d2347bf4c8905914aa84ba585ae85f28a914"}, +] + [[package]] name = "idna" version = "3.4" @@ -1333,6 +1453,18 @@ files = [ {file = "six-1.16.0.tar.gz", hash = "sha256:1e61c37477a1626458e36f7b1d82aa5c9b094fa4802892072e49de9c60c4c926"}, ] +[[package]] +name = "sniffio" +version = "1.3.0" +description = "Sniff out which async library your code is running under" +category = "main" +optional = false +python-versions = ">=3.7" +files = [ + {file = "sniffio-1.3.0-py3-none-any.whl", hash = "sha256:eecefdce1e5bbfb7ad2eeaabf7c1eeb404d7757c379bd1f7e5cce9d8bf425384"}, + {file = "sniffio-1.3.0.tar.gz", hash = "sha256:e60305c5e5d314f5389259b7f22aaa33d8f7dee49763119234af3755c55b9101"}, +] + [[package]] name = "tabulate" version = "0.8.10" @@ -1573,4 +1705,4 @@ xmltodict = ">=0.12.0,<0.13.0" [metadata] lock-version = "2.0" python-versions = "^3.9" -content-hash = "eee5683fb3dcc73b282ac84c49503087af4b618d1c03d9919fb099e0c2395fb0" +content-hash = "7d520e30d4c148bb627da6aea282645e5e3452faeb11798bef27ae81d1941f88" diff --git a/pyproject.toml b/pyproject.toml index 846c307e13..cebea306f8 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -29,6 +29,7 @@ ansible = "^7.3.0" tabulate = "0.8.10" cloudcheck = "^2.0.0.34" websockets = "^11.0.2" +httpx = {extras = ["http2"], version = "^0.24.0"} [tool.poetry.group.dev.dependencies] pytest = "^7.2.2" From eaffce0d13bd6dc251de6a535001f0e8d36f8dd7 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 8 May 2023 16:33:50 -0400 Subject: [PATCH 007/387] subprocess, massdns working --- bbot/core/helpers/command.py | 245 ++++++----------- bbot/core/helpers/files.py | 102 ++++++++ bbot/core/helpers/helper.py | 6 +- bbot/core/helpers/interactsh.py | 6 +- bbot/core/helpers/names_generator.py | 3 + bbot/core/helpers/web.py | 361 +++++++------------------- bbot/modules/base.py | 8 +- bbot/modules/crobat.py | 16 +- bbot/modules/internal/speculate.py | 2 +- bbot/modules/massdns.py | 48 ++-- bbot/scanner/scanner.py | 4 +- bbot/test/test_step_2/test_command.py | 63 +++++ bbot/test/test_step_2/test_files.py | 22 ++ bbot/test/test_step_2/test_helpers.py | 93 ------- bbot/test/test_step_2/test_http.py | 48 +++- poetry.lock | 12 +- pyproject.toml | 1 - 17 files changed, 456 insertions(+), 584 deletions(-) create mode 100644 bbot/core/helpers/files.py create mode 100644 bbot/test/test_step_2/test_command.py create mode 100644 bbot/test/test_step_2/test_files.py diff --git a/bbot/core/helpers/command.py 
b/bbot/core/helpers/command.py index 03c0d2f04d..65b376bf66 100644 --- a/bbot/core/helpers/command.py +++ b/bbot/core/helpers/command.py @@ -1,94 +1,104 @@ -import io import os +import asyncio import logging -import threading import traceback -import subprocess -from contextlib import suppress +from subprocess import CompletedProcess -from .misc import smart_decode, rm_at_exit +from .misc import smart_decode, smart_encode log = logging.getLogger("bbot.core.helpers.command") -def run_live(self, command, *args, **kwargs): +async def run(self, *command, **kwargs): """ - Get live output, line by line, as a process executes - You can also pass input= and pipe data into the process' stdin - - This lets you chain processes like so: + Simple helper for running a command, and getting its output as a string + process = await run(["ls", "/tmp"]) + process.stdout --> "file1.txt\nfile2.txt" + """ + proc, _input = await self._spawn_proc(*command, **kwargs) + if proc is not None: + if _input is not None: + _input = smart_encode(_input) + stdout, stderr = await proc.communicate(_input) + + # surface stderr + stderr = smart_decode(stderr) + stdout = smart_decode(stdout) + if stderr and proc.returncode != 0: + command_str = " ".join(command) + log.warning(f"Stderr for {command_str}:\n\t{stderr}") - ls_process = run_live(["ls", "/etc"]) - grep_process = run_live(["grep", "conf"], input=ls_process) - for line in grep_process: - log.success(line) + return CompletedProcess(command, proc.returncode, stdout, stderr) - - The above is roughly equivalent to: - ls /etc | grep conf - NOTE: STDERR is logged after the process exits, if its exit code is non-zero - If you want to see it immediately, pass stderr=None +async def run_live(self, *command, **kwargs): """ - command, kwargs = self._prepare_command_kwargs(command, kwargs) - _input = kwargs.pop("input", "") - input_msg = "" - if _input: - kwargs["stdin"] = subprocess.PIPE - input_msg = " (with stdin)" - log.hugeverbose(f"run_live{input_msg}: {' '.join(command)}") - try: - with catch(subprocess.Popen, command, *args, **kwargs) as process: - if _input: - if type(_input) in (str, bytes): - _input = (_input,) - self.feed_pipe(process.stdin, _input, text=False) - for line in io.TextIOWrapper(process.stdout, encoding="utf-8", errors="ignore", line_buffering=True): - yield line - - # surface stderr - process.wait() - if process.stderr and process.returncode != 0: - stderr = smart_decode(process.stderr.read()) - if stderr: - command_str = " ".join(command) - log.warning(f"Stderr for {command_str}:\n\t{stderr}") - except AttributeError as e: - if not str(e) == "__enter__": - raise - - -def run(self, command, *args, **kwargs): + Simple helper for running a command and iterating through its output line by line in realtime + async for line in run_live(["ls", "/tmp"]): + log.info(line) """ - Simple helper for running a command, and getting its output as a string - process = run(["ls", "/tmp"]) - process.stdout --> "file1.txt\nfile2.txt" + proc, _input = await self._spawn_proc(*command, **kwargs) + if proc is not None: + input_task = None + if _input is not None: + input_task = asyncio.create_task(_write_stdin(proc, _input)) + + while 1: + line = await proc.stdout.readline() + if not line: + break + yield smart_decode(line).rstrip("\r\n") + + if input_task is not None: + await input_task + await proc.wait() + + # surface stderr + # if proc.stderr and proc.returncode != 0: + # command_str = " ".join(command) + # log.warning(f"Stderr for {command_str}:\n\t{stderr}") + +
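+# Usage sketch (illustrative only, not part of the module; assumes a helper
+# instance `helpers` exposing run()/run_live() and the module-level `log`):
+#
+#     # capture everything at once; returns a subprocess.CompletedProcess
+#     result = await helpers.run("ls", "/tmp")
+#     log.info(result.stdout)
+#
+#     # stream output, chaining one process into another (~ `ls /etc | grep conf`),
+#     # since run_live() both yields lines and accepts an async generator via input=
+#     ls_lines = helpers.run_live("ls", "/etc")
+#     async for line in helpers.run_live("grep", "conf", input=ls_lines):
+#         log.success(line)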
+async def _spawn_proc(self, *command, **kwargs): + command, kwargs = self._prepare_command_kwargs_async(command, kwargs) + _input = kwargs.pop("input", None) + if _input is not None: + if kwargs.get("stdin") is not None: + raise ValueError("stdin and input arguments may not both be used.") + kwargs["stdin"] = asyncio.subprocess.PIPE - Simple helper for running a command, and getting its output as a string - process = run(["ls", "/tmp"]) - process.stdout --> "file1.txt\nfile2.txt" + NOTE: STDERR is captured (not displayed) by default. - If you want to see it, self.debug(process.stderr) or pass stderr=None - """ - command, kwargs = self._prepare_command_kwargs(command, kwargs) - if not "text" in kwargs: - kwargs["text"] = True log.hugeverbose(f"run: {' '.join(command)}") - result = catch(subprocess.run, command, *args, **kwargs) + try: + proc = await asyncio.create_subprocess_exec(*command, **kwargs) + return proc, _input + except FileNotFoundError as e: + log.warning(f"{e} - missing executable?") + log.trace(traceback.format_exc()) + return None, None - # surface stderr - if result.stderr and result.returncode != 0: - stderr = smart_decode(result.stderr) - if stderr: - command_str = " ".join(command) - log.warning(f"Stderr for {command_str}:\n\t{stderr}") - return result +async def _write_stdin(proc, _input): + if _input is not None: + if isinstance(_input, str): + proc.stdin.write(smart_encode(_input)) + else: + async for chunk in _input: + proc.stdin.write(smart_encode(chunk) + b"\n") + await proc.stdin.drain() + proc.stdin.close() -def _prepare_command_kwargs(self, command, kwargs): +def _prepare_command_kwargs_async(self, command, kwargs): if not "stdout" in kwargs: - kwargs["stdout"] = subprocess.PIPE + kwargs["stdout"] = asyncio.subprocess.PIPE if not "stderr" in kwargs: - kwargs["stderr"] = subprocess.PIPE + kwargs["stderr"] = asyncio.subprocess.PIPE sudo = kwargs.pop("sudo", False) + if len(command) == 1 and isinstance(command[0], (list, tuple)): + command = command[0] command = [str(s) for s in command] + env = kwargs.get("env", os.environ) if sudo and os.geteuid() != 0: self.depsinstaller.ensure_root() @@ -100,106 +110,3 @@ def _prepare_command_kwargs(self, command, kwargs): LD_LIBRARY_PATH = os.environ.get("LD_LIBRARY_PATH", "") command = ["sudo", "-E", "-A", f"LD_LIBRARY_PATH={LD_LIBRARY_PATH}", f"PATH={PATH}"] + command return command, kwargs - - -def catch(callback, *args, **kwargs): - try: - return callback(*args, **kwargs) - except FileNotFoundError as e: - log.warning(f"{e} - missing executable?") - log.trace(traceback.format_exc()) - except BrokenPipeError as e: - log.warning(f"Error in subprocess: {e}") - log.trace(traceback.format_exc()) - - -def tempfile(self, content, pipe=True): - """ - tempfile(["temp", "file", "content"]) --> Path("/home/user/.bbot/temp/pgxml13bov87oqrvjz7a") - - if "pipe" is True (the default), a named pipe is used instead of - a true file, which allows python data to be piped directly into the - process without taking up disk space - """ - filename = self.temp_filename() - rm_at_exit(filename) - try: - if type(content) not in (set, list, tuple): - content = (content,) - if pipe: - os.mkfifo(filename) - self.feed_pipe(filename, content, text=True) - else: - with open(filename, "w", errors="ignore") as f: - for c in content: - line = f"{self.smart_decode(c)}\n" - f.write(line) - except Exception as e: - log.error(f"Error creating temp file: {e}") - log.trace(traceback.format_exc()) - - return filename - - -def _feed_pipe(self, pipe, content, text=True): - try: - if text: - decode_fn = self.smart_decode - newline = "\n" - else: - decode_fn = self.smart_encode - newline = b"\n" - try: - if hasattr(pipe, 
"write"): - try: - for c in content: - pipe.write(decode_fn(c) + newline) - finally: - with suppress(Exception): - pipe.close() - else: - with open(pipe, "w") as p: - for c in content: - p.write(decode_fn(c) + newline) - except BrokenPipeError: - log.debug(f"Broken pipe in _feed_pipe()") - except ValueError: - log.debug(f"Error _feed_pipe(): {traceback.format_exc()}") - except KeyboardInterrupt: - self.scan.stop() - except Exception as e: - log.error(f"Error in _feed_pipe(): {e}") - log.trace(traceback.format_exc()) - - -def feed_pipe(self, pipe, content, text=True): - t = threading.Thread(target=self._feed_pipe, args=(pipe, content), kwargs={"text": text}, daemon=True) - t.start() - - -def tempfile_tail(self, callback): - """ - Create a named pipe and execute a callback on each line - """ - filename = self.temp_filename() - rm_at_exit(filename) - try: - os.mkfifo(filename) - t = threading.Thread(target=tail, args=(filename, callback), daemon=True) - t.start() - except Exception as e: - log.error(f"Error setting up tail for file {filename}: {e}") - log.trace(traceback.format_exc()) - return - return filename - - -def tail(filename, callback): - try: - with open(filename, errors="ignore") as f: - for line in f: - line = line.rstrip("\r\n") - callback(line) - except Exception as e: - log.error(f"Error tailing file {filename}: {e}") - log.trace(traceback.format_exc()) diff --git a/bbot/core/helpers/files.py b/bbot/core/helpers/files.py new file mode 100644 index 0000000000..27ed71948d --- /dev/null +++ b/bbot/core/helpers/files.py @@ -0,0 +1,102 @@ +import os +import logging +import threading +import traceback +from contextlib import suppress + +from .misc import rm_at_exit + + +log = logging.getLogger("bbot.core.helpers.files") + + +def tempfile(self, content, pipe=True): + """ + tempfile(["temp", "file", "content"]) --> Path("/home/user/.bbot/temp/pgxml13bov87oqrvjz7a") + + if "pipe" is True (the default), a named pipe is used instead of + a true file, which allows python data to be piped directly into the + process without taking up disk space + """ + filename = self.temp_filename() + rm_at_exit(filename) + try: + if type(content) not in (set, list, tuple): + content = (content,) + if pipe: + os.mkfifo(filename) + self.feed_pipe(filename, content, text=True) + else: + with open(filename, "w", errors="ignore") as f: + for c in content: + line = f"{self.smart_decode(c)}\n" + f.write(line) + except Exception as e: + log.error(f"Error creating temp file: {e}") + log.trace(traceback.format_exc()) + + return filename + + +def _feed_pipe(self, pipe, content, text=True): + try: + if text: + decode_fn = self.smart_decode + newline = "\n" + else: + decode_fn = self.smart_encode + newline = b"\n" + try: + if hasattr(pipe, "write"): + try: + for c in content: + pipe.write(decode_fn(c) + newline) + finally: + with suppress(Exception): + pipe.close() + else: + with open(pipe, "w") as p: + for c in content: + p.write(decode_fn(c) + newline) + except BrokenPipeError: + log.debug(f"Broken pipe in _feed_pipe()") + except ValueError: + log.debug(f"Error _feed_pipe(): {traceback.format_exc()}") + except KeyboardInterrupt: + self.scan.stop() + except Exception as e: + log.error(f"Error in _feed_pipe(): {e}") + log.trace(traceback.format_exc()) + + +def feed_pipe(self, pipe, content, text=True): + t = threading.Thread(target=self._feed_pipe, args=(pipe, content), kwargs={"text": text}, daemon=True) + t.start() + + +def tempfile_tail(self, callback): + """ + Create a named pipe and execute a callback on each 
line + """ + filename = self.temp_filename() + rm_at_exit(filename) + try: + os.mkfifo(filename) + t = threading.Thread(target=tail, args=(filename, callback), daemon=True) + t.start() + except Exception as e: + log.error(f"Error setting up tail for file {filename}: {e}") + log.trace(traceback.format_exc()) + return + return filename + + +def tail(filename, callback): + try: + with open(filename, errors="ignore") as f: + for line in f: + line = line.rstrip("\r\n") + callback(line) + except Exception as e: + log.error(f"Error tailing file {filename}: {e}") + log.trace(traceback.format_exc()) diff --git a/bbot/core/helpers/helper.py b/bbot/core/helpers/helper.py index f7c345e544..cff12d7848 100644 --- a/bbot/core/helpers/helper.py +++ b/bbot/core/helpers/helper.py @@ -19,12 +19,12 @@ class ConfigAwareHelper: - from .web import wordlist, request, download, api_page_iter, curl - from .cache import cache_get, cache_put, cache_filename, is_cached, CacheDict - from .command import run, run_live, _prepare_command_kwargs, tempfile, feed_pipe, _feed_pipe, tempfile_tail from . import ntlm from . import regexes from . import validators + from .files import tempfile, feed_pipe, _feed_pipe, tempfile_tail + from .cache import cache_get, cache_put, cache_filename, is_cached, CacheDict + from .command import run, run_live, _spawn_proc, _prepare_command_kwargs_async def __init__(self, config, scan=None): self.config = config diff --git a/bbot/core/helpers/interactsh.py b/bbot/core/helpers/interactsh.py index b79c4cb6a3..f3303960f4 100644 --- a/bbot/core/helpers/interactsh.py +++ b/bbot/core/helpers/interactsh.py @@ -56,7 +56,7 @@ async def register(self, callback=None): "secret-key": self.secret, "correlation-id": self.correlation_id, } - r = await self.parent_helper.request_async( + r = await self.parent_helper.request( f"https://{server}/register", headers=headers, json=data, method="POST" ) if r is None: @@ -93,7 +93,7 @@ async def deregister(self): data = {"secret-key": self.secret, "correlation-id": self.correlation_id} - r = await self.parent_helper.request_async( + r = await self.parent_helper.request( f"https://{self.server}/deregister", headers=headers, json=data, method="POST" ) @@ -111,7 +111,7 @@ async def poll(self): if self.token: headers["Authorization"] = self.token - r = await self.parent_helper.request_async( + r = await self.parent_helper.request( f"https://{self.server}/poll?id={self.correlation_id}&secret={self.secret}", headers=headers ) diff --git a/bbot/core/helpers/names_generator.py b/bbot/core/helpers/names_generator.py index 50521de030..1dae35c4f6 100644 --- a/bbot/core/helpers/names_generator.py +++ b/bbot/core/helpers/names_generator.py @@ -44,6 +44,7 @@ "decrypted", "deep", "delicious", + "demented", "demonic", "depraved", "depressed", @@ -77,6 +78,7 @@ "ferocious", "fiendish", "fierce", + "flamboyant", "fleecy", "flirtatious", "flustered", @@ -127,6 +129,7 @@ "liquid", "loveable", "lovely", + "lucid", "malevolent", "malfunctioning", "malicious", diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index 60d7b88cdd..3d44e298cc 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -1,175 +1,13 @@ import httpx import logging -import requests -from time import sleep +import traceback from pathlib import Path -from requests_cache import CachedSession -from requests.adapters import HTTPAdapter -from requests_cache.backends import SQLiteCache -from requests.exceptions import RequestException from bbot.core.errors import WordlistError, CurlError log = 
logging.getLogger("bbot.core.helpers.web") -def wordlist(self, path, lines=None, **kwargs): - if not path: - raise WordlistError(f"Invalid wordlist: {path}") - if not "cache_hrs" in kwargs: - kwargs["cache_hrs"] = 720 - if self.is_url(path): - filename = self.download(str(path), **kwargs) - if filename is None: - raise WordlistError(f"Unable to retrieve wordlist from {path}") - else: - filename = Path(path).resolve() - if not filename.is_file(): - raise WordlistError(f"Unable to find wordlist at {path}") - - if lines is None: - return filename - else: - lines = int(lines) - with open(filename) as f: - read_lines = f.readlines() - cache_key = f"{filename}:{lines}" - truncated_filename = self.cache_filename(cache_key) - with open(truncated_filename, "w") as f: - for line in read_lines[:lines]: - f.write(line) - return truncated_filename - - -def download(self, url, **kwargs): - """ - Downloads file, returns full path of filename - If download failed, returns None - - Caching supported via "cache_hrs" - """ - success = False - filename = self.cache_filename(url) - cache_hrs = float(kwargs.pop("cache_hrs", -1)) - log.debug(f"Downloading file from {url} with cache_hrs={cache_hrs}") - if cache_hrs > 0 and self.is_cached(url): - log.debug(f"{url} is cached") - success = True - else: - method = kwargs.get("method", "GET") - try: - with self.request(method=method, url=url, stream=True, raise_error=True, **kwargs) as response: - status_code = getattr(response, "status_code", 0) - log.debug(f"Download result: HTTP {status_code}") - if status_code != 0: - response.raise_for_status() - with open(filename, "wb") as f: - for chunk in response.iter_content(chunk_size=8192): - f.write(chunk) - success = True - except RequestException as e: - log.warning(f"Failed to download {url}: {e}") - return - except AttributeError: - return - - if success: - return filename.resolve() - - -def request(self, *args, **kwargs): - """ - Multipurpose function for making web requests - - Supports custom sessions - session Request.Session() - - Arguments - cache_for (Union[None, int, float, str, datetime, timedelta]): Cache response for seconds - raise_error (bool): Whether to raise exceptions (default: False) - """ - - # we handle our own retries - retries = kwargs.pop("retries", self.config.get("http_retries", 1)) - if getattr(self, "retry_adapter", None) is None: - self.retry_adapter = HTTPAdapter(max_retries=0) - - raise_error = kwargs.pop("raise_error", False) - - cache_for = kwargs.pop("cache_for", None) - if cache_for is not None: - log.debug(f"Caching HTTP session with expire_after={cache_for}") - db_path = str(self.cache_dir / "requests-cache.sqlite") - backend = SQLiteCache(db_path=db_path) - session = CachedSession(expire_after=cache_for, backend=backend) - session.mount("http://", self.retry_adapter) - session.mount("https://", self.retry_adapter) - elif kwargs.get("session", None) is not None: - session = kwargs.pop("session", None) - session.mount("http://", self.retry_adapter) - session.mount("https://", self.retry_adapter) - else: - session = requests.Session() - session.mount("http://", self.retry_adapter) - session.mount("https://", self.retry_adapter) - - http_timeout = self.config.get("http_timeout", 20) - user_agent = self.config.get("user_agent", "BBOT") - - # in case of URL only, assume GET request - if len(args) == 1: - kwargs["url"] = args[0] - args = [] - - url = kwargs.get("url", "") - - if not args and "method" not in kwargs: - kwargs["method"] = "GET" - - if not "timeout" in kwargs: - 
kwargs["timeout"] = http_timeout - - headers = kwargs.get("headers", None) - - if headers is None: - headers = {} - if "User-Agent" not in headers: - headers.update({"User-Agent": user_agent}) - # only add custom headers if the URL is in-scope - if self.scan.in_scope(url): - for hk, hv in self.scan.config.get("http_headers", {}).items(): - # don't clobber headers - if hk not in headers: - headers[hk] = hv - kwargs["headers"] = headers - - http_debug = self.config.get("http_debug", False) - while retries == "infinite" or retries >= 0: - try: - if http_debug: - logstr = f"Web request: {str(args)}, {str(kwargs)}" - log.debug(logstr) - if session is not None: - response = session.request(*args, **kwargs) - else: - response = requests.request(*args, **kwargs) - if http_debug: - log.debug(f"Web response: {response} (Length: {len(response.content)}) headers: {response.headers}") - return response - except RequestException as e: - log.debug(f"Error with request: {e}") - if self.parent_helper.scan_stopping: - break - if retries != "infinite": - retries -= 1 - if retries == "infinite" or retries >= 0: - log.verbose(f'Error requesting "{url}" ({e}), retrying...') - sleep(1) - else: - if raise_error: - raise e - - class BBOTAsyncClient(httpx.AsyncClient): def __init__(self, *args, **kwargs): self._bbot_scan = kwargs.pop("_bbot_scan") @@ -217,7 +55,7 @@ def AsyncClient(self, *args, **kwargs): kwargs["transport"] = httpx.AsyncHTTPTransport(retries=retries) return BBOTAsyncClient(*args, **kwargs) - async def request_async(self, *args, **kwargs): + async def request(self, *args, **kwargs): raise_error = kwargs.pop("raise_error", False) # in case of URL only, assume GET request @@ -251,7 +89,7 @@ async def request_async(self, *args, **kwargs): if raise_error: raise - async def download_async(self, url, **kwargs): + async def download(self, url, **kwargs): """ Downloads file, returns full path of filename If download failed, returns None @@ -287,13 +125,13 @@ async def download_async(self, url, **kwargs): if success: return filename.resolve() - async def wordlist_async(self, path, lines=None, **kwargs): + async def wordlist(self, path, lines=None, **kwargs): if not path: raise WordlistError(f"Invalid wordlist: {path}") if not "cache_hrs" in kwargs: kwargs["cache_hrs"] = 720 if self.parent_helper.is_url(path): - filename = await self.download_async(str(path), **kwargs) + filename = await self.download(str(path), **kwargs) if filename is None: raise WordlistError(f"Unable to retrieve wordlist from {path}") else: @@ -314,115 +152,110 @@ async def wordlist_async(self, path, lines=None, **kwargs): f.write(line) return truncated_filename + async def api_page_iter(self, url, page_size=100, json=True, **requests_kwargs): + page = 1 + offset = 0 + while 1: + new_url = url.format(page=page, page_size=page_size, offset=offset) + result = await self.request(new_url, **requests_kwargs) + try: + if json: + result = result.json() + yield result + except Exception: + log.warning(f'Error in api_page_iter() for url: "{new_url}"') + log.trace(traceback.format_exc()) + break + finally: + offset += page_size + page += 1 -def api_page_iter(self, url, page_size=100, json=True, **requests_kwargs): - page = 1 - offset = 0 - while 1: - new_url = url.format(page=page, page_size=page_size, offset=offset) - result = self.request(new_url, **requests_kwargs) - try: - if json: - result = result.json() - yield result - except Exception: - import traceback - - log.warning(f'Error in api_page_iter() for url: "{new_url}"') - 
log.trace(traceback.format_exc()) - break - finally: - offset += page_size - page += 1 - + async def curl(self, *args, **kwargs): + url = kwargs.get("url", "") -def curl(self, *args, **kwargs): - url = kwargs.get("url", "") + if not url: + raise CurlError("No URL supplied to CURL helper") - if not url: - raise CurlError("No URL supplied to CURL helper") + curl_command = ["curl", url, "-s"] - curl_command = ["curl", url, "-s"] + raw_path = kwargs.get("raw_path", False) + if raw_path: + curl_command.append("--path-as-is") - raw_path = kwargs.get("raw_path", False) - if raw_path: - curl_command.append("--path-as-is") + # respect global ssl verify settings + ssl_verify = self.config.get("ssl_verify") + if ssl_verify == False: + curl_command.append("-k") - # respect global ssl verify settings - ssl_verify = self.config.get("ssl_verify") - if ssl_verify == False: - curl_command.append("-k") + headers = kwargs.get("headers", {}) - headers = kwargs.get("headers", {}) + ignore_bbot_global_settings = kwargs.get("ignore_bbot_global_settings", False) - ignore_bbot_global_settings = kwargs.get("ignore_bbot_global_settings", False) + if ignore_bbot_global_settings: + log.debug("ignore_bbot_global_settings enabled. Global settings will not be applied") + else: + http_timeout = self.config.get("http_timeout", 20) + user_agent = self.config.get("user_agent", "BBOT") - if ignore_bbot_global_settings: - log.debug("ignore_bbot_global_settings enabled. Global settings will not be applied") - else: - http_timeout = self.config.get("http_timeout", 20) - user_agent = self.config.get("user_agent", "BBOT") + if "User-Agent" not in headers: + headers["User-Agent"] = user_agent - if "User-Agent" not in headers: - headers["User-Agent"] = user_agent + # only add custom headers if the URL is in-scope + if self.scan.in_scope(url): + for hk, hv in self.scan.config.get("http_headers", {}).items(): + headers[hk] = hv - # only add custom headers if the URL is in-scope - if self.scan.in_scope(url): - for hk, hv in self.scan.config.get("http_headers", {}).items(): - headers[hk] = hv + # add the timeout + if not "timeout" in kwargs: + timeout = http_timeout - # add the timeout - if not "timeout" in kwargs: - timeout = http_timeout + curl_command.append("-m") + curl_command.append(str(timeout)) - curl_command.append("-m") - curl_command.append(str(timeout)) + for k, v in headers.items(): + if isinstance(v, list): + for x in v: + curl_command.append("-H") + curl_command.append(f"{k}: {x}") - for k, v in headers.items(): - if isinstance(v, list): - for x in v: + else: curl_command.append("-H") - curl_command.append(f"{k}: {x}") - - else: - curl_command.append("-H") - curl_command.append(f"{k}: {v}") - - post_data = kwargs.get("post_data", {}) - if len(post_data.items()) > 0: - curl_command.append("-d") - post_data_str = "" - for k, v in post_data.items(): - post_data_str += f"&{k}={v}" - curl_command.append(post_data_str.lstrip("&")) - - method = kwargs.get("method", "") - if method: - curl_command.append("-X") - curl_command.append(method) - - cookies = kwargs.get("cookies", "") - if cookies: - curl_command.append("-b") - cookies_str = "" - for k, v in cookies.items(): - cookies_str += f"{k}={v}; " - curl_command.append(f'{cookies_str.rstrip(" ")}') - - path_override = kwargs.get("path_override", None) - if path_override: - curl_command.append("--request-target") - curl_command.append(f"{path_override}") - - head_mode = kwargs.get("head_mode", None) - if head_mode: - curl_command.append("-I") - - raw_body = kwargs.get("raw_body", 
None) - if raw_body: - curl_command.append("-d") - curl_command.append(raw_body) - - output_bytes = self.run(curl_command, text=False).stdout - output = self.smart_decode(output_bytes) - return output + curl_command.append(f"{k}: {v}") + + post_data = kwargs.get("post_data", {}) + if len(post_data.items()) > 0: + curl_command.append("-d") + post_data_str = "" + for k, v in post_data.items(): + post_data_str += f"&{k}={v}" + curl_command.append(post_data_str.lstrip("&")) + + method = kwargs.get("method", "") + if method: + curl_command.append("-X") + curl_command.append(method) + + cookies = kwargs.get("cookies", "") + if cookies: + curl_command.append("-b") + cookies_str = "" + for k, v in cookies.items(): + cookies_str += f"{k}={v}; " + curl_command.append(f'{cookies_str.rstrip(" ")}') + + path_override = kwargs.get("path_override", None) + if path_override: + curl_command.append("--request-target") + curl_command.append(f"{path_override}") + + head_mode = kwargs.get("head_mode", None) + if head_mode: + curl_command.append("-I") + + raw_body = kwargs.get("raw_body", None) + if raw_body: + curl_command.append("-d") + curl_command.append(raw_body) + + output = await self.run(curl_command).stdout + return output diff --git a/bbot/modules/base.py b/bbot/modules/base.py index e4c23e9d90..3f8ebedd86 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -119,7 +119,7 @@ def handle_batch(self, *events): """ pass - def filter_event(self, event): + async def filter_event(self, event): """ Accept/reject events based on custom criteria @@ -208,7 +208,7 @@ async def catch(self, *args, **kwargs): return await self.scan.manager.catch(*args, **kwargs) async def _postcheck_and_run(self, callback, event): - acceptable, reason = self._event_postcheck(event) + acceptable, reason = await self._event_postcheck(event) if not acceptable: if reason: self.debug(f"Not accepting {event} because {reason}") @@ -411,7 +411,7 @@ def _event_precheck(self, event): return False, "module consumes IP ranges directly" return True, "" - def _event_postcheck(self, event): + async def _event_postcheck(self, event): """ Check if an event should be accepted by the module Used when taking an event FROM the module's queue (immediately before it's handled) @@ -437,7 +437,7 @@ def _event_postcheck(self, event): # custom filtering try: - filter_result = self.filter_event(event) + filter_result = await self.filter_event(event) msg = str(self._custom_filter_criteria_msg) with suppress(ValueError, TypeError): filter_result, reason = filter_result diff --git a/bbot/modules/crobat.py b/bbot/modules/crobat.py index a5cc90599e..66c0f70b62 100644 --- a/bbot/modules/crobat.py +++ b/bbot/modules/crobat.py @@ -22,19 +22,19 @@ class crobat(BaseModule): # until the queue is ready to receive its results _qsize = 1 - def setup(self): + async def setup(self): self.processed = set() self.http_timeout = self.scan.config.get("http_timeout", 10) self._failures = 0 return True - def _is_wildcard(self, query): - for domain, wildcard_rdtypes in self.helpers.is_wildcard_domain(query).items(): + async def _is_wildcard(self, query): + for domain, wildcard_rdtypes in (await self.helpers.is_wildcard_domain(query)).items(): if any(t in wildcard_rdtypes for t in ("A", "AAAA", "CNAME")): return True return False - def filter_event(self, event): + async def filter_event(self, event): """ This filter_event is used across many modules """ @@ -42,16 +42,16 @@ def filter_event(self, event): # reject if already processed if self.already_processed(query): return 
False, "Event was already processed" - eligible, reason = self.eligible_for_enumeration(event) + eligible, reason = await self.eligible_for_enumeration(event) if eligible: self.processed.add(hash(query)) return True, reason return False, reason - def eligible_for_enumeration(self, event): + async def eligible_for_enumeration(self, event): query = self.make_query(event) # check if wildcard - is_wildcard = self._is_wildcard(query) + is_wildcard = await self._is_wildcard(query) # check if cloud is_cloud = False if any(t.startswith("cloud-") for t in event.tags): @@ -85,7 +85,7 @@ def abort_if(self, event): return True return False - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) results = self.query(query) if results: diff --git a/bbot/modules/internal/speculate.py b/bbot/modules/internal/speculate.py index 74e67ef507..7e9d65f969 100644 --- a/bbot/modules/internal/speculate.py +++ b/bbot/modules/internal/speculate.py @@ -104,7 +104,7 @@ async def handle_event(self, event): quick=True, ) - def filter_event(self, event): + async def filter_event(self, event): # don't accept IP_RANGE --> IP_ADDRESS events from self if str(event.module) == "speculate": if not (event.type == "IP_ADDRESS" and str(getattr(event.source, "type")) == "IP_RANGE"): diff --git a/bbot/modules/massdns.py b/bbot/modules/massdns.py index 718dc0eb58..e986206fa8 100644 --- a/bbot/modules/massdns.py +++ b/bbot/modules/massdns.py @@ -62,26 +62,26 @@ class massdns(crobat): digit_regex = re.compile(r"\d+") - def setup(self): + async def setup(self): self.found = dict() self.mutations_tried = set() self.source_events = dict() - self.subdomain_file = self.helpers.wordlist(self.config.get("wordlist")) + self.subdomain_file = await self.helpers.wordlist(self.config.get("wordlist")) self.max_resolvers = self.config.get("max_resolvers", 500) self.max_mutations = self.config.get("max_mutations", 500) nameservers_url = ( "https://raw.githubusercontent.com/blacklanternsecurity/public-dns-servers/master/nameservers.txt" ) - self.resolver_file = self.helpers.wordlist( + self.resolver_file = await self.helpers.wordlist( nameservers_url, cache_hrs=24 * 7, ) self.devops_mutations = list(self.helpers.word_cloud.devops_mutations) - return super().setup() + return await super().setup() - def filter_event(self, event): + async def filter_event(self, event): query = self.make_query(event) - eligible, reason = self.eligible_for_enumeration(event) + eligible, reason = await self.eligible_for_enumeration(event) if eligible: self.add_found(event) # reject if already processed @@ -92,14 +92,14 @@ def filter_event(self, event): return True, reason return False, reason - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) h = hash(query) if not h in self.source_events: self.source_events[h] = event self.info(f"Brute-forcing subdomains for {query}") - for hostname in self.massdns(query, self.helpers.read_file(self.subdomain_file)): + for hostname in await self.massdns(query, self.helpers.read_file(self.subdomain_file)): self.emit_result(hostname, event, query) def abort_if(self, event): @@ -118,33 +118,35 @@ def already_processed(self, hostname): return True return False - def massdns(self, domain, subdomains): + async def massdns(self, domain, subdomains): abort_msg = f"Aborting massdns on {domain} due to false positives" - if self._canary_check(domain): + if await self._canary_check(domain): self.info(abort_msg) return [] - results = 
list(self._massdns(domain, subdomains)) + results = [l async for l in self._massdns(domain, subdomains)] if len(results) > 50: - if self._canary_check(domain): + if await self._canary_check(domain): self.info(abort_msg) return [] self.verbose(f"Resolving batch of {len(results):,} results") - resolved = dict(self.helpers.resolve_batch(results, type=("A", "AAAA", "CNAME"), cache_result=True)) + resolved = dict( + [l async for l in self.helpers.resolve_batch(results, type=("A", "AAAA", "CNAME"), cache_result=True)] + ) resolved = {k: v for k, v in resolved.items() if v} for hostname in resolved: self.add_found(hostname) return list(resolved) - def _canary_check(self, domain, num_checks=50): + async def _canary_check(self, domain, num_checks=50): random_subdomains = list(self.gen_random_subdomains(num_checks)) self.verbose(f"Testing {len(random_subdomains):,} canaries against {domain}") - canary_results = list(self._massdns(domain, random_subdomains)) + canary_results = [l async for l in self._massdns(domain, random_subdomains)] for result in canary_results: - if self.helpers.resolve(result): + if await self.helpers.resolve(result): return True return False - def _massdns(self, domain, subdomains): + async def _massdns(self, domain, subdomains): """ { "name": "www.blacklanternsecurity.com.", @@ -176,7 +178,7 @@ def _massdns(self, domain, subdomains): return domain_wildcard_rdtypes = set() - for domain, rdtypes in self.helpers.is_wildcard_domain(domain).items(): + for domain, rdtypes in (await self.helpers.is_wildcard_domain(domain)).items(): for rdtype, results in rdtypes.items(): if results: domain_wildcard_rdtypes.add(rdtype) @@ -197,7 +199,7 @@ def _massdns(self, domain, subdomains): ) subdomains = self.gen_subdomains(subdomains, domain) hosts_yielded = set() - for line in self.helpers.run_live(command, stderr=subprocess.DEVNULL, input=subdomains): + async for line in self.helpers.run_live(command, stderr=subprocess.DEVNULL, input=subdomains): try: j = json.loads(line) except json.decoder.JSONDecodeError: @@ -222,7 +224,7 @@ def _massdns(self, domain, subdomains): f"Skipping {hostname}:{rdtype} because it may be a wildcard (reason: performance)" ) continue - wildcard_rdtypes = self.helpers.is_wildcard(hostname, ips=(data,)) + wildcard_rdtypes = await self.helpers.is_wildcard(hostname, ips=(data,)) if rdtype in wildcard_rdtypes: self.debug(f"Skipping {hostname}:{rdtype} because it's a wildcard") continue @@ -231,7 +233,7 @@ def _massdns(self, domain, subdomains): hosts_yielded.add(hostname_hash) yield hostname - def finish(self): + async def finish(self): found = sorted(self.found.items(), key=lambda x: len(x[-1]), reverse=True) # if we have a lot of rounds to make, don't try mutations on less-populated domains trimmed_found = [] @@ -310,7 +312,7 @@ def add_mutation(_domain_hash, m): if mutations: self.info(f"Trying {len(mutations):,} mutations against {domain} ({i+1}/{len(found)})") - results = list(self.massdns(query, mutations)) + results = list(await self.massdns(query, mutations)) for hostname in results: source_event = self.get_source_event(hostname) if source_event is None: @@ -334,7 +336,7 @@ def add_found(self, host): except KeyError: self.found[domain] = set((subdomain,)) - def gen_subdomains(self, prefixes, domain): + async def gen_subdomains(self, prefixes, domain): for p in prefixes: d = f"{p}.{domain}" yield d diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index 465d2f7a4a..df7bb80e15 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -193,7 
+193,7 @@ async def start(self): self.warning(f"No scan targets specified") # start status ticker - ticker_task = asyncio.create_task(self._status_ticker(self.)) + ticker_task = asyncio.create_task(self._status_ticker(self.status_frequency)) scan_start_time = datetime.now() try: @@ -322,7 +322,7 @@ async def setup_modules(self, remove_failed=True): hard_failed = [] soft_failed = [] - for task in asyncio.as_completed([m._setup() for m in self.modules.values()]): + for task in asyncio.as_completed([asyncio.create_task(m._setup()) for m in self.modules.values()]): module_name, status, msg = await task if status == True: self.debug(f"Setup succeeded for {module_name} ({msg})") diff --git a/bbot/test/test_step_2/test_command.py b/bbot/test/test_step_2/test_command.py new file mode 100644 index 0000000000..ad27ea1f5b --- /dev/null +++ b/bbot/test/test_step_2/test_command.py @@ -0,0 +1,63 @@ +from ..bbot_fixtures import * + + +@pytest.mark.asyncio +async def test_command(bbot_scanner, bbot_config): + scan1 = bbot_scanner(config=bbot_config) + + # run + assert "plumbus\n" == (await scan1.helpers.run(["echo", "plumbus"])).stdout + result = (await scan1.helpers.run(["cat"], input="some\nrandom\nstdin")).stdout + assert result.splitlines() == ["some", "random", "stdin"] + + # run_live + lines = [] + async for line in scan1.helpers.run_live(["echo", "plumbus"]): + lines.append(line) + assert lines == ["plumbus"] + lines = [] + async for line in scan1.helpers.run_live(["cat"], input="some\nrandom\nstdin"): + lines.append(line) + assert lines == ["some", "random", "stdin"] + + # test piping + lines = [] + async for line in scan1.helpers.run_live( + ["cat"], input=scan1.helpers.run_live(["echo", "-en", r"some\nrandom\nstdin"]) + ): + lines.append(line) + log.critical(lines) + assert lines == ["some", "random", "stdin"] + + # test missing executable + result = await scan1.helpers.run(["sgkjlskdfsdf"]) + assert result is None + + # test sudo + existence of environment variables + scan1.load_modules() + path_parts = os.environ.get("PATH", "").split(":") + assert "/tmp/.bbot_test/tools" in path_parts + run_lines = (await scan1.helpers.run(["env"])).stdout.splitlines() + assert f"BBOT_PLUMBUS=asdf" in run_lines + for line in run_lines: + if line.startswith("PATH="): + path_parts = line.split("=", 1)[-1].split(":") + assert "/tmp/.bbot_test/tools" in path_parts + run_lines_sudo = (await scan1.helpers.run(["env"], sudo=True)).stdout.splitlines() + assert f"BBOT_PLUMBUS=asdf" in run_lines_sudo + for line in run_lines_sudo: + if line.startswith("PATH="): + path_parts = line.split("=", 1)[-1].split(":") + assert "/tmp/.bbot_test/tools" in path_parts + run_live_lines = [l async for l in scan1.helpers.run_live(["env"])] + assert f"BBOT_PLUMBUS=asdf" in run_live_lines + for line in run_live_lines: + if line.startswith("PATH="): + path_parts = line.strip().split("=", 1)[-1].split(":") + assert "/tmp/.bbot_test/tools" in path_parts + run_live_lines_sudo = [l async for l in scan1.helpers.run_live(["env"], sudo=True)] + assert f"BBOT_PLUMBUS=asdf" in run_live_lines_sudo + for line in run_live_lines_sudo: + if line.startswith("PATH="): + path_parts = line.strip().split("=", 1)[-1].split(":") + assert "/tmp/.bbot_test/tools" in path_parts diff --git a/bbot/test/test_step_2/test_files.py b/bbot/test/test_step_2/test_files.py new file mode 100644 index 0000000000..210a6342f2 --- /dev/null +++ b/bbot/test/test_step_2/test_files.py @@ -0,0 +1,22 @@ +from time import sleep + +from ..bbot_fixtures import * + + 
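
The piping test in test_command.py above chains two run_live() calls, feeding one command's output into another command's stdin. Below is a minimal standalone sketch of the asyncio pattern behind it, using only the standard library; the helper here is illustrative, not BBOT's actual implementation, and GNU echo's -en flags are assumed:

import asyncio

async def run_live(*command, input=None):
    # Minimal stand-in for helpers.run_live(): stream stdout line by line,
    # optionally feeding stdin from an async generator so calls can be piped.
    proc = await asyncio.create_subprocess_exec(
        *command, stdin=asyncio.subprocess.PIPE, stdout=asyncio.subprocess.PIPE
    )
    writer = None
    if input is not None:

        async def feed_stdin():
            async for chunk in input:
                proc.stdin.write(chunk.encode() + b"\n")
                await proc.stdin.drain()
            proc.stdin.close()

        writer = asyncio.create_task(feed_stdin())
    async for line in proc.stdout:
        yield line.decode().rstrip("\r\n")
    if writer is not None:
        await writer
    await proc.wait()

async def main():
    # pipe echo's output into cat, as in the test above
    async for line in run_live("cat", input=run_live("echo", "-en", r"some\nrandom\nstdin")):
        print(line)

asyncio.run(main())

The same scheduling idea appears in the setup_modules() fix above: wrapping each coroutine in asyncio.create_task() starts it immediately, so asyncio.as_completed() can yield results in completion order.
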
+@pytest.mark.asyncio +async def test_files(bbot_scanner, bbot_config): + scan1 = bbot_scanner(config=bbot_config) + + # tempfile + tempfile = scan1.helpers.tempfile(("line1", "line2"), pipe=False) + assert list(scan1.helpers.read_file(tempfile)) == ["line1", "line2"] + tempfile = scan1.helpers.tempfile(("line1", "line2"), pipe=True) + assert list(scan1.helpers.read_file(tempfile)) == ["line1", "line2"] + + # tempfile tail + results = [] + tempfile = scan1.helpers.tempfile_tail(callback=lambda x: results.append(x)) + with open(tempfile, "w") as f: + f.write("asdf\n") + sleep(0.1) + assert "asdf" in results diff --git a/bbot/test/test_step_2/test_helpers.py b/bbot/test/test_step_2/test_helpers.py index 5ea38e8ff6..e3f9bc1d3b 100644 --- a/bbot/test/test_step_2/test_helpers.py +++ b/bbot/test/test_step_2/test_helpers.py @@ -2,7 +2,6 @@ import datetime import ipaddress import requests_mock -from time import sleep from ..bbot_fixtures import * @@ -351,72 +350,6 @@ def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver): helpers.recursive_decode(r"Hello\\nWorld\\\tGreetings\\\\nMore\nText") == "Hello\nWorld\tGreetings\nMore\nText" ) - def raise_filenotfound(): - raise FileNotFoundError("asdf") - - def raise_brokenpipe(): - raise BrokenPipeError("asdf") - - from bbot.core.helpers import command - - command.catch(raise_filenotfound) - command.catch(raise_brokenpipe) - - ### COMMAND ### - scan1 = bbot_scanner(config=bbot_config) - assert "plumbus\n" in scan1.helpers.run(["echo", "plumbus"], text=True).stdout - assert "plumbus\n" in list(scan1.helpers.run_live(["echo", "plumbus"])) - expected_output = ["lumbus\n", "plumbus\n", "rumbus\n"] - assert list(scan1.helpers.run_live(["cat"], input="lumbus\nplumbus\nrumbus")) == expected_output - - def plumbus_generator(): - yield "lumbus" - yield "plumbus" - - assert "plumbus\n" in list(scan1.helpers.run_live(["cat"], input=plumbus_generator())) - tempfile = helpers.tempfile(("lumbus", "plumbus"), pipe=True) - with open(tempfile) as f: - assert "plumbus\n" in list(f) - tempfile = helpers.tempfile(("lumbus", "plumbus"), pipe=False) - with open(tempfile) as f: - assert "plumbus\n" in list(f) - - results = [] - tempfile = helpers.tempfile_tail(callback=lambda x: results.append(x)) - with open(tempfile, "w") as f: - f.write("asdf\n") - sleep(0.1) - assert "asdf" in results - - # test sudo + existence of environment variables - scan1.load_modules() - path_parts = os.environ.get("PATH", "").split(":") - assert "/tmp/.bbot_test/tools" in path_parts - run_lines = scan1.helpers.run(["env"]).stdout.splitlines() - assert f"BBOT_PLUMBUS=asdf" in run_lines - for line in run_lines: - if line.startswith("PATH="): - path_parts = line.split("=", 1)[-1].split(":") - assert "/tmp/.bbot_test/tools" in path_parts - run_lines_sudo = scan1.helpers.run(["env"], sudo=True).stdout.splitlines() - assert f"BBOT_PLUMBUS=asdf" in run_lines_sudo - for line in run_lines_sudo: - if line.startswith("PATH="): - path_parts = line.split("=", 1)[-1].split(":") - assert "/tmp/.bbot_test/tools" in path_parts - run_live_lines = list(scan1.helpers.run_live(["env"])) - assert f"BBOT_PLUMBUS=asdf\n" in run_live_lines - for line in run_live_lines: - if line.startswith("PATH="): - path_parts = line.strip().split("=", 1)[-1].split(":") - assert "/tmp/.bbot_test/tools" in path_parts - run_live_lines_sudo = list(scan1.helpers.run_live(["env"], sudo=True)) - assert f"BBOT_PLUMBUS=asdf\n" in run_live_lines_sudo - for line in run_live_lines_sudo: - if line.startswith("PATH="): - 
path_parts = line.strip().split("=", 1)[-1].split(":") - assert "/tmp/.bbot_test/tools" in path_parts - ### CACHE ### helpers.cache_put("string", "wat") helpers.cache_put("binary", b"wat") @@ -444,32 +377,6 @@ def plumbus_generator(): assert len(cache_dict) == 10 assert tuple(cache_dict) == tuple(hash(str(x)) for x in range(10, 20)) - ### WEB ### - with requests_mock.Mocker() as m: - # test base request - m.get("http://blacklanternsecurity.com/yep", text="yep") - assert getattr(helpers.request("http://blacklanternsecurity.com/yep"), "text", "") == "yep" - # test cached request - m.get("http://blacklanternsecurity.com/yepyep", text="yepyep") - assert getattr(helpers.request("http://blacklanternsecurity.com/yepyep", cache_for=60), "text", "") == "yepyep" - # test caching - m.get("http://blacklanternsecurity.com/yepyep", text="nope") - assert getattr(helpers.request("http://blacklanternsecurity.com/yepyep", cache_for=60), "text", "") == "yepyep" - # test downloading - m.get("http://blacklanternsecurity.com/download", text="downloaded") - filename = helpers.download("http://blacklanternsecurity.com/download", cache_hrs=1) - assert Path(str(filename)).is_file() - assert helpers.is_cached("http://blacklanternsecurity.com/download") - # test wordlist - m.get("http://blacklanternsecurity.com/wordlist", text="wordlist") - assert helpers.wordlist("http://blacklanternsecurity.com/wordlist").is_file() - - # custom headers - bbot_httpserver.expect_request("/test-custom-http-headers-requests", headers={"test": "header"}).respond_with_data( - "OK" - ) - assert scan.helpers.request(bbot_httpserver.url_for("/test-custom-http-headers-requests")).status_code == 200 - test_file = Path(scan.config["home"]) / "testfile.asdf" with open(test_file, "w") as f: for i in range(100): diff --git a/bbot/test/test_step_2/test_http.py b/bbot/test/test_step_2/test_http.py index 47b6c584dc..0fa4d9091e 100644 --- a/bbot/test/test_step_2/test_http.py +++ b/bbot/test/test_step_2/test_http.py @@ -17,10 +17,10 @@ async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): bbot_httpserver.expect_request(uri="/test_http_helpers", headers=headers).respond_with_data( "test_http_helpers_yep" ) - response = await scan1.helpers.request_async(url) + response = await scan1.helpers.request(url) # should fail because URL is not in-scope assert response.status_code == 500 - response = await scan2.helpers.request_async(url) + response = await scan2.helpers.request(url) # should suceed because URL is in-scope assert response.status_code == 200 assert response.text == "test_http_helpers_yep" @@ -30,7 +30,7 @@ async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): url = bbot_httpserver.url_for(path) download_content = "test_http_helpers_download_yep" bbot_httpserver.expect_request(uri=path).respond_with_data(download_content) - filename = await scan1.helpers.download_async(url) + filename = await scan1.helpers.download(url) assert Path(str(filename)).is_file() assert scan1.helpers.is_cached(url) with open(filename) as f: @@ -40,7 +40,7 @@ async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): url = bbot_httpserver.url_for(path) download_content = "404" bbot_httpserver.expect_request(uri=path).respond_with_data(download_content, status=404) - filename = await scan1.helpers.download_async(url) + filename = await scan1.helpers.download(url) assert filename is None assert not scan1.helpers.is_cached(url) @@ -49,11 +49,45 @@ async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): url 
= bbot_httpserver.url_for(path) download_content = "a\ncool\nword\nlist" bbot_httpserver.expect_request(uri=path).respond_with_data(download_content) - filename = await scan1.helpers.wordlist_async(url) + filename = await scan1.helpers.wordlist(url) assert Path(str(filename)).is_file() assert scan1.helpers.is_cached(url) - with open(filename) as f: - assert f.read().splitlines() == ["a", "cool", "word", "list"] + assert list(scan1.helpers.read_file(filename)) == ["a", "cool", "word", "list"] + + # page iteration + base_path = "/test_http_page_iteration" + template_path = base_path + "/{page}?page_size={page_size}&offset={offset}" + template_url = bbot_httpserver.url_for(template_path) + bbot_httpserver.expect_request( + uri=f"{base_path}/1", query_string={"page_size": "100", "offset": "0"} + ).respond_with_data("page1") + bbot_httpserver.expect_request( + uri=f"{base_path}/2", query_string={"page_size": "100", "offset": "100"} + ).respond_with_data("page2") + bbot_httpserver.expect_request( + uri=f"{base_path}/3", query_string={"page_size": "100", "offset": "200"} + ).respond_with_data("page3") + results = [] + agen = scan1.helpers.api_page_iter(template_url) + try: + async for result in agen: + if result and result.text.startswith("page"): + results.append(result) + else: + break + finally: + await agen.aclose() + assert not results + agen = scan1.helpers.api_page_iter(template_url, json=False) + try: + async for result in agen: + if result and result.text.startswith("page"): + results.append(result) + else: + break + finally: + await agen.aclose() + assert [r.text for r in results] == ["page1", "page2", "page3"] @pytest.mark.asyncio diff --git a/poetry.lock b/poetry.lock index f0fdf18237..3141b7e3fc 100644 --- a/poetry.lock +++ b/poetry.lock @@ -1319,21 +1319,21 @@ files = [ [[package]] name = "requests" -version = "2.28.2" +version = "2.30.0" description = "Python HTTP for Humans." 
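
The page-iteration tests above drive api_page_iter(), an async generator that formats page/offset values into a URL template and must be closed explicitly when the consumer bails out early. A minimal sketch of that pattern follows, assuming httpx (the client this patch series standardizes on); the template fields and stop condition are illustrative:

import httpx

async def api_page_iter(url_template, page_size=100):
    # Async generator: format page/offset into the URL template and yield
    # one response per page until the consumer breaks out and closes us.
    page, offset = 1, 0
    async with httpx.AsyncClient() as client:
        while True:
            yield await client.get(url_template.format(page=page, page_size=page_size, offset=offset))
            offset += page_size
            page += 1

async def fetch_all_pages(url_template):
    results = []
    agen = api_page_iter(url_template)
    try:
        async for response in agen:
            if not response.text.startswith("page"):  # illustrative stop condition
                break
            results.append(response.text)
    finally:
        # aclose() unwinds the generator so the AsyncClient's context manager
        # exits cleanly even when the consumer stops early.
        await agen.aclose()
    return results
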
category = "main" optional = false -python-versions = ">=3.7, <4" +python-versions = ">=3.7" files = [ - {file = "requests-2.28.2-py3-none-any.whl", hash = "sha256:64299f4909223da747622c030b781c0d7811e359c37124b4bd368fb8c6518baa"}, - {file = "requests-2.28.2.tar.gz", hash = "sha256:98b1b2782e3c6c4904938b84c0eb932721069dfdb9134313beff7c83c2df24bf"}, + {file = "requests-2.30.0-py3-none-any.whl", hash = "sha256:10e94cc4f3121ee6da529d358cdaeaff2f1c409cd377dbc72b825852f2f7e294"}, + {file = "requests-2.30.0.tar.gz", hash = "sha256:239d7d4458afcb28a692cdd298d87542235f4ca8d36d03a15bfc128a6559a2f4"}, ] [package.dependencies] certifi = ">=2017.4.17" charset-normalizer = ">=2,<4" idna = ">=2.5,<4" -urllib3 = ">=1.21.1,<1.27" +urllib3 = ">=1.21.1,<3" [package.extras] socks = ["PySocks (>=1.5.6,!=1.5.7)"] @@ -1705,4 +1705,4 @@ xmltodict = ">=0.12.0,<0.13.0" [metadata] lock-version = "2.0" python-versions = "^3.9" -content-hash = "7d520e30d4c148bb627da6aea282645e5e3452faeb11798bef27ae81d1941f88" +content-hash = "5366646b07e8aa2c1189f64e976bab2ec624855eb5943bde2710376c8e115305" diff --git a/pyproject.toml b/pyproject.toml index cebea306f8..d8b6f50fc0 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -17,7 +17,6 @@ omegaconf = "^2.3.0" tldextract = "^3.4.0" psutil = "^5.9.4" wordninja = "^2.0.0" -requests = "^2.28.2" dnspython = "^2.3.0" pydantic = "^1.10.6" ansible-runner = "^2.3.2" From 0592f4b7f42c1a2b6d0f3115fc877b2fd0acd5ec Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 8 May 2023 17:00:32 -0400 Subject: [PATCH 008/387] better command tests --- bbot/core/helpers/command.py | 21 +++++++++++---------- bbot/core/helpers/helper.py | 2 +- bbot/test/test_step_2/test_command.py | 8 +++++++- 3 files changed, 19 insertions(+), 12 deletions(-) diff --git a/bbot/core/helpers/command.py b/bbot/core/helpers/command.py index 65b376bf66..426d76333e 100644 --- a/bbot/core/helpers/command.py +++ b/bbot/core/helpers/command.py @@ -15,7 +15,7 @@ async def run(self, *command, **kwargs): process = await run(["ls", "/tmp"]) process.stdout --> "file1.txt\nfile2.txt" """ - proc, _input = await self._spawn_proc(*command, **kwargs) + proc, _input, command = await self._spawn_proc(*command, **kwargs) if proc is not None: if _input is not None: _input = smart_encode(_input) @@ -26,7 +26,7 @@ async def run(self, *command, **kwargs): stdout = smart_decode(stdout) if stderr and proc.returncode != 0: command_str = " ".join(command) - log.warning(f"Stderr for {command_str}:\n\t{stderr}") + log.warning(f"Stderr for run({command_str}):\n\t{stderr}") return CompletedProcess(command, proc.returncode, stdout, stderr) @@ -37,7 +37,7 @@ async def run_live(self, *command, **kwargs): async for line in run_live(["ls", "/tmp"]): log.info(line) """ - proc, _input = await self._spawn_proc(*command, **kwargs) + proc, _input, command = await self._spawn_proc(*command, **kwargs) if proc is not None: input_task = None if _input is not None: @@ -54,13 +54,14 @@ async def run_live(self, *command, **kwargs): await proc.wait() # surface stderr - # if proc.stderr and proc.returncode != 0: - # command_str = " ".join(command) - # log.warning(f"Stderr for {command_str}:\n\t{stderr}") + if proc.returncode != 0: + stdout, stderr = await proc.communicate() + command_str = " ".join(command) + log.warning(f"Stderr for run_live({command_str}):\n\t{smart_decode(stderr)}") async def _spawn_proc(self, *command, **kwargs): - command, kwargs = self._prepare_command_kwargs_async(command, kwargs) + command, kwargs = self._prepare_command_kwargs(command, 
kwargs) _input = kwargs.pop("input", None) if _input is not None: if kwargs.get("stdin") is not None: @@ -70,11 +71,11 @@ async def _spawn_proc(self, *command, **kwargs): log.hugeverbose(f"run: {' '.join(command)}") try: proc = await asyncio.create_subprocess_exec(*command, **kwargs) - return proc, _input + return proc, _input, command except FileNotFoundError as e: log.warning(f"{e} - missing executable?") log.trace(traceback.format_exc()) - return None, None + return None, None, None async def _write_stdin(proc, _input): @@ -88,7 +89,7 @@ async def _write_stdin(proc, _input): proc.stdin.close() -def _prepare_command_kwargs_async(self, command, kwargs): +def _prepare_command_kwargs(self, command, kwargs): if not "stdout" in kwargs: kwargs["stdout"] = asyncio.subprocess.PIPE if not "stderr" in kwargs: diff --git a/bbot/core/helpers/helper.py b/bbot/core/helpers/helper.py index cff12d7848..f25578d30b 100644 --- a/bbot/core/helpers/helper.py +++ b/bbot/core/helpers/helper.py @@ -23,8 +23,8 @@ class ConfigAwareHelper: from . import regexes from . import validators from .files import tempfile, feed_pipe, _feed_pipe, tempfile_tail + from .command import run, run_live, _spawn_proc, _prepare_command_kwargs from .cache import cache_get, cache_put, cache_filename, is_cached, CacheDict - from .command import run, run_live, _spawn_proc, _prepare_command_kwargs_async def __init__(self, config, scan=None): self.config = config diff --git a/bbot/test/test_step_2/test_command.py b/bbot/test/test_step_2/test_command.py index ad27ea1f5b..db2a069290 100644 --- a/bbot/test/test_step_2/test_command.py +++ b/bbot/test/test_step_2/test_command.py @@ -26,12 +26,18 @@ async def test_command(bbot_scanner, bbot_config): ["cat"], input=scan1.helpers.run_live(["echo", "-en", r"some\nrandom\nstdin"]) ): lines.append(line) - log.critical(lines) assert lines == ["some", "random", "stdin"] # test missing executable result = await scan1.helpers.run(["sgkjlskdfsdf"]) assert result is None + lines = [l async for l in scan1.helpers.run_live(["ljhsdghsdf"])] + assert not lines + # test stderr + result = await scan1.helpers.run(["ls", "/sldikgjasldkfsdf"]) + assert "No such file or directory" in result.stderr + lines = [l async for l in scan1.helpers.run_live(["ls", "/sldikgjasldkfsdf"])] + assert not lines # test sudo + existence of environment variables scan1.load_modules() From 65080555b707f6e2b06d8302cc49bdd4460a91a9 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 8 May 2023 17:08:50 -0400 Subject: [PATCH 009/387] asyncified curl --- bbot/core/helpers/web.py | 12 +++--- bbot/test/test_step_1/test_before_patching.py | 34 ----------------- .../test_step_2/{test_http.py => test_web.py} | 37 ++++++++++++++++++- 3 files changed, 41 insertions(+), 42 deletions(-) delete mode 100644 bbot/test/test_step_1/test_before_patching.py rename bbot/test/test_step_2/{test_http.py => test_web.py} (72%) diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index 3d44e298cc..ba642d3554 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -183,7 +183,7 @@ async def curl(self, *args, **kwargs): curl_command.append("--path-as-is") # respect global ssl verify settings - ssl_verify = self.config.get("ssl_verify") + ssl_verify = self.parent_helper.config.get("ssl_verify") if ssl_verify == False: curl_command.append("-k") @@ -194,15 +194,15 @@ async def curl(self, *args, **kwargs): if ignore_bbot_global_settings: log.debug("ignore_bbot_global_settings enabled. 
Global settings will not be applied") else: - http_timeout = self.config.get("http_timeout", 20) - user_agent = self.config.get("user_agent", "BBOT") + http_timeout = self.parent_helper.config.get("http_timeout", 20) + user_agent = self.parent_helper.config.get("user_agent", "BBOT") if "User-Agent" not in headers: headers["User-Agent"] = user_agent # only add custom headers if the URL is in-scope - if self.scan.in_scope(url): - for hk, hv in self.scan.config.get("http_headers", {}).items(): + if self.parent_helper.scan.in_scope(url): + for hk, hv in self.parent_helper.scan.config.get("http_headers", {}).items(): headers[hk] = hv # add the timeout @@ -257,5 +257,5 @@ async def curl(self, *args, **kwargs): curl_command.append("-d") curl_command.append(raw_body) - output = await self.run(curl_command).stdout + output = (await self.parent_helper.run(curl_command)).stdout return output diff --git a/bbot/test/test_step_1/test_before_patching.py b/bbot/test/test_step_1/test_before_patching.py deleted file mode 100644 index 5fe26b0fba..0000000000 --- a/bbot/test/test_step_1/test_before_patching.py +++ /dev/null @@ -1,34 +0,0 @@ -from ..bbot_fixtures import * # noqa: F401 -from bbot.scanner import Scanner - - -def test_curl(bbot_httpserver, bbot_config): - scan = Scanner("127.0.0.1", config=bbot_config) - helpers = scan.helpers - url = bbot_httpserver.url_for("/curl") - bbot_httpserver.expect_request(uri="/curl").respond_with_data("curl_yep") - bbot_httpserver.expect_request(uri="/index.html").respond_with_data("curl_yep_index") - assert helpers.curl(url=url) == "curl_yep" - assert helpers.curl(url=url, ignore_bbot_global_settings=True) == "curl_yep" - assert helpers.curl(url=url, head_mode=True).startswith("HTTP/") - assert helpers.curl(url=url, raw_body="body") == "curl_yep" - assert ( - helpers.curl( - url=url, - raw_path=True, - headers={"test": "test", "test2": ["test2"]}, - ignore_bbot_global_settings=False, - post_data={"test": "test"}, - method="POST", - cookies={"test": "test"}, - path_override="/index.html", - ) - == "curl_yep_index" - ) - # test custom headers - bbot_httpserver.expect_request("/test-custom-http-headers-curl", headers={"test": "header"}).respond_with_data( - "curl_yep_headers" - ) - headers_url = bbot_httpserver.url_for("/test-custom-http-headers-curl") - curl_result = helpers.curl(url=headers_url) - assert curl_result == "curl_yep_headers" diff --git a/bbot/test/test_step_2/test_http.py b/bbot/test/test_step_2/test_web.py similarity index 72% rename from bbot/test/test_step_2/test_http.py rename to bbot/test/test_step_2/test_web.py index 0fa4d9091e..323abf8c6f 100644 --- a/bbot/test/test_step_2/test_http.py +++ b/bbot/test/test_step_2/test_web.py @@ -2,7 +2,7 @@ @pytest.mark.asyncio -async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): +async def test_web_helpers(bbot_scanner, bbot_config, bbot_httpserver): scan1 = bbot_scanner("8.8.8.8", config=bbot_config) scan2 = bbot_scanner("127.0.0.1", config=bbot_config) @@ -91,7 +91,7 @@ async def test_http_helpers(bbot_scanner, bbot_config, bbot_httpserver): @pytest.mark.asyncio -async def test_http_interactsh(bbot_scanner, bbot_config, bbot_httpserver): +async def test_web_interactsh(bbot_scanner, bbot_config, bbot_httpserver): from bbot.core.helpers.interactsh import server_list scan1 = bbot_scanner("8.8.8.8", config=bbot_config) @@ -106,3 +106,36 @@ async def async_callback(data): data_list = await interactsh_client.poll() assert isinstance(data_list, list) assert await interactsh_client.deregister() is 
None + + +@pytest.mark.asyncio +async def test_web_curl(bbot_scanner, bbot_config, bbot_httpserver): + scan = bbot_scanner("127.0.0.1", config=bbot_config) + helpers = scan.helpers + url = bbot_httpserver.url_for("/curl") + bbot_httpserver.expect_request(uri="/curl").respond_with_data("curl_yep") + bbot_httpserver.expect_request(uri="/index.html").respond_with_data("curl_yep_index") + assert await helpers.curl(url=url) == "curl_yep" + assert await helpers.curl(url=url, ignore_bbot_global_settings=True) == "curl_yep" + assert (await helpers.curl(url=url, head_mode=True)).startswith("HTTP/") + assert await helpers.curl(url=url, raw_body="body") == "curl_yep" + assert ( + await helpers.curl( + url=url, + raw_path=True, + headers={"test": "test", "test2": ["test2"]}, + ignore_bbot_global_settings=False, + post_data={"test": "test"}, + method="POST", + cookies={"test": "test"}, + path_override="/index.html", + ) + == "curl_yep_index" + ) + # test custom headers + bbot_httpserver.expect_request("/test-custom-http-headers-curl", headers={"test": "header"}).respond_with_data( + "curl_yep_headers" + ) + headers_url = bbot_httpserver.url_for("/test-custom-http-headers-curl") + curl_result = await helpers.curl(url=headers_url) + assert curl_result == "curl_yep_headers" From 229c381fc0b0b1d4ddf403b112746ef192a69dd6 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Wed, 10 May 2023 14:01:05 -0400 Subject: [PATCH 010/387] httpx working --- bbot/agent/agent.py | 2 +- bbot/cli.py | 9 +- bbot/core/errors.py | 6 +- bbot/core/helpers/command.py | 22 ++- bbot/core/helpers/dns.py | 42 +++--- bbot/core/helpers/interactsh.py | 3 +- bbot/core/helpers/misc.py | 21 +++ bbot/core/logger/logger.py | 1 + bbot/modules/base.py | 184 +++++++++++--------------- bbot/modules/httpx.py | 8 +- bbot/modules/internal/speculate.py | 4 +- bbot/modules/massdns.py | 9 +- bbot/modules/naabu.py | 10 +- bbot/modules/paramminer_cookies.py | 3 - bbot/modules/paramminer_getparams.py | 3 - bbot/modules/paramminer_headers.py | 6 +- bbot/modules/report/asn.py | 3 - bbot/scanner/manager.py | 130 +++++------------- bbot/scanner/scanner.py | 168 ++++++++++++++++------- bbot/test/test_step_2/test_command.py | 6 + bbot/test/test_step_2/test_manager.py | 21 +-- 21 files changed, 329 insertions(+), 332 deletions(-) diff --git a/bbot/agent/agent.py b/bbot/agent/agent.py index be61e2d129..3076119bef 100644 --- a/bbot/agent/agent.py +++ b/bbot/agent/agent.py @@ -137,7 +137,7 @@ def stop_scan(self): log.warning(msg) return {"error": msg} scan_id = str(self.scan.id) - self.scan.stop(wait=True) + self.scan.stop() msg = f"Stopped scan {scan_id}" log.warning(msg) self.scan = None diff --git a/bbot/cli.py b/bbot/cli.py index c1c637839f..8538e269d2 100755 --- a/bbot/cli.py +++ b/bbot/cli.py @@ -320,12 +320,9 @@ def keyboard_listen(): os._exit(1) # debug troublesome modules - """ - from time import sleep - while 1: - scanner.manager.modules_status(_log=True) - sleep(1) - """ + # while 1: + # await scanner.manager.modules_status(_log=True) + # await asyncio.sleep(1) def main(): diff --git a/bbot/core/errors.py b/bbot/core/errors.py index ee93ee6065..24c94d4343 100644 --- a/bbot/core/errors.py +++ b/bbot/core/errors.py @@ -1,4 +1,4 @@ -from requests.exceptions import RequestException # noqa F401 +from httpx import RequestError # noqa class BBOTError(Exception): @@ -9,10 +9,6 @@ class ScanError(BBOTError): pass -class ScanCancelledError(BBOTError): - pass - - class ValidationError(BBOTError): pass diff --git a/bbot/core/helpers/command.py 
b/bbot/core/helpers/command.py index 426d76333e..219fa1bc73 100644 --- a/bbot/core/helpers/command.py +++ b/bbot/core/helpers/command.py @@ -18,7 +18,10 @@ async def run(self, *command, **kwargs): proc, _input, command = await self._spawn_proc(*command, **kwargs) if proc is not None: if _input is not None: - _input = smart_encode(_input) + if isinstance(_input, (list, tuple)): + _input = b"\n".join(smart_encode(i) for i in _input) + b"\n" + else: + _input = smart_encode(_input) stdout, stderr = await proc.communicate(_input) # surface stderr @@ -50,14 +53,18 @@ async def run_live(self, *command, **kwargs): yield smart_decode(line).rstrip("\r\n") if input_task is not None: - await input_task + try: + await input_task + except BrokenPipeError: + log.trace(traceback.format_exc()) await proc.wait() # surface stderr if proc.returncode != 0: stdout, stderr = await proc.communicate() - command_str = " ".join(command) - log.warning(f"Stderr for run_live({command_str}):\n\t{smart_decode(stderr)}") + if stderr: + command_str = " ".join(command) + log.warning(f"Stderr for run_live({command_str}):\n\t{smart_decode(stderr)}") async def _spawn_proc(self, *command, **kwargs): @@ -80,8 +87,11 @@ async def _spawn_proc(self, *command, **kwargs): async def _write_stdin(proc, _input): if _input is not None: - if isinstance(_input, str): - proc.stdin.write(smart_encode(_input)) + if isinstance(_input, (str, bytes)): + _input = [_input] + if isinstance(_input, (list, tuple)): + for chunk in _input: + proc.stdin.write(smart_encode(chunk) + b"\n") else: async for chunk in _input: proc.stdin.write(smart_encode(chunk) + b"\n") diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 56e24262fd..2e1bd093fd 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -72,11 +72,13 @@ async def resolve(self, query, **kwargs): } """ results = set() - raw_results, errors = await self.resolve_raw(query, **kwargs) - for rdtype, answers in raw_results: - for answer in answers: - for _, t in self.extract_targets(answer): - results.add(t) + r = await self.resolve_raw(query, **kwargs) + if r: + raw_results, errors = r + for rdtype, answers in raw_results: + for answer in answers: + for _, t in self.extract_targets(answer): + results.add(t) return results async def resolve_raw(self, query, **kwargs): @@ -350,22 +352,24 @@ def event_cache_get(self, host): except KeyError: return set(), None, None, set() + async def _resolve_batch_coro_wrapper(self, q, **kwargs): + """ + Helps us correlate task results back to their original arguments + """ + result = await self.resolve(q, **kwargs) + return (q, result) + async def resolve_batch(self, queries, **kwargs): """ - await resolve_batch("www.evilcorp.com", "evilcorp.com") --> [ + await resolve_batch(["www.evilcorp.com", "evilcorp.com"]) --> [ ("www.evilcorp.com", {"1.1.1.1"}), ("evilcorp.com", {"2.2.2.2"}) ] """ - async def coro_wrapper(q, **_kwargs): - """ - Helps us correlate task results back to their original arguments - """ - result = await self.resolve(q, **_kwargs) - return (q, result) - - for task in asyncio.as_completed([coro_wrapper(q, **kwargs) for q in queries]): + for task in asyncio.as_completed( + [asyncio.create_task(self._resolve_batch_coro_wrapper(q, **kwargs)) for q in queries] + ): yield await task def extract_targets(self, record): @@ -439,10 +443,6 @@ async def is_wildcard(self, query, ips=None, rdtype=None): # skip check if the query is a domain if is_domain(query): return {} - # skip check if the query's parent domain is excluded in the 
config - for d in self.wildcard_ignore: - if self.parent_helper.host_in_host(query, d): - return {} parent = parent_domain(query) parents = list(domain_parents(query)) @@ -513,6 +513,12 @@ async def is_wildcard_domain(self, domain, log_info=False): wildcard_domain_results = {} domain = self._clean_dns_record(domain) + # skip check if the query's parent domain is excluded in the config + for d in self.wildcard_ignore: + if self.parent_helper.host_in_host(domain, d): + log.debug(f"Skipping wildcard detection on {domain} because it is excluded in the config") + return {} + # make a list of its parents parents = list(domain_parents(domain, include_self=True)) # and check each of them, beginning with the highest parent (i.e. the root domain) diff --git a/bbot/core/helpers/interactsh.py b/bbot/core/helpers/interactsh.py index f3303960f4..6cb679b4e9 100644 --- a/bbot/core/helpers/interactsh.py +++ b/bbot/core/helpers/interactsh.py @@ -126,7 +126,8 @@ async def poll(self): return ret async def poll_loop(self, callback): - return await self.parent_helper.scan.manager.catch(self._poll_loop, callback, _force=True) + async with self.parent_helper.scan.acatch(context=self._poll_loop): + return await self._poll_loop(callback) async def _poll_loop(self, callback): while 1: diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index 8395d285a0..5e95899200 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -1031,3 +1031,24 @@ async def execute_sync_or_async(callback, *args, **kwargs): return await callback(*args, **kwargs) else: return callback(*args, **kwargs) + + +def get_exception_chain(e): + """ + Get the full chain of exceptions that led to the current one + """ + exception_chain = [] + current_exception = e + while current_exception is not None: + exception_chain.append(current_exception) + current_exception = getattr(current_exception, "__context__", None) + return exception_chain + + +def get_traceback_details(e): + tb = traceback.extract_tb(e.__traceback__) + last_frame = tb[-1] # Get the last frame in the traceback (the one where the exception was raised) + filename = last_frame.filename + lineno = last_frame.lineno + funcname = last_frame.name + return filename, lineno, funcname diff --git a/bbot/core/logger/logger.py b/bbot/core/logger/logger.py index c5668b1d89..e7ffe96628 100644 --- a/bbot/core/logger/logger.py +++ b/bbot/core/logger/logger.py @@ -221,6 +221,7 @@ def set_log_level(level, logger=None): _log_level_override = level log = logging.getLogger("bbot") log.setLevel(level) + logging.getLogger("asyncio").setLevel(level) def toggle_log_level(logger=None): diff --git a/bbot/modules/base.py b/bbot/modules/base.py index 3f8ebedd86..75c9f08c40 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -7,7 +7,7 @@ from ..core.helpers.misc import get_size from ..core.helpers.async_helpers import TaskCounter -from ..core.errors import ScanCancelledError, ValidationError, WordlistError +from ..core.errors import ValidationError, WordlistError class BaseModule: @@ -98,6 +98,8 @@ def __init__(self, scan): # track number of failures (for .request_with_fail_count()) self._request_failures = 0 + self._event_received = asyncio.Condition() + async def setup(self): """ Perform setup functions at the beginning of the scan. 
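
The new _event_received condition added to BaseModule above lets batch-mode workers sleep until queue_event() signals them, instead of busy-polling the queue. A stripped-down sketch of that producer/consumer wakeup, with hypothetical class and attribute names:

import asyncio

class BatchModule:
    # Hypothetical stand-in for BaseModule's batch worker, showing how an
    # asyncio.Condition replaces busy-polling.
    def __init__(self):
        self.incoming = asyncio.Queue()
        self.event_received = asyncio.Condition()

    async def queue_event(self, event):
        self.incoming.put_nowait(event)
        # notify() must be called with the condition's lock held
        async with self.event_received:
            self.event_received.notify()

    async def worker(self, batch_size=10):
        while True:
            batch = []
            while len(batch) < batch_size and not self.incoming.empty():
                batch.append(self.incoming.get_nowait())
            if batch:
                print(f"handling batch of {len(batch):,} events")
                continue
            async with self.event_received:
                # re-check under the lock to avoid a lost wakeup between
                # the empty() check above and this wait()
                if self.incoming.empty():
                    await self.event_received.wait()
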
@@ -200,56 +202,26 @@ def get_watched_events(self): self._watched_events = set(self.watched_events) return self._watched_events - def submit_task(self, *args, **kwargs): - kwargs["_block"] = False - return self.thread_pool.submit_task(self.catch, *args, **kwargs) - - async def catch(self, *args, **kwargs): - return await self.scan.manager.catch(*args, **kwargs) - - async def _postcheck_and_run(self, callback, event): - acceptable, reason = await self._event_postcheck(event) - if not acceptable: - if reason: - self.debug(f"Not accepting {event} because {reason}") - return - self.scan.stats.event_consumed(event, self) - return await callback(event) - - async def _register_running(self, callback, *args, **kwargs): - with self._task_counter: - return await callback(*args, **kwargs) - - def _handle_batch(self, force=False): + async def _handle_batch(self): + submitted = False if self.batch_size <= 1: return - if self.num_queued_events > 0 and (force or self.num_queued_events >= self.batch_size): - on_finish_callback = None - events, finish, report = self.events_waiting - if finish: - on_finish_callback = self.finish - elif report: - on_finish_callback = self.report - checked_events = [] - for e in events: - acceptable, reason = self._event_postcheck(e) - if not acceptable: - if reason: - self.debug(f"Not accepting {e} because {reason}") - continue - checked_events.append(e) - if checked_events: + if self.num_queued_events > 0: + events, finish, report = await self.events_waiting() + if not self.errored: self.debug(f"Handling batch of {len(events):,} events") - if not self.errored: - self._internal_thread_pool.submit_task( - self.catch, - self._register_running, - self.handle_batch, - *checked_events, - _on_finish_callback=on_finish_callback, - ) - return True - return False + if events: + submitted = True + async with self.scan.acatch(context=f"{self.name}.handle_batch"): + with self._task_counter: + await self.handle_batch(*events) + if finish: + async with self.scan.acatch(context=f"{self.name}.finish"): + await self.finish() + elif report: + async with self.scan.acatch(context=f"{self.name}.report"): + await self.report() + return submitted def make_event(self, *args, **kwargs): raise_error = kwargs.pop("raise_error", False) @@ -271,8 +243,7 @@ def emit_event(self, *args, **kwargs): event = self.make_event(*args, **event_kwargs) self.scan.manager.queue_event(event) - @property - def events_waiting(self): + async def events_waiting(self): """ yields all events in queue, up to maximum batch size """ @@ -284,11 +255,16 @@ def events_waiting(self): break try: event = self.incoming_event_queue.get_nowait() - if event.type == "FINISHED": - finish = True - else: - events.append(event) - except queue.Empty: + self.debug(f"Got {event} from {getattr(event, 'module', 'unknown_module')}") + acceptable, reason = await self._event_postcheck(event) + if acceptable: + if event.type == "FINISHED": + finish = True + else: + events.append(event) + elif reason: + self.debug(f"Not accepting {event} because {reason}") + except asyncio.queues.QueueEmpty: break return events, finish, report @@ -323,53 +299,41 @@ async def _setup(self): self.trace() return self.name, status, str(msg) - @property - def _force_batch(self): - """ - Determine whether a batch should be forcefully submitted - """ - # if we're below our maximum threading potential - return self._internal_thread_pool.num_tasks < self.max_event_handlers - async def _worker(self): - try: - while not self.scan.stopping: - # hold the reigns if our outgoing 
queue is full - # if self._qsize and self.outgoing_event_queue.qsize() >= self._qsize: - # with self.event_received: - # await self.event_received.wait() - - if self.batch_size > 1: - pass - # submitted = self._handle_batch(force=self._force_batch) - # if not submitted: - # with self.event_received: - # await self.event_received.wait() - - else: - try: - if self.incoming_event_queue: - e = await self.incoming_event_queue.get() - else: - self.debug(f"Event queue is in bad state") - return - except queue.Empty: - continue - self.debug(f"Got {e} from {getattr(e, 'module', 'unknown_module')}") - # if we receive the special "FINISHED" event - if e.type == "FINISHED": - await self.catch(self._register_running, self.finish) - else: - await self.catch(self._register_running, self._postcheck_and_run, self.handle_event, e) + while not self.scan.stopping: + # hold the reigns if our outgoing queue is full + # if self._qsize and self.outgoing_event_queue.qsize() >= self._qsize: + # with self.event_received: + # await self.event_received.wait() + + if self.batch_size > 1: + submitted = await self._handle_batch() + if not submitted: + async with self._event_received: + await self._event_received.wait() - except KeyboardInterrupt: - self.debug(f"Interrupted") - self.scan.stop() - except ScanCancelledError as e: - self.verbose(f"Scan cancelled, {e}") - except Exception as e: - self.set_error_state(f"Exception ({e.__class__.__name__}) in module {self.name}:\n{e}") - self.trace() + else: + try: + if self.incoming_event_queue: + event = await self.incoming_event_queue.get() + else: + self.debug(f"Event queue is in bad state") + return + except asyncio.queues.QueueEmpty: + continue + self.debug(f"Got {event} from {getattr(event, 'module', 'unknown_module')}") + acceptable, reason = await self._event_postcheck(event) + if not acceptable: + self.debug(f"Not accepting {event} because {reason}") + if acceptable: + if event.type == "FINISHED": + async with self.scan.acatch(context=f"{self.name}.finish"): + with self._task_counter: + await self.finish() + else: + async with self.scan.acatch(context=f"{self.name}.handle_event"): + with self._task_counter: + await self.handle_event(event) @property def max_scope_distance(self): @@ -416,12 +380,16 @@ async def _event_postcheck(self, event): Check if an event should be accepted by the module Used when taking an event FROM the module's queue (immediately before it's handled) """ + # special exception for "FINISHED" event if event.type in ("FINISHED",): return True, "" + # reject out-of-scope events for active modules + # TODO: reconsider this if "active" in self.flags and "target" in event.tags and event not in self.scan.whitelist: return False, "it is not in whitelist and module has active flag" + # check scope distance if self._type != "output": if self.in_scope_only: if event.scope_distance > 0: @@ -436,7 +404,7 @@ async def _event_postcheck(self, event): ) # custom filtering - try: + async with self.scan.acatch(context=self.filter_event): filter_result = await self.filter_event(event) msg = str(self._custom_filter_criteria_msg) with suppress(ValueError, TypeError): @@ -444,16 +412,12 @@ async def _event_postcheck(self, event): msg += f": {reason}" if not filter_result: return False, msg - except ScanCancelledError: - return False, "Scan cancelled" - except Exception as e: - self.error(f"Error in filter_event({event}): {e}") - self.trace() if self._type == "output" and not event._stats_recorded: event._stats_recorded = True self.scan.stats.event_produced(event) + 
self.debug(f"{event} passed post-check") return True, "" async def _cleanup(self): @@ -461,9 +425,11 @@ async def _cleanup(self): self._cleanedup = True for callback in [self.cleanup] + self.cleanup_callbacks: if callable(callback): - await self.catch(self._register_running, callback, _force=True) + async with self.scan.acatch(context=self.name): + with self._task_counter: + await self.helpers.execute_sync_or_async(callback) - def queue_event(self, event): + async def queue_event(self, event): if self.incoming_event_queue in (None, False): self.debug(f"Not in an acceptable state to queue event") return @@ -474,6 +440,8 @@ def queue_event(self, event): return try: self.incoming_event_queue.put_nowait(event) + async with self._event_received: + self._event_received.notify() except AttributeError: self.debug(f"Not in an acceptable state to queue event") diff --git a/bbot/modules/httpx.py b/bbot/modules/httpx.py index 6641b38301..16ca7294c2 100644 --- a/bbot/modules/httpx.py +++ b/bbot/modules/httpx.py @@ -32,7 +32,7 @@ class httpx(BaseModule): scope_distance_modifier = 1 _priority = 2 - def setup(self): + async def setup(self): self.threads = self.config.get("threads", 50) self.timeout = self.scan.config.get("httpx_timeout", 5) self.retries = self.scan.config.get("httpx_retries", 1) @@ -40,7 +40,7 @@ def setup(self): self.visited = set() return True - def filter_event(self, event): + async def filter_event(self, event): if "_wildcard" in str(event.host).split("."): return False, "event is wildcard" @@ -62,7 +62,7 @@ def filter_event(self, event): # note: speculate makes open ports from return True - def handle_batch(self, *events): + async def handle_batch(self, *events): stdin = {} for e in events: url_hash = None @@ -106,7 +106,7 @@ def handle_batch(self, *events): proxy = self.scan.config.get("http_proxy", "") if proxy: command += ["-http-proxy", proxy] - for line in self.helpers.run_live(command, input=list(stdin), stderr=subprocess.DEVNULL): + async for line in self.helpers.run_live(command, input=list(stdin), stderr=subprocess.DEVNULL): try: j = json.loads(line) except json.decoder.JSONDecodeError: diff --git a/bbot/modules/internal/speculate.py b/bbot/modules/internal/speculate.py index 7e9d65f969..079f8076ed 100644 --- a/bbot/modules/internal/speculate.py +++ b/bbot/modules/internal/speculate.py @@ -29,6 +29,7 @@ async def setup(self): self.open_port_consumers = any(["OPEN_TCP_PORT" in m.watched_events for m in self.scan.modules.values()]) self.portscanner_enabled = any(["portscan" in m.flags for m in self.scan.modules.values()]) self.range_to_ip = True + self.dns_resolution = self.scan.config.get("dns_resolution", True) self.ports = self.config.get("ports", [80, 443]) if isinstance(self.ports, int): @@ -88,10 +89,9 @@ async def handle_event(self, event): # from hosts if emit_open_ports: # don't act on unresolved DNS_NAMEs - usable_dns = False if event.type == "DNS_NAME": - if "a-record" in event.tags or "aaaa-record" in event.tags: + if (not self.dns_resolution) or ("a-record" in event.tags or "aaaa-record" in event.tags): usable_dns = True if event.type == "IP_ADDRESS" or usable_dns: diff --git a/bbot/modules/massdns.py b/bbot/modules/massdns.py index e986206fa8..addef9fc3e 100644 --- a/bbot/modules/massdns.py +++ b/bbot/modules/massdns.py @@ -98,7 +98,7 @@ async def handle_event(self, event): if not h in self.source_events: self.source_events[h] = event - self.info(f"Brute-forcing subdomains for {query}") + self.info(f"Brute-forcing subdomains for {query} ({event})") for hostname 
in await self.massdns(query, self.helpers.read_file(self.subdomain_file)): self.emit_result(hostname, event, query) @@ -141,9 +141,12 @@ async def _canary_check(self, domain, num_checks=50): random_subdomains = list(self.gen_random_subdomains(num_checks)) self.verbose(f"Testing {len(random_subdomains):,} canaries against {domain}") canary_results = [l async for l in self._massdns(domain, random_subdomains)] - for result in canary_results: - if await self.helpers.resolve(result): + async for result in self.helpers.resolve_batch(canary_results): + if result: return True + # for result in canary_results: + # if await self.helpers.resolve(result): + # return True return False async def _massdns(self, domain, subdomains): diff --git a/bbot/modules/naabu.py b/bbot/modules/naabu.py index d806ab7082..f81424df89 100644 --- a/bbot/modules/naabu.py +++ b/bbot/modules/naabu.py @@ -20,7 +20,7 @@ class naabu(BaseModule): "skip_host_discovery": "skip host discovery (-Pn)", "version": "naabu version", } - max_event_handlers = 2 + max_event_handlers = 1 batch_size = 256 _priority = 2 @@ -56,15 +56,15 @@ class naabu(BaseModule): }, ] - def setup(self): + async def setup(self): self.helpers.depsinstaller.ensure_root(message="Naabu requires root privileges") self.skip_host_discovery = self.config.get("skip_host_discovery", True) return True - def handle_batch(self, *events): + async def handle_batch(self, *events): _input = [str(e.data) for e in events] command = self.construct_command() - for line in self.helpers.run_live(command, input=_input, stderr=subprocess.DEVNULL, sudo=False): + async for line in self.helpers.run_live(command, input=_input, stderr=subprocess.DEVNULL, sudo=False): try: j = json.loads(line) except Exception as e: @@ -115,6 +115,6 @@ def construct_command(self): command += ["-top-ports", top_ports] return command - def cleanup(self): + async def cleanup(self): resume_file = self.helpers.current_dir / "resume.cfg" resume_file.unlink(missing_ok=True) diff --git a/bbot/modules/paramminer_cookies.py b/bbot/modules/paramminer_cookies.py index be2318dc4c..64f3965191 100644 --- a/bbot/modules/paramminer_cookies.py +++ b/bbot/modules/paramminer_cookies.py @@ -1,4 +1,3 @@ -from bbot.core.errors import ScanCancelledError from .paramminer_headers import paramminer_headers @@ -22,8 +21,6 @@ class paramminer_cookies(paramminer_headers): compare_mode = "cookie" def check_batch(self, compare_helper, url, cookie_list): - if self.scan.stopping: - raise ScanCancelledError() cookies = {p: self.rand_string(14) for p in cookie_list} return compare_helper.compare(url, cookies=cookies) diff --git a/bbot/modules/paramminer_getparams.py b/bbot/modules/paramminer_getparams.py index 688f394628..7ad778c0e4 100644 --- a/bbot/modules/paramminer_getparams.py +++ b/bbot/modules/paramminer_getparams.py @@ -1,4 +1,3 @@ -from bbot.core.errors import ScanCancelledError from .paramminer_headers import paramminer_headers @@ -21,8 +20,6 @@ class paramminer_getparams(paramminer_headers): compare_mode = "getparam" def check_batch(self, compare_helper, url, getparam_list): - if self.scan.stopping: - raise ScanCancelledError() test_getparams = {p: self.rand_string(14) for p in getparam_list} return compare_helper.compare(self.helpers.add_get_params(url, test_getparams).geturl()) diff --git a/bbot/modules/paramminer_headers.py b/bbot/modules/paramminer_headers.py index 0b0678825b..1009a4a33f 100644 --- a/bbot/modules/paramminer_headers.py +++ b/bbot/modules/paramminer_headers.py @@ -1,5 +1,5 @@ from bbot.modules.base import 
BaseModule -from bbot.core.errors import HttpCompareError, ScanCancelledError +from bbot.core.errors import HttpCompareError class paramminer_headers(BaseModule): @@ -70,8 +70,6 @@ def handle_event(self, event): ) results.clear() assert False - except ScanCancelledError: - return except AssertionError: pass @@ -130,8 +128,6 @@ def binary_search(self, compare_helper, url, group, reasons=None, reflection=Fal self.warning(f"Submitted group of size 0 to binary_search()") def check_batch(self, compare_helper, url, header_list): - if self.scan.stopping: - raise ScanCancelledError() rand = self.rand_string() test_headers = {} for header in header_list: diff --git a/bbot/modules/report/asn.py b/bbot/modules/report/asn.py index 331fddafd1..592ec1ff63 100644 --- a/bbot/modules/report/asn.py +++ b/bbot/modules/report/asn.py @@ -1,4 +1,3 @@ -from bbot.core.errors import ScanCancelledError from bbot.modules.report.base import BaseReportModule @@ -90,8 +89,6 @@ def get_asn(self, ip, retries=1): """ for attempt in range(retries + 1): for i, source in enumerate(list(self.sources)): - if self.scan.stopping: - raise ScanCancelledError() get_asn_fn = getattr(self, f"get_asn_{source}") res = get_asn_fn(ip) if res == False: diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index e2bf595064..65a123f3e4 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -4,9 +4,9 @@ import traceback from contextlib import suppress +from ..core.errors import ValidationError from ..core.helpers.queueing import EventQueue from ..core.helpers.async_helpers import TaskCounter -from ..core.errors import ScanCancelledError, ValidationError log = logging.getLogger("bbot.scanner.manager") @@ -32,16 +32,14 @@ async def init_events(self): """ seed scanner with target events """ - with self._task_counter: - self.distribute_event(self.scan.root_event) - sorted_events = sorted(self.scan.target.events, key=lambda e: len(e.data)) - for event in sorted_events: - self.scan.verbose(f"Target: {event}") - self.queue_event(event) - # force submit batches - # for mod in self.scan.modules.values(): - # mod._handle_batch(force=True) - self.scan._finished_init = True + async with self.scan.acatch(context=self.init_events): + with self._task_counter: + await self.distribute_event(self.scan.root_event) + sorted_events = sorted(self.scan.target.events, key=lambda e: len(e.data)) + for event in sorted_events: + self.scan.verbose(f"Target: {event}") + self.queue_event(event) + self.scan._finished_init = True async def emit_event(self, event, *args, **kwargs): """ @@ -56,38 +54,20 @@ async def emit_event(self, event, *args, **kwargs): event._resolved.set() return False + log.debug(f'Module "{event.module}" raised {event}') + # "quick" queues the event immediately quick = kwargs.pop("quick", False) if quick: log.debug(f'Module "{event.module}" raised {event}') event._resolved.set() - for kwarg in ["abort_if", "on_success_callback", "_block"]: + for kwarg in ["abort_if", "on_success_callback"]: kwargs.pop(kwarg, None) - try: - self.distribute_event(event, *args, **kwargs) - return True - except ScanCancelledError: - return False - except Exception as e: - log.error(f"Unexpected error in manager.emit_event(): {e}") - log.trace(traceback.format_exc()) + async with self.scan.acatch(context=self.distribute_event): + await self.distribute_event(event, *args, **kwargs) else: - # don't raise an exception if the thread pool has been shutdown - error = True - try: - await self.catch(self._emit_event, event, *args, **kwargs) - error = False 
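# [editor's sketch] The acatch() refactor below replaces this manual
# error/resolved bookkeeping. A minimal, standalone approximation of that
# pattern -- the names here are illustrative, not the actual bbot code:
import asyncio
import contextlib

@contextlib.asynccontextmanager
async def acatch(context="scan", finally_callback=None):
    # surface errors instead of letting them kill the caller
    try:
        yield
    except Exception as e:
        print(f"Error in {context}: {e}")
        if callable(finally_callback):
            finally_callback()  # e.g. guarantee the event gets marked resolved

async def demo():
    resolved = asyncio.Event()
    # the callback fires even though the body raises
    async with acatch(context="_emit_event", finally_callback=resolved.set):
        raise ValueError("boom")
    assert resolved.is_set()

asyncio.run(demo())
# [end editor's sketch]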
- log.debug(f'Module "{event.module}" raised {event}') - return True - except ScanCancelledError: - return False - except Exception as e: - log.error(f"Unexpected error in manager.emit_event(): {e}") - log.trace(traceback.format_exc()) - finally: - if error: - event._resolved.set() - return False + async with self.scan.acatch(context=self._emit_event, finally_callback=event._resolved.set): + await self._emit_event(event, *args, **kwargs) def _event_precheck(self, event, exclude=("DNS_NAME",)): """ @@ -203,7 +183,8 @@ async def _emit_event(self, event, *args, **kwargs): # now that the event is properly tagged, we can finally make decisions about it if callable(abort_if): - abort_result = abort_if(event) + async with self.scan.acatch(context=abort_if): + abort_result = await self.helpers.execute_sync_or_async(abort_if, event) msg = f"{event.module}: not raising event {event} due to custom criteria in abort_if()" with suppress(ValueError, TypeError): abort_result, reason = abort_result @@ -218,7 +199,8 @@ async def _emit_event(self, event, *args, **kwargs): # run success callback before distributing event (so it can add tags, etc.) if distribute_event: if callable(on_success_callback): - self.catch(on_success_callback, event) + async with self.scan.acatch(context=on_success_callback): + await self.scan.helpers.execute_sync_or_async(on_success_callback, event) if not event.host or (event.always_emit and not event_is_duplicate): log.debug( @@ -229,7 +211,7 @@ async def _emit_event(self, event, *args, **kwargs): self.queue_event(s) if distribute_event: - self.distribute_event(event) + await self.distribute_event(event) event_distributed = True # speculate DNS_NAMES and IP_ADDRESSes from other event types @@ -277,9 +259,6 @@ async def _emit_event(self, event, *args, **kwargs): for child_event in dns_child_events: self.queue_event(child_event) - except KeyboardInterrupt: - self.scan.stop() - except ValidationError as e: log.warning(f"Event validation failed with args={args}, kwargs={kwargs}: {e}") log.trace(traceback.format_exc()) @@ -322,66 +301,29 @@ def accept_event(self, event): return False return True - async def catch(self, callback, *args, **kwargs): - """ - Wrapper to ensure error messages get surfaced to the user - """ - ret = None - on_finish_callback = kwargs.pop("_on_finish_callback", None) - force = kwargs.pop("_force", False) - fn = callback - for arg in args: - if callable(arg): - fn = arg - else: - break - try: - if not self.scan.stopping or force: - ret = await self.scan.helpers.execute_sync_or_async(callback, *args, **kwargs) - except ScanCancelledError as e: - log.debug(f"ScanCancelledError in {fn.__qualname__}(): {e}") - except BrokenPipeError as e: - log.debug(f"BrokenPipeError in {fn.__qualname__}(): {e}") - except Exception as e: - log.error(f"Error in {fn.__qualname__}(): {e}") - log.trace(traceback.format_exc()) - except KeyboardInterrupt: - log.debug(f"Interrupted") - self.scan.stop() - except asyncio.CancelledError as e: - log.debug(f"{e}") - if callable(on_finish_callback): - try: - await self.scan.helpers.execute_sync_or_async(on_finish_callback) - except Exception as e: - log.error( - f"Error in on_finish_callback {on_finish_callback.__qualname__}() after {fn.__qualname__}(): {e}" - ) - log.trace(traceback.format_exc()) - return ret - async def _register_running(self, callback, *args, **kwargs): with self._task_counter: return await callback(*args, **kwargs) - def distribute_event(self, *args, **kwargs): + async def distribute_event(self, *args, **kwargs): """ Queue 
event with modules """ - event = self.scan.make_event(*args, **kwargs) + async with self.scan.acatch(context=self.distribute_event): + event = self.scan.make_event(*args, **kwargs) - event_hash = hash(event) - dup = event_hash in self.events_distributed - if dup: - self.scan.verbose(f"{event.module}: Duplicate event: {event}") - else: - self.events_distributed.add(event_hash) - # absorb event into the word cloud if it's in scope - if not dup and -1 < event.scope_distance < 1: - self.scan.word_cloud.absorb_event(event) - for mod in self.scan.modules.values(): - if not dup or mod.accept_dupes: - mod.queue_event(event) + event_hash = hash(event) + dup = event_hash in self.events_distributed + if dup: + self.scan.verbose(f"{event.module}: Duplicate event: {event}") + else: + self.events_distributed.add(event_hash) + # absorb event into the word cloud if it's in scope + if not dup and -1 < event.scope_distance < 1: + self.scan.word_cloud.absorb_event(event) + for mod in self.scan.modules.values(): + if not dup or mod.accept_dupes: + await mod.queue_event(event) async def _worker_loop(self): try: diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index df7bb80e15..f2f3fee371 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -1,12 +1,14 @@ import queue + +# import signal import asyncio import logging import traceback +import contextlib from sys import exc_info from pathlib import Path from datetime import datetime from omegaconf import OmegaConf -from contextlib import suppress from collections import OrderedDict from bbot import config as bbot_config @@ -22,7 +24,7 @@ from bbot.core.logger import init_logging, get_log_level from bbot.core.helpers.names_generator import random_name from bbot.core.configurator.environ import prepare_environment -from bbot.core.errors import BBOTError, ScanError, ScanCancelledError, ValidationError +from bbot.core.errors import BBOTError, ScanError, ValidationError log = logging.getLogger("bbot.scanner") @@ -159,7 +161,15 @@ def __init__( self._finished_init = False self._cleanedup = False + self._loop = asyncio.get_event_loop() + + def _on_keyboard_interrupt(self, loop, event): + self.stop() + async def prep(self): + # event = asyncio.Event() + # self._loop.add_signal_handler(signal.SIGINT, self._on_keyboard_interrupt, loop, event) + self.helpers.mkdir(self.home) if not self._prepped: start_msg = f"Scan with {len(self._scan_modules):,} modules seeded with {len(self.target):,} targets" @@ -224,14 +234,7 @@ async def start(self): while 1: # abort if we're aborting if self.aborting: - # Empty event queues - for module in self.modules.values(): - with suppress(queue.Empty): - while 1: - module.incoming_event_queue.get_nowait() - with suppress(queue.Empty): - while 1: - self.incoming_event_queue.get_nowait() + self.drain_queues() break if "python" in self.modules: @@ -239,48 +242,37 @@ async def start(self): for e in events: yield e + # if initialization finished and the scan is no longer active if self._finished_init and not self.manager.active: - # And if new events were generated since last time we were here - if self.manager._new_activity: - self.manager._new_activity = False - self.status = "FINISHING" - # Trigger .finished() on every module and start over - log.info("Finishing scan") - finished_event = self.make_event("FINISHED", "FINISHED", dummy=True) - for module in self.modules.values(): - module.queue_event(finished_event) - else: - # Otherwise stop the scan if no new events were generated since last time + new_activity = 
await self.finish() + if not new_activity: break await asyncio.sleep(0.01) - # for module in self.modules.values(): - # for task in module.tasks: - # await task - - failed = False - - except KeyboardInterrupt: - self.stop() failed = False - except ScanCancelledError: - self.debug("Scan cancelled") - - except ScanError as e: - self.error(f"{e}") + except BaseException as e: + exception_chain = self.helpers.get_exception_chain(e) + if any(isinstance(exc, KeyboardInterrupt) for exc in exception_chain): + self.stop() + failed = False + else: + try: + raise + except ScanError as e: + self.error(f"{e}") - except BBOTError as e: - self.critical(f"Error during scan: {e}") - self.trace() + except BBOTError as e: + self.critical(f"Error during scan: {e}") + self.trace() - except Exception: - self.critical(f"Unexpected error during scan:\n{traceback.format_exc()}") + except Exception: + self.critical(f"Unexpected error during scan:\n{traceback.format_exc()}") finally: init_events_task.cancel() - with suppress(asyncio.CancelledError): + with contextlib.suppress(asyncio.CancelledError): await init_events_task await self.report() @@ -297,12 +289,12 @@ async def start(self): self.status = "FINISHED" ticker_task.cancel() - with suppress(asyncio.CancelledError): + with contextlib.suppress(asyncio.CancelledError): await ticker_task for t in manager_worker_loop_tasks: t.cancel() - with suppress(asyncio.CancelledError): + with contextlib.suppress(asyncio.CancelledError): await t scan_run_time = datetime.now() - scan_start_time @@ -346,16 +338,49 @@ async def setup_modules(self, remove_failed=True): elif total_failed > 0: self.warning(f"Setup failed for {total_failed:,} modules") - def stop(self, wait=False): + def stop(self): if self.status != "ABORTING": self.status = "ABORTING" self.hugewarning(f"Aborting scan") + self.trace() + self.drain_queues() self.helpers.kill_children() + self.drain_queues() self.helpers.kill_children() + async def finish(self): + # if new events were generated since last time we were here + if self.manager._new_activity: + self.manager._new_activity = False + self.status = "FINISHING" + # Trigger .finished() on every module and start over + log.info("Finishing scan") + finished_event = self.make_event("FINISHED", "FINISHED", dummy=True) + for module in self.modules.values(): + await module.queue_event(finished_event) + self.verbose("Completed finish()") + return True + # Return False if no new events were generated since last time + self.verbose("Completed final finish()") + return False + + def drain_queues(self): + # Empty event queues + self.debug("Draining queues") + for module in self.modules.values(): + with contextlib.suppress(asyncio.queues.QueueEmpty): + while 1: + module.incoming_event_queue.get_nowait() + with contextlib.suppress(queue.Empty): + while 1: + self.manager.incoming_event_queue.get_nowait() + self.debug("Finished draining queues") + async def report(self): for mod in self.modules.values(): - await self.manager.catch(mod._register_running, mod.report) + async with self.acatch(context=mod.report): + with mod._task_counter: + await mod.report() async def cleanup(self): # clean up modules @@ -364,7 +389,7 @@ async def cleanup(self): await mod._cleanup() if not self._cleanedup: self._cleanedup = True - with suppress(Exception): + with contextlib.suppress(Exception): self.home.rmdir() self.helpers.clean_old_scans() @@ -606,6 +631,53 @@ def _load_modules(self, modules): return loaded_modules, failed async def _status_ticker(self, interval=15): - while not 
self.stopped:
-        await asyncio.sleep(interval)
-        await self.manager.modules_status(_log=True)
+        async with self.acatch():
+            # while not self.stopped:
+            while 1:
+                await asyncio.sleep(interval)
+                await self.manager.modules_status(_log=True)
+
+    @contextlib.contextmanager
+    def catch(self, context="scan", finally_callback=None):
+        """
+        Handle common errors by stopping scan, logging tracebacks, etc.
+
+        with catch():
+            do_stuff()
+        """
+        try:
+            yield
+        except BaseException as e:
+            self._handle_exception(e, context=context, finally_callback=finally_callback)
+
+    @contextlib.asynccontextmanager
+    async def acatch(self, context="scan", finally_callback=None):
+        """
+        Async version of catch()
+
+        async with acatch():
+            await do_stuff()
+        """
+        try:
+            yield
+        except BaseException as e:
+            self._handle_exception(e, context=context, finally_callback=finally_callback)
+
+    def _handle_exception(self, e, context="scan", finally_callback=None):
+        if callable(context):
+            context = f"{context.__qualname__}()"
+        filename, lineno, funcname = self.helpers.get_traceback_details(e)
+        exception_chain = self.helpers.get_exception_chain(e)
+        if any(isinstance(exc, KeyboardInterrupt) for exc in exception_chain):
+            log.debug(f"Interrupted")
+            self.stop()
+        elif isinstance(e, BrokenPipeError):
+            log.debug(f"BrokenPipeError in {filename}:{lineno}:{funcname}(): {e}")
+        elif isinstance(e, asyncio.CancelledError):
+            log.debug(f"asyncio CancelledError: {e}")
+            log.trace(traceback.format_exc())
+        elif isinstance(e, Exception):
+            log.error(f"Error in {context}: {filename}:{lineno}:{funcname}(): {e}")
+            log.trace(traceback.format_exc())
+        if callable(finally_callback):
+            self.helpers.execute_sync_or_async(finally_callback, e)
diff --git a/bbot/test/test_step_2/test_command.py b/bbot/test/test_step_2/test_command.py
index db2a069290..5f56d248b0 100644
--- a/bbot/test/test_step_2/test_command.py
+++ b/bbot/test/test_step_2/test_command.py
@@ -9,6 +9,8 @@ async def test_command(bbot_scanner, bbot_config):
     assert "plumbus\n" == (await scan1.helpers.run(["echo", "plumbus"])).stdout
     result = (await scan1.helpers.run(["cat"], input="some\nrandom\nstdin")).stdout
     assert result.splitlines() == ["some", "random", "stdin"]
+    result = (await scan1.helpers.run(["cat"], input=["some", "random", "stdin"])).stdout
+    assert result.splitlines() == ["some", "random", "stdin"]
 
     # run_live
     lines = []
@@ -19,6 +21,10 @@ async def test_command(bbot_scanner, bbot_config):
     async for line in scan1.helpers.run_live(["cat"], input="some\nrandom\nstdin"):
         lines.append(line)
     assert lines == ["some", "random", "stdin"]
+    lines = []
+    async for line in scan1.helpers.run_live(["cat"], input=["some", "random", "stdin"]):
+        lines.append(line)
+    assert lines == ["some", "random", "stdin"]
 
     # test piping
     lines = []
diff --git a/bbot/test/test_step_2/test_manager.py b/bbot/test/test_step_2/test_manager.py
index 4a0bcff54a..eff5190e4d 100644
--- a/bbot/test/test_step_2/test_manager.py
+++ b/bbot/test/test_step_2/test_manager.py
@@ -89,23 +89,10 @@ class DummyModule3:
 
     # error catching
     msg = "Ignore this error, it belongs here"
-
-    def raise_e():
-        raise Exception(msg)
-
-    def raise_k():
-        raise KeyboardInterrupt(msg)
-
-    def raise_s():
-        raise ScanCancelledError(msg)
-
-    def raise_b():
-        raise BrokenPipeError(msg)
-
-    manager.catch(raise_e, _on_finish_callback=raise_e)
-    manager.catch(raise_k)
-    manager.catch(raise_s)
-    manager.catch(raise_b)
+    exceptions = (Exception(msg), KeyboardInterrupt(msg), BrokenPipeError(msg))
+    for e in exceptions:
+        with manager.catch():
+            raise e
 
 
 def test_scope_distance(bbot_scanner, bbot_config):

From
7e8b3c01624d6a8671d26948fd596f0e7b3d9487 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Wed, 10 May 2023 14:32:07 -0400 Subject: [PATCH 011/387] httpx tests --- bbot/core/helpers/dns.py | 10 ---------- bbot/core/helpers/helper.py | 4 ---- bbot/modules/output/python.py | 2 +- bbot/scanner/scanner.py | 2 +- bbot/test/helpers.py | 12 +++++++++--- bbot/test/modules_test_classes.py | 4 ++-- bbot/test/test_step_1/test_modules_full.py | 5 +++-- 7 files changed, 16 insertions(+), 23 deletions(-) diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 2e1bd093fd..23fd8601f8 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -127,8 +127,6 @@ async def _resolve_hostname(self, query, **kwargs): parent_hash = hash(f"{parent}:{rdtype}") dns_cache_hash = hash(f"{query}:{rdtype}") while tries_left > 0: - # if self.parent_helper.scan_stopping: - # break try: try: results = self._dns_cache[dns_cache_hash] @@ -176,8 +174,6 @@ async def _resolve_ip(self, query, **kwargs): errors = [] dns_cache_hash = hash(f"{query}:PTR") while tries_left > 0: - # if self.parent_helper.scan_stopping: - # break try: if dns_cache_hash in self._dns_cache: result = self._dns_cache[dns_cache_hash] @@ -586,9 +582,3 @@ def _get_dummy_module(self, name): dummy_module = self.parent_helper._make_dummy_module(name=name, _type="DNS") self._dummy_modules[name] = dummy_module return dummy_module - - def dns_warning(self, msg): - msg_hash = hash(msg) - if msg_hash not in self._dns_warnings: - log.warning(msg) - self._dns_warnings.add(msg_hash) diff --git a/bbot/core/helpers/helper.py b/bbot/core/helpers/helper.py index f25578d30b..7d0a00d7d7 100644 --- a/bbot/core/helpers/helper.py +++ b/bbot/core/helpers/helper.py @@ -81,10 +81,6 @@ def scan(self): self._scan = Scanner() return self._scan - @property - def scan_stopping(self): - return getattr(self.scan, "stopping", False) - @property def in_tests(self): return os.environ.get("BBOT_TESTING", "") == "True" diff --git a/bbot/modules/output/python.py b/bbot/modules/output/python.py index d7ec521d96..3aebfeb527 100644 --- a/bbot/modules/output/python.py +++ b/bbot/modules/output/python.py @@ -5,5 +5,5 @@ class python(BaseOutputModule): watched_events = ["*"] meta = {"description": "Output via Python API"} - def _worker(self): + async def _worker(self): pass diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index f2f3fee371..80aae3e62b 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -238,7 +238,7 @@ async def start(self): break if "python" in self.modules: - events, finish, report = self.modules["python"].events_waiting + events, finish, report = await self.modules["python"].events_waiting() for e in events: yield e diff --git a/bbot/test/helpers.py b/bbot/test/helpers.py index 50ae08635b..4654c036ca 100644 --- a/bbot/test/helpers.py +++ b/bbot/test/helpers.py @@ -1,7 +1,10 @@ +import logging import requests_mock from abc import abstractmethod from omegaconf import OmegaConf +log = logging.getLogger("bbot.test.helpers") + class MockHelper: targets = ["blacklanternsecurity.com"] @@ -13,17 +16,16 @@ class MockHelper: def __init__(self, config, bbot_scanner, *args, **kwargs): self.name = kwargs.get("module_name", self.__class__.__name__.lower()) self.config = OmegaConf.merge(config, OmegaConf.create(self.config_overrides)) + modules = [self.name] + self.additional_modules self.scan = bbot_scanner( *self.targets, - modules=[self.name] + self.additional_modules, + modules=modules, name=f"{self.name}_test", 
config=self.config, whitelist=self.whitelist, blacklist=self.blacklist, ) self.patch_scan(self.scan) - self.scan.prep() - self.module = self.scan.modules[self.name] self.setup() def patch_scan(self, scan): @@ -41,6 +43,10 @@ def run(self): def check_events(self, events): raise NotImplementedError + @property + def module(self): + return self.scan.modules[self.name] + class RequestMockHelper(MockHelper): @abstractmethod diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py index aedf31891a..c1bf5bf552 100644 --- a/bbot/test/modules_test_classes.py +++ b/bbot/test/modules_test_classes.py @@ -13,8 +13,8 @@ def mock_args(self): respond_args = dict(response_data=json.dumps({"foo": "bar"})) self.set_expect_requests(request_args, respond_args) - def run(self): - events = list(self.scan.start()) + async def run(self): + events = [e async for e in self.scan.start()] assert self.check_events(events) def check_events(self, events): diff --git a/bbot/test/test_step_1/test_modules_full.py b/bbot/test/test_step_1/test_modules_full.py index 8203f14acf..8d1f58204b 100644 --- a/bbot/test/test_step_1/test_modules_full.py +++ b/bbot/test/test_step_1/test_modules_full.py @@ -11,9 +11,10 @@ def test_gowitness(bbot_config, bbot_scanner, bbot_httpserver): x.run() -def test_httpx(bbot_config, bbot_scanner, bbot_httpserver): +@pytest.mark.asyncio +async def test_httpx(bbot_config, bbot_scanner, bbot_httpserver): x = Httpx(bbot_config, bbot_scanner, bbot_httpserver) - x.run() + await x.run() def test_excavate(bbot_config, bbot_scanner, bbot_httpserver): From 700347bafa270deee2a41f4b19ef546f0a767cd9 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Thu, 11 May 2023 16:35:19 -0400 Subject: [PATCH 012/387] module tests up to masscan --- bbot/core/helpers/command.py | 39 ++- bbot/core/helpers/depsinstaller/installer.py | 29 +- bbot/core/helpers/diff.py | 143 +++++----- bbot/core/helpers/misc.py | 17 ++ bbot/modules/anubisdb.py | 8 +- bbot/modules/badsecrets.py | 2 +- bbot/modules/base.py | 91 ++++--- bbot/modules/crobat.py | 14 +- bbot/modules/fingerprintx.py | 4 +- bbot/modules/gowitness.py | 25 +- bbot/modules/leakix.py | 4 +- bbot/modules/masscan.py | 15 +- bbot/modules/paramminer_cookies.py | 4 +- bbot/modules/paramminer_getparams.py | 4 +- bbot/modules/paramminer_headers.py | 29 +- bbot/modules/robots.py | 6 +- bbot/modules/secretsdb.py | 6 +- bbot/modules/subdomain_hijack.py | 22 +- bbot/modules/telerik.py | 54 ++-- bbot/scanner/manager.py | 14 +- bbot/scanner/scanner.py | 49 ++-- bbot/test/helpers.py | 49 ++-- bbot/test/modules_test_classes.py | 251 +++++++++--------- bbot/test/test_step_1/test_modules_full.py | 263 +++++++++++-------- bbot/test/test_step_2/test_command.py | 38 ++- poetry.lock | 41 ++- pyproject.toml | 2 +- 27 files changed, 689 insertions(+), 534 deletions(-) diff --git a/bbot/core/helpers/command.py b/bbot/core/helpers/command.py index 219fa1bc73..be66d04eec 100644 --- a/bbot/core/helpers/command.py +++ b/bbot/core/helpers/command.py @@ -2,14 +2,14 @@ import asyncio import logging import traceback -from subprocess import CompletedProcess +from subprocess import CompletedProcess, CalledProcessError from .misc import smart_decode, smart_encode log = logging.getLogger("bbot.core.helpers.command") -async def run(self, *command, **kwargs): +async def run(self, *command, check=False, text=True, **kwargs): """ Simple helper for running a command, and getting its output as a string process = await run(["ls", "/tmp"]) @@ -25,16 +25,20 @@ async def run(self, *command, 
**kwargs): stdout, stderr = await proc.communicate(_input) # surface stderr - stderr = smart_decode(stderr) - stdout = smart_decode(stdout) - if stderr and proc.returncode != 0: - command_str = " ".join(command) - log.warning(f"Stderr for run({command_str}):\n\t{stderr}") + if text: + stderr = smart_decode(stderr) + stdout = smart_decode(stdout) + if proc.returncode: + if check: + raise CalledProcessError(proc.returncode, command, output=stdout, stderr=stderr) + if stderr: + command_str = " ".join(command) + log.warning(f"Stderr for run({command_str}):\n\t{stderr}") return CompletedProcess(command, proc.returncode, stdout, stderr) -async def run_live(self, *command, **kwargs): +async def run_live(self, *command, check=False, text=True, **kwargs): """ Simple helper for running a command and iterating through its output line by line in realtime async for line in run_live(["ls", "/tmp"]): @@ -50,7 +54,11 @@ async def run_live(self, *command, **kwargs): line = await proc.stdout.readline() if not line: break - yield smart_decode(line).rstrip("\r\n") + if text: + line = smart_decode(line).rstrip("\r\n") + else: + line = line.rstrip(b"\r\n") + yield line if input_task is not None: try: @@ -59,12 +67,17 @@ async def run_live(self, *command, **kwargs): log.trace(traceback.format_exc()) await proc.wait() - # surface stderr - if proc.returncode != 0: + if proc.returncode: stdout, stderr = await proc.communicate() + if text: + stderr = smart_decode(stderr) + stdout = smart_decode(stdout) + if check: + raise CalledProcessError(proc.returncode, command, output=stdout, stderr=stderr) + # surface stderr if stderr: command_str = " ".join(command) - log.warning(f"Stderr for run_live({command_str}):\n\t{smart_decode(stderr)}") + log.warning(f"Stderr for run_live({command_str}):\n\t{stderr}") async def _spawn_proc(self, *command, **kwargs): @@ -100,6 +113,8 @@ async def _write_stdin(proc, _input): def _prepare_command_kwargs(self, command, kwargs): + # limit = 10MB (this is needed for cases like httpx that are sending large JSON blobs over stdout) + kwargs["limit"] = 1024 * 1024 * 10 if not "stdout" in kwargs: kwargs["stdout"] = asyncio.subprocess.PIPE if not "stderr" in kwargs: diff --git a/bbot/core/helpers/depsinstaller/installer.py b/bbot/core/helpers/depsinstaller/installer.py index 31c37a6dba..2195237f38 100644 --- a/bbot/core/helpers/depsinstaller/installer.py +++ b/bbot/core/helpers/depsinstaller/installer.py @@ -29,6 +29,7 @@ def __init__(self, parent_helper): os.environ["ANSIBLE_TIMEOUT"] = str(http_timeout) self.askpass_filename = "sudo_askpass.py" + self._installed_sudo_askpass = False self._sudo_password = os.environ.get("BBOT_SUDO_PASS", None) if self._sudo_password is None: if configurator.bbot_sudo_pass is not None: @@ -55,7 +56,7 @@ def __init__(self, parent_helper): self.ensure_root_lock = Lock() - def install(self, *modules): + async def install(self, *modules): self.install_core_deps() succeeded = [] failed = [] @@ -95,7 +96,7 @@ def install(self, *modules): # get sudo access if we need it if preloaded.get("sudo", False) == True: self.ensure_root(f'Module "{m}" needs root privileges to install its dependencies.') - success = self.install_module(m) + success = await self.install_module(m) self.setup_status[module_hash] = success if success or self.ignore_failed_deps: log.debug(f'Setup succeeded for module "{m}"') @@ -122,7 +123,7 @@ def install(self, *modules): failed.sort() return succeeded, failed - def install_module(self, module): + async def install_module(self, module): success = True 
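# [editor's sketch] How the check=True behavior added to run()/run_live()
# above is meant to surface subprocess failures. A standalone approximation
# using plain asyncio (the bbot helpers themselves aren't importable here):
import asyncio
from subprocess import CalledProcessError

async def run(command, check=False):
    proc = await asyncio.create_subprocess_exec(
        *command, stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE
    )
    stdout, stderr = await proc.communicate()
    if proc.returncode and check:
        # with check=True, a nonzero exit raises instead of just logging a warning
        raise CalledProcessError(proc.returncode, command, output=stdout.decode(), stderr=stderr.decode())
    return stdout.decode()

try:
    asyncio.run(run(["ls", "/nonexistent/path"], check=True))
except CalledProcessError as e:
    print(f"command failed ({e.returncode}): {e.stderr.strip()}")
# [end editor's sketch]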
preloaded = self.all_modules_preloaded[module] @@ -145,11 +146,11 @@ def install_module(self, module): deps_pip = preloaded["deps"]["pip"] deps_pip_constraints = preloaded["deps"]["pip_constraints"] if deps_pip: - success &= self.pip_install(deps_pip, constraints=deps_pip_constraints) + success &= await self.pip_install(deps_pip, constraints=deps_pip_constraints) return success - def pip_install(self, packages, constraints=None): + async def pip_install(self, packages, constraints=None): packages_str = ",".join(packages) log.info(f"Installing the following pip packages: {packages_str}") @@ -162,7 +163,7 @@ def pip_install(self, packages, constraints=None): process = None try: - process = self.parent_helper.run(command, check=True) + process = await self.parent_helper.run(command, check=True) message = f'Successfully installed pip packages "{packages_str}"' output = process.stdout.splitlines()[-1] if output: @@ -297,6 +298,7 @@ def write_setup_status(self): json.dump(self.setup_status, f) def ensure_root(self, message=""): + self._install_sudo_askpass() with self.ensure_root_lock: if os.geteuid() != 0 and self._sudo_password is None: if message: @@ -314,11 +316,7 @@ def ensure_root(self, message=""): def install_core_deps(self): to_install = set() - # install custom askpass script - askpass_src = Path(__file__).resolve().parent / self.askpass_filename - askpass_dst = self.parent_helper.tools_dir / self.askpass_filename - shutil.copy(askpass_src, askpass_dst) - askpass_dst.chmod(askpass_dst.stat().st_mode | stat.S_IEXEC) + self._install_sudo_askpass() # ensure tldextract data is cached self.parent_helper.tldextract("evilcorp.co.uk") # command: package_name @@ -329,3 +327,12 @@ def install_core_deps(self): if to_install: self.ensure_root() self.apt_install(list(to_install)) + + def _install_sudo_askpass(self): + if not self._installed_sudo_askpass: + self._installed_sudo_askpass = True + # install custom askpass script + askpass_src = Path(__file__).resolve().parent / self.askpass_filename + askpass_dst = self.parent_helper.tools_dir / self.askpass_filename + shutil.copy(askpass_src, askpass_dst) + askpass_dst.chmod(askpass_dst.stat().st_mode | stat.S_IEXEC) diff --git a/bbot/core/helpers/diff.py b/bbot/core/helpers/diff.py index 43f668dfd8..2f191e0db6 100644 --- a/bbot/core/helpers/diff.py +++ b/bbot/core/helpers/diff.py @@ -1,6 +1,5 @@ import logging import xmltodict -from time import sleep from deepdiff import DeepDiff from contextlib import suppress from xml.parsers.expat import ExpatError @@ -14,69 +13,77 @@ def __init__(self, baseline_url, parent_helper, method="GET", allow_redirects=Fa self.parent_helper = parent_helper self.baseline_url = baseline_url self.include_cache_buster = include_cache_buster + self.method = method + self.allow_redirects = allow_redirects + self._baselined = False + + async def _baseline(self): + if not self._baselined: + self._baselined = True + # vanilla URL + if self.include_cache_buster: + url_1 = self.parent_helper.add_get_params(self.baseline_url, self.gen_cache_buster()).geturl() + else: + url_1 = self.baseline_url + baseline_1 = await self.parent_helper.request( + url_1, follow_redirects=self.allow_redirects, method=self.method + ) + await self.parent_helper.sleep(1) + # put random parameters in URL, headers, and cookies + get_params = {self.parent_helper.rand_string(6): self.parent_helper.rand_string(6)} + + if self.include_cache_buster: + get_params.update(self.gen_cache_buster()) + url_2 = self.parent_helper.add_get_params(self.baseline_url, 
get_params).geturl() + baseline_2 = await self.parent_helper.request( + url_2, + headers={self.parent_helper.rand_string(6): self.parent_helper.rand_string(6)}, + cookies={self.parent_helper.rand_string(6): self.parent_helper.rand_string(6)}, + follow_redirects=self.allow_redirects, + method=self.method, + ) - # vanilla URL - if self.include_cache_buster: - url_1 = self.parent_helper.add_get_params(self.baseline_url, self.gen_cache_buster()).geturl() - else: - url_1 = self.baseline_url - baseline_1 = self.parent_helper.request(url_1, allow_redirects=allow_redirects, method=method) - sleep(1) - # put random parameters in URL, headers, and cookies - get_params = {self.parent_helper.rand_string(6): self.parent_helper.rand_string(6)} - - if self.include_cache_buster: - get_params.update(self.gen_cache_buster()) - url_2 = self.parent_helper.add_get_params(self.baseline_url, get_params).geturl() - baseline_2 = self.parent_helper.request( - url_2, - headers={self.parent_helper.rand_string(6): self.parent_helper.rand_string(6)}, - cookies={self.parent_helper.rand_string(6): self.parent_helper.rand_string(6)}, - allow_redirects=allow_redirects, - method=method, - ) - - self.baseline = baseline_1 - - if baseline_1 is None or baseline_2 is None: - log.debug("HTTP error while establishing baseline, aborting") - raise HttpCompareError("Can't get baseline from source URL") - if baseline_1.status_code != baseline_2.status_code: - log.debug("Status code not stable during baseline, aborting") - raise HttpCompareError("Can't get baseline from source URL") - try: - baseline_1_json = xmltodict.parse(baseline_1.text) - baseline_2_json = xmltodict.parse(baseline_2.text) - except ExpatError: - log.debug(f"Cant HTML parse for {baseline_url}. Switching to text parsing as a backup") - baseline_1_json = baseline_1.text.split("\n") - baseline_2_json = baseline_2.text.split("\n") - - ddiff = DeepDiff(baseline_1_json, baseline_2_json, ignore_order=True, view="tree") - self.ddiff_filters = [] - - for k, v in ddiff.items(): - for x in list(ddiff[k]): - log.debug(f"Added {k} filter for path: {x.path()}") - self.ddiff_filters.append(x.path()) - - self.baseline_json = baseline_1_json - - self.baseline_ignore_headers = [ - h.lower() - for h in [ - "date", - "last-modified", - "content-length", - "ETag", - "X-Pad", - "X-Backside-Transport", + self.baseline = baseline_1 + + if baseline_1 is None or baseline_2 is None: + log.debug("HTTP error while establishing baseline, aborting") + raise HttpCompareError("Can't get baseline from source URL") + if baseline_1.status_code != baseline_2.status_code: + log.debug("Status code not stable during baseline, aborting") + raise HttpCompareError("Can't get baseline from source URL") + try: + baseline_1_json = xmltodict.parse(baseline_1.text) + baseline_2_json = xmltodict.parse(baseline_2.text) + except ExpatError: + log.debug(f"Cant HTML parse for {self.baseline_url}. 
Switching to text parsing as a backup") + baseline_1_json = baseline_1.text.split("\n") + baseline_2_json = baseline_2.text.split("\n") + + ddiff = DeepDiff(baseline_1_json, baseline_2_json, ignore_order=True, view="tree") + self.ddiff_filters = [] + + for k, v in ddiff.items(): + for x in list(ddiff[k]): + log.debug(f"Added {k} filter for path: {x.path()}") + self.ddiff_filters.append(x.path()) + + self.baseline_json = baseline_1_json + + self.baseline_ignore_headers = [ + h.lower() + for h in [ + "date", + "last-modified", + "content-length", + "ETag", + "X-Pad", + "X-Backside-Transport", + ] ] - ] - dynamic_headers = self.compare_headers(baseline_1.headers, baseline_2.headers) + dynamic_headers = self.compare_headers(baseline_1.headers, baseline_2.headers) - self.baseline_ignore_headers += [x.lower() for x in dynamic_headers] - self.baseline_body_distance = self.compare_body(baseline_1_json, baseline_2_json) + self.baseline_ignore_headers += [x.lower() for x in dynamic_headers] + self.baseline_body_distance = self.compare_body(baseline_1_json, baseline_2_json) def gen_cache_buster(self): return {self.parent_helper.rand_string(6): "1"} @@ -114,7 +121,7 @@ def compare_body(self, content_1, content_2): log.debug(ddiff) return False - def compare( + async def compare( self, subject, headers=None, cookies=None, check_reflection=False, method="GET", allow_redirects=False ): """ @@ -125,6 +132,7 @@ def compare( "reason" is the location of the change ("code", "body", "header", or None), and "reflection" is whether the value was reflected in the HTTP response """ + await self._baseline() reflection = False if self.include_cache_buster: @@ -132,8 +140,8 @@ def compare( url = self.parent_helper.add_get_params(subject, {cache_key: cache_value}).geturl() else: url = subject - subject_response = self.parent_helper.request( - url, headers=headers, cookies=cookies, allow_redirects=allow_redirects, method=method + subject_response = await self.parent_helper.request( + url, headers=headers, cookies=cookies, follow_redirects=allow_redirects, method=method ) if not subject_response: @@ -184,10 +192,11 @@ def compare( else: return (False, diff_reasons, reflection, subject_response) - def canary_check(self, url, mode, rounds=6): + async def canary_check(self, url, mode, rounds=6): """ test detection using a canary to find hosts giving bad results """ + await self._baseline() headers = None cookies = None for i in range(0, rounds): @@ -202,7 +211,9 @@ def canary_check(self, url, mode, rounds=6): else: raise ValueError(f'Invalid mode: "{mode}", choose from: getparam, header, cookie') - match, reasons, reflection, subject_response = self.compare(new_url, headers=headers, cookies=cookies) + match, reasons, reflection, subject_response = await self.compare( + new_url, headers=headers, cookies=cookies + ) # a nonsense header "caused" a difference, we need to abort if match == False: diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index 5e95899200..243901231f 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -10,6 +10,7 @@ import shutil import signal import string +import asyncio import difflib import inspect import logging @@ -18,6 +19,7 @@ import traceback import subprocess as sp from pathlib import Path +from asyncio import sleep # noqa from itertools import islice from datetime import datetime from tabulate import tabulate @@ -1052,3 +1054,18 @@ def get_traceback_details(e): lineno = last_frame.lineno funcname = last_frame.name return filename, lineno, funcname + + 
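# [editor's sketch] Intended usage of the cancel_tasks() helper added below:
# cancel long-running workers, then await each one so cancellation completes
# before teardown continues. This usage example is assumed, not from the patch:
import asyncio
from contextlib import suppress

async def worker(n):
    while True:  # a never-ending worker task
        await asyncio.sleep(n)

async def demo():
    tasks = [asyncio.create_task(worker(i + 1)) for i in range(3)]
    await asyncio.sleep(0.1)
    # same shape as cancel_tasks(): cancel, then await to let cancellation land
    for task in tasks:
        task.cancel()
        with suppress(asyncio.CancelledError):
            await task

asyncio.run(demo())
# [end editor's sketch]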
+def create_task(*args, **kwargs):
+    return asyncio.create_task(*args, **kwargs)
+
+
+def as_completed(*args, **kwargs):
+    yield from asyncio.as_completed(*args, **kwargs)
+
+
+async def cancel_tasks(tasks):
+    for task in tasks:
+        task.cancel()
+        with suppress(asyncio.CancelledError):
+            await task
diff --git a/bbot/modules/anubisdb.py b/bbot/modules/anubisdb.py
index affb579eec..c580c9e9da 100644
--- a/bbot/modules/anubisdb.py
+++ b/bbot/modules/anubisdb.py
@@ -10,9 +10,9 @@ class anubisdb(crobat):
     base_url = "https://jldc.me/anubis/subdomains"
     dns_abort_depth = 5
 
-    def request_url(self, query):
+    async def request_url(self, query):
         url = f"{self.base_url}/{self.helpers.quote(query)}"
-        return self.request_with_fail_count(url)
+        return await self.request_with_fail_count(url)
 
     def abort_if_pre(self, hostname):
         """
@@ -24,11 +24,11 @@ def abort_if_pre(self, hostname):
                 return True
         return False
 
-    def abort_if(self, event):
+    async def abort_if(self, event):
         # abort if dns name is unresolved
         if not "resolved" in event.tags:
             return True, "DNS name is unresolved"
-        return super().abort_if(event)
+        return await super().abort_if(event)
 
     def parse_results(self, r, query):
         results = set()
diff --git a/bbot/modules/badsecrets.py b/bbot/modules/badsecrets.py
index 82bf3c1453..99194eae3d 100644
--- a/bbot/modules/badsecrets.py
+++ b/bbot/modules/badsecrets.py
@@ -11,7 +11,7 @@ class badsecrets(BaseModule):
     max_event_handlers = 2
     deps_pip = ["badsecrets~=0.1.287"]
 
-    def handle_event(self, event):
+    async def handle_event(self, event):
         resp_body = event.data.get("body", None)
         resp_headers = event.data.get("header", None)
         resp_cookies = {}
diff --git a/bbot/modules/base.py b/bbot/modules/base.py
index 75c9f08c40..4d1f626541 100644
--- a/bbot/modules/base.py
+++ b/bbot/modules/base.py
@@ -1,4 +1,3 @@
-import queue
 import asyncio
 import logging
 import traceback
@@ -98,6 +97,7 @@ def __init__(self, scan):
         # track number of failures (for .request_with_fail_count())
         self._request_failures = 0
 
+        self._tasks = []
         self._event_received = asyncio.Condition()
 
     async def setup(self):
@@ -238,10 +238,13 @@ def make_event(self, *args, **kwargs):
 
     def emit_event(self, *args, **kwargs):
         event_kwargs = dict(kwargs)
+        emit_kwargs = {}
         for o in ("on_success_callback", "abort_if", "quick"):
-            event_kwargs.pop(o, None)
+            v = event_kwargs.pop(o, None)
+            if v is not None:
+                emit_kwargs[o] = v
         event = self.make_event(*args, **event_kwargs)
-        self.scan.manager.queue_event(event)
+        self.scan.manager.queue_event(event, **emit_kwargs)
 
     async def events_waiting(self):
         """
@@ -262,6 +265,7 @@ async def events_waiting(self):
                     finish = True
                 else:
                     events.append(event)
+                    self.scan.stats.event_consumed(event, self)
             elif reason:
                 self.debug(f"Not accepting {event} because {reason}")
         except asyncio.queues.QueueEmpty:
@@ -276,7 +280,7 @@ def num_queued_events(self):
         return ret
 
     def start(self):
-        self.tasks = [asyncio.create_task(self._worker()) for _ in range(self.max_event_handlers)]
+        self._tasks = [asyncio.create_task(self._worker()) for _ in range(self.max_event_handlers)]
 
     async def _setup(self):
         status_codes = {False: "hard-fail", None: "soft-fail", True: "success"}
@@ -300,40 +304,42 @@ async def _setup(self):
         return self.name, status, str(msg)
 
     async def _worker(self):
-        while not self.scan.stopping:
-            # hold the reins if our outgoing queue is full
-            # if self._qsize and self.outgoing_event_queue.qsize() >= self._qsize:
-            #     with self.event_received:
-            #         await self.event_received.wait()
-
-            if self.batch_size > 1:
-                submitted = await self._handle_batch()
-                if not submitted:
-                    async with self._event_received:
-                        await self._event_received.wait()
-
-            else:
-                try:
-                    if self.incoming_event_queue:
-                        event = await self.incoming_event_queue.get()
-                    else:
-                        self.debug(f"Event queue is in bad state")
-                        return
-                except asyncio.queues.QueueEmpty:
-                    continue
-                self.debug(f"Got {event} from {getattr(event, 'module', 'unknown_module')}")
-                acceptable, reason = await self._event_postcheck(event)
-                if not acceptable:
-                    self.debug(f"Not accepting {event} because {reason}")
-                if acceptable:
-                    if event.type == "FINISHED":
-                        async with self.scan.acatch(context=f"{self.name}.finish"):
-                            with self._task_counter:
-                                await self.finish()
-                    else:
-                        async with self.scan.acatch(context=f"{self.name}.handle_event"):
-                            with self._task_counter:
-                                await self.handle_event(event)
+        async with self.scan.acatch(context=self._worker):
+            while not self.scan.stopping:
+                # hold the reins if our outgoing queue is full
+                # if self._qsize and self.outgoing_event_queue.qsize() >= self._qsize:
+                #     with self.event_received:
+                #         await self.event_received.wait()
+
+                if self.batch_size > 1:
+                    submitted = await
self._handle_batch() - if not submitted: - async with self._event_received: - await self._event_received.wait() - - else: - try: - if self.incoming_event_queue: - event = await self.incoming_event_queue.get() - else: - self.debug(f"Event queue is in bad state") - return - except asyncio.queues.QueueEmpty: - continue - self.debug(f"Got {event} from {getattr(event, 'module', 'unknown_module')}") - acceptable, reason = await self._event_postcheck(event) - if not acceptable: - self.debug(f"Not accepting {event} because {reason}") - if acceptable: - if event.type == "FINISHED": - async with self.scan.acatch(context=f"{self.name}.finish"): - with self._task_counter: - await self.finish() - else: - async with self.scan.acatch(context=f"{self.name}.handle_event"): - with self._task_counter: - await self.handle_event(event) + async with self.scan.acatch(context=self._worker): + while not self.scan.stopping: + # hold the reigns if our outgoing queue is full + # if self._qsize and self.outgoing_event_queue.qsize() >= self._qsize: + # with self.event_received: + # await self.event_received.wait() + + if self.batch_size > 1: + submitted = await self._handle_batch() + if not submitted: + async with self._event_received: + await self._event_received.wait() + + else: + try: + if self.incoming_event_queue: + event = await self.incoming_event_queue.get() + else: + self.debug(f"Event queue is in bad state") + return + except asyncio.queues.QueueEmpty: + continue + self.debug(f"Got {event} from {getattr(event, 'module', 'unknown_module')}") + acceptable, reason = await self._event_postcheck(event) + if not acceptable: + self.debug(f"Not accepting {event} because {reason}") + if acceptable: + if event.type == "FINISHED": + async with self.scan.acatch(context=f"{self.name}.finish"): + with self._task_counter: + await self.finish() + else: + self.scan.stats.event_consumed(event, self) + async with self.scan.acatch(context=f"{self.name}.handle_event"): + with self._task_counter: + await self.handle_event(event) @property def max_scope_distance(self): @@ -454,7 +460,7 @@ def set_error_state(self, message=None): # clear incoming queue if self.incoming_event_queue: self.debug(f"Emptying event_queue") - with suppress(queue.Empty): + with suppress(asyncio.queues.QueueEmpty): while 1: self.incoming_event_queue.get_nowait() # set queue to None to prevent its use @@ -493,8 +499,8 @@ def finished(self): """ return not self.running and self.num_queued_events <= 0 and self.outgoing_event_queue.qsize() <= 0 - def request_with_fail_count(self, *args, **kwargs): - r = self.helpers.request(*args, **kwargs) + async def request_with_fail_count(self, *args, **kwargs): + r = await self.helpers.request(*args, **kwargs) if r is None: self._request_failures += 1 else: @@ -550,8 +556,7 @@ def memory_usage(self): """ Return how much memory the module is currently using in bytes """ - seen = set(self.scan.pools.values()) - seen.update({self.scan, self.helpers, self.log}) + seen = {self.scan, self.helpers, self.log} return get_size(self, max_depth=3, seen=seen) def __str__(self): diff --git a/bbot/modules/crobat.py b/bbot/modules/crobat.py index 66c0f70b62..da4191911f 100644 --- a/bbot/modules/crobat.py +++ b/bbot/modules/crobat.py @@ -77,17 +77,17 @@ def already_processed(self, hostname): return True return False - def abort_if(self, event): + async def abort_if(self, event): # this helps weed out unwanted results when scanning IP_RANGES and wildcard domains if "in-scope" not in event.tags: return True - if self._is_wildcard(event.data): 
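# [editor's sketch] The _event_received Condition used by _worker() and
# queue_event() above is a simple wake-up handshake: batch workers sleep until
# a producer queues an event and calls notify(). Standalone version of the
# same pattern (names are illustrative, not bbot's):
import asyncio

async def producer(cond, queue):
    for i in range(3):
        queue.put_nowait(i)
        async with cond:
            cond.notify()  # wake a waiting batch worker
        await asyncio.sleep(0.05)

async def batch_worker(cond, queue):
    handled = 0
    while handled < 3:
        if queue.empty():
            async with cond:  # nothing submitted yet: sleep until notified
                await cond.wait()
            continue
        print("handled", queue.get_nowait())
        handled += 1

async def demo():
    cond, queue = asyncio.Condition(), asyncio.Queue()
    await asyncio.gather(batch_worker(cond, queue), producer(cond, queue))

asyncio.run(demo())
# [end editor's sketch]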
+ if await self._is_wildcard(event.data): return True return False async def handle_event(self, event): query = self.make_query(event) - results = self.query(query) + results = await self.query(query) if results: for hostname in set(results): if hostname: @@ -99,9 +99,9 @@ async def handle_event(self, event): if hostname and hostname.endswith(f".{query}") and not hostname == event.data: self.emit_event(hostname, "DNS_NAME", event, abort_if=self.abort_if) - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/subdomains/{self.helpers.quote(query)}" - return self.request_with_fail_count(url) + return await self.request_with_fail_count(url) def make_query(self, event): if "target" in event.tags: @@ -116,13 +116,13 @@ def parse_results(self, r, query=None): for hostname in json: yield hostname - def query(self, query, parse_fn=None, request_fn=None): + async def query(self, query, parse_fn=None, request_fn=None): if parse_fn is None: parse_fn = self.parse_results if request_fn is None: request_fn = self.request_url try: - results = list(parse_fn(request_fn(query), query)) + results = list(parse_fn(await request_fn(query), query)) if results: return results self.debug(f'No results for "{query}"') diff --git a/bbot/modules/fingerprintx.py b/bbot/modules/fingerprintx.py index e6b76227e0..3bc36da66f 100644 --- a/bbot/modules/fingerprintx.py +++ b/bbot/modules/fingerprintx.py @@ -26,10 +26,10 @@ class fingerprintx(BaseModule): }, ] - def handle_batch(self, *events): + async def handle_batch(self, *events): _input = {e.data: e for e in events} command = ["fingerprintx", "--json"] - for line in self.helpers.run_live(command, input=list(_input), stderr=subprocess.DEVNULL): + async for line in self.helpers.run_live(command, input=list(_input), stderr=subprocess.DEVNULL): try: j = json.loads(line) except Exception as e: diff --git a/bbot/modules/gowitness.py b/bbot/modules/gowitness.py index 3972f4f105..867f1534bc 100644 --- a/bbot/modules/gowitness.py +++ b/bbot/modules/gowitness.py @@ -80,7 +80,7 @@ class gowitness(BaseModule): # this is one hop further than the default scope_distance_modifier = 1 - def setup(self): + async def setup(self): self.timeout = self.config.get("timeout", 10) self.threads = self.config.get("threads", 4) self.proxy = self.scan.config.get("http_proxy", "") @@ -113,7 +113,7 @@ def prep(self): copymode(self.helpers.tools_dir / "gowitness", self.base_path / "gowitness") self.prepped = True - def filter_event(self, event): + async def filter_event(self, event): # Ignore URLs that are redirects if any(t.startswith("status-30") for t in event.tags): return False, "URL is a redirect" @@ -122,12 +122,12 @@ def filter_event(self, event): return False, "event is from self" return True - def handle_batch(self, *events): + async def handle_batch(self, *events): self.prep() stdin = "\n".join([str(e.data) for e in events]) events = {e.data: e for e in events} - for line in self.helpers.run_live(self.command, input=stdin): + async for line in self.helpers.run_live(self.command, input=stdin): self.debug(line) # emit web screenshots @@ -242,12 +242,11 @@ def cur_execute(self, cur, query): self.trace() return [] - def report(self): - with self._report_lock: - if self.screenshots_taken: - self.success(f"{len(self.screenshots_taken):,} web screenshots captured. 
To view:") - self.success(f" - Start gowitness") - self.success(f" - cd {self.base_path} && ./gowitness server") - self.success(f" - Browse to http://localhost:7171") - else: - self.info(f"No web screenshots captured") + async def report(self): + if self.screenshots_taken: + self.success(f"{len(self.screenshots_taken):,} web screenshots captured. To view:") + self.success(f" - Start gowitness") + self.success(f" - cd {self.base_path} && ./gowitness server") + self.success(f" - Browse to http://localhost:7171") + else: + self.info(f"No web screenshots captured") diff --git a/bbot/modules/leakix.py b/bbot/modules/leakix.py index e692ae838f..d494683afc 100644 --- a/bbot/modules/leakix.py +++ b/bbot/modules/leakix.py @@ -9,9 +9,9 @@ class leakix(crobat): base_url = "https://leakix.net" - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/api/subdomains/{self.helpers.quote(query)}" - return self.request_with_fail_count(url, headers={"Accept": "application/json"}) + return await self.request_with_fail_count(url, headers={"Accept": "application/json"}) def parse_results(self, r, query=None): json = r.json() diff --git a/bbot/modules/masscan.py b/bbot/modules/masscan.py index b7f594f3e7..9e8282702f 100644 --- a/bbot/modules/masscan.py +++ b/bbot/modules/masscan.py @@ -50,7 +50,7 @@ class masscan(BaseModule): ] _qsize = 100 - def setup(self): + async def setup(self): self.ports = self.config.get("ports", "80,443") self.rate = self.config.get("rate", 600) self.wait = self.config.get("wait", 10) @@ -61,7 +61,7 @@ def setup(self): if not self.helpers.in_tests: try: dry_run_command = self._build_masscan_command(self._target_findkey, dry_run=True) - dry_run_result = self.helpers.run(dry_run_command) + dry_run_result = await self.helpers.run(dry_run_command) self.masscan_config = dry_run_result.stdout self.masscan_config = "\n".join(l for l in self.masscan_config.splitlines() if "nocapture" not in l) except subprocess.CalledProcessError as e: @@ -91,7 +91,7 @@ def setup(self): self.syn_cache_fd = None return True - def handle_event(self, event): + async def handle_event(self, event): if self.use_cache: self.emit_from_cache() else: @@ -114,7 +114,7 @@ def handle_event(self, event): if self.ping_first: self.verbose("Starting masscan (ping scan)") - self.masscan(targets, result_callback=self.append_alive_host, exclude=exclude, ping=True) + await self.masscan(targets, result_callback=self.append_alive_host, exclude=exclude, ping=True) targets = ",".join(str(h) for h in self.alive_hosts) if not targets: self.warning("No hosts responded to pings") @@ -123,13 +123,13 @@ def handle_event(self, event): # TCP SYN scan if self.ports: self.verbose("Starting masscan (TCP SYN scan)") - self.masscan(targets, result_callback=self.emit_open_tcp_port, exclude=exclude) + await self.masscan(targets, result_callback=self.emit_open_tcp_port, exclude=exclude) else: self.verbose("No ports specified, skipping TCP SYN scan") # save memory self.alive_hosts.clear() - def masscan(self, targets, result_callback, exclude=None, ping=False): + async def masscan(self, targets, result_callback, exclude=None, ping=False): # config file masscan_config = self.masscan_config.replace(self._target_findkey, targets) self.debug("Masscan config:") @@ -145,7 +145,8 @@ def masscan(self, targets, result_callback, exclude=None, ping=False): stats_file = self.helpers.tempfile_tail(callback=self.verbose) try: with open(stats_file, "w") as stats_fh: - for line in self.helpers.run_live(command, sudo=True, 
stderr=stats_fh): + self.critical(f"masscan: {command}") + async for line in self.helpers.run_live(command, sudo=True, stderr=stats_fh): self.process_output(line, result_callback=result_callback) finally: stats_file.unlink() diff --git a/bbot/modules/paramminer_cookies.py b/bbot/modules/paramminer_cookies.py index 64f3965191..0d4e28b0e6 100644 --- a/bbot/modules/paramminer_cookies.py +++ b/bbot/modules/paramminer_cookies.py @@ -20,9 +20,9 @@ class paramminer_cookies(paramminer_headers): in_scope_only = True compare_mode = "cookie" - def check_batch(self, compare_helper, url, cookie_list): + async def check_batch(self, compare_helper, url, cookie_list): cookies = {p: self.rand_string(14) for p in cookie_list} - return compare_helper.compare(url, cookies=cookies) + return await compare_helper.compare(url, cookies=cookies) def gen_count_args(self, url): cookie_count = 40 diff --git a/bbot/modules/paramminer_getparams.py b/bbot/modules/paramminer_getparams.py index 7ad778c0e4..6b79053434 100644 --- a/bbot/modules/paramminer_getparams.py +++ b/bbot/modules/paramminer_getparams.py @@ -19,9 +19,9 @@ class paramminer_getparams(paramminer_headers): in_scope_only = True compare_mode = "getparam" - def check_batch(self, compare_helper, url, getparam_list): + async def check_batch(self, compare_helper, url, getparam_list): test_getparams = {p: self.rand_string(14) for p in getparam_list} - return compare_helper.compare(self.helpers.add_get_params(url, test_getparams).geturl()) + return await compare_helper.compare(self.helpers.add_get_params(url, test_getparams).geturl()) def gen_count_args(self, url): getparam_count = 40 diff --git a/bbot/modules/paramminer_headers.py b/bbot/modules/paramminer_headers.py index 1009a4a33f..8357ea4db9 100644 --- a/bbot/modules/paramminer_headers.py +++ b/bbot/modules/paramminer_headers.py @@ -29,28 +29,28 @@ class paramminer_headers(BaseModule): in_scope_only = True compare_mode = "header" - def setup(self): + async def setup(self): wordlist_url = self.config.get("wordlist", "") - self.wordlist = self.helpers.wordlist(wordlist_url) + self.wordlist = await self.helpers.wordlist(wordlist_url) return True def rand_string(self, *args, **kwargs): return self.helpers.rand_string(*args, **kwargs) - def handle_event(self, event): + async def handle_event(self, event): url = event.data try: compare_helper = self.helpers.http_compare(url) except HttpCompareError as e: self.debug(e) return - batch_size = self.count_test(url) + batch_size = await self.count_test(url) if batch_size == None or batch_size <= 0: self.debug(f"Failed to get baseline max {self.compare_mode} count, aborting") return self.debug(f"Resolved batch_size at {str(batch_size)}") - if compare_helper.canary_check(url, mode=self.compare_mode) == False: + if await compare_helper.canary_check(url, mode=self.compare_mode) == False: self.verbose(f'Aborting "{url}" due to failed canary check') return @@ -62,7 +62,7 @@ def handle_event(self, event): abort_threshold = 25 try: for group in self.helpers.grouper(wordlist_cleaned, batch_size): - for result, reasons, reflection in self.binary_search(compare_helper, url, group): + async for result, reasons, reflection in self.binary_search(compare_helper, url, group): results.add((result, ",".join(reasons), reflection)) if len(results) >= abort_threshold: self.warning( @@ -85,14 +85,14 @@ def handle_event(self, event): tags=tags, ) - def count_test(self, url): - baseline = self.helpers.request(url) + async def count_test(self, url): + baseline = await self.helpers.request(url) 
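# [editor's sketch] Why binary_search() above re-yields with "async for r in
# self.binary_search(...)": async generators have no "yield from", so recursive
# delegation must be spelled out. A minimal standalone generator with the same
# divide-and-conquer shape (check() stands in for an HTTP comparison):
import asyncio

async def check(group, needles):
    await asyncio.sleep(0)  # stand-in for a network round trip
    return any(n in group for n in needles)

async def binary_search(group, needles):
    if len(group) == 1 and await check(group, needles):
        yield group[0]
    elif len(group) > 1:
        mid = len(group) // 2
        for half in (group[:mid], group[mid:]):
            if await check(half, needles):
                # no "yield from" in async generators -- re-yield manually
                async for hit in binary_search(half, needles):
                    yield hit

async def demo():
    words = [f"header-{i}" for i in range(16)]
    print([w async for w in binary_search(words, {"header-3", "header-11"})])

asyncio.run(demo())
# [end editor's sketch]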
if baseline is None: return if str(baseline.status_code)[0] in ("4", "5"): return for count, args, kwargs in self.gen_count_args(url): - r = self.helpers.request(*args, **kwargs) + r = await self.helpers.request(*args, **kwargs) if r is not None and not ((str(r.status_code)[0] in ("4", "5"))): return count @@ -112,7 +112,7 @@ def clean_list(self, header): return True return False - def binary_search(self, compare_helper, url, group, reasons=None, reflection=False): + async def binary_search(self, compare_helper, url, group, reasons=None, reflection=False): if reasons is None: reasons = [] self.debug(f"Entering recursive binary_search with {len(group):,} sized group") @@ -121,15 +121,16 @@ def binary_search(self, compare_helper, url, group, reasons=None, reflection=Fal yield group[0], reasons, reflection elif len(group) > 1: for group_slice in self.helpers.split_list(group): - match, reasons, reflection, subject_response = self.check_batch(compare_helper, url, group_slice) + match, reasons, reflection, subject_response = await self.check_batch(compare_helper, url, group_slice) if match == False: - yield from self.binary_search(compare_helper, url, group_slice, reasons, reflection) + async for r in self.binary_search(compare_helper, url, group_slice, reasons, reflection): + yield r else: self.warning(f"Submitted group of size 0 to binary_search()") - def check_batch(self, compare_helper, url, header_list): + async def check_batch(self, compare_helper, url, header_list): rand = self.rand_string() test_headers = {} for header in header_list: test_headers[header] = rand - return compare_helper.compare(url, headers=test_headers, check_reflection=(len(header_list) == 1)) + return await compare_helper.compare(url, headers=test_headers, check_reflection=(len(header_list) == 1)) diff --git a/bbot/modules/robots.py b/bbot/modules/robots.py index 97cdfffacf..da4908fcef 100644 --- a/bbot/modules/robots.py +++ b/bbot/modules/robots.py @@ -16,11 +16,11 @@ class robots(BaseModule): in_scope_only = True - def setup(self): + async def setup(self): self.scanned_hosts = set() return True - def handle_event(self, event): + async def handle_event(self, event): parsed_host = event.parsed host = f"{parsed_host.scheme}://{parsed_host.netloc}/" host_hash = hash(host) @@ -32,7 +32,7 @@ def handle_event(self, event): result = None url = f"{host}robots.txt" - result = self.helpers.request(url) + result = await self.helpers.request(url) if result: body = result.text diff --git a/bbot/modules/secretsdb.py b/bbot/modules/secretsdb.py index 42ed0445f3..db74f7acc3 100644 --- a/bbot/modules/secretsdb.py +++ b/bbot/modules/secretsdb.py @@ -19,10 +19,10 @@ class secretsdb(BaseModule): } deps_pip = ["pyyaml~=6.0"] - def setup(self): + async def setup(self): self.rules = [] self.min_confidence = self.config.get("min_confidence", 99) - self.sig_file = self.helpers.wordlist(self.config.get("signatures", "")) + self.sig_file = await self.helpers.wordlist(self.config.get("signatures", "")) with open(self.sig_file) as f: rules_yaml = yaml.safe_load(f).get("patterns", []) for r in rules_yaml: @@ -41,7 +41,7 @@ def setup(self): self.debug(f"Error compiling regex: r'{regex}'") return True - def handle_event(self, event): + async def handle_event(self, event): resp_body = event.data.get("body", "") resp_headers = event.data.get("raw_header", "") for r in self.rules: diff --git a/bbot/modules/subdomain_hijack.py b/bbot/modules/subdomain_hijack.py index cfcc441139..201e8b4a36 100644 --- a/bbot/modules/subdomain_hijack.py +++ 
b/bbot/modules/subdomain_hijack.py @@ -1,6 +1,6 @@ import re import json -import requests +import httpx from bbot.modules.base import BaseModule from bbot.core.helpers.misc import tldextract @@ -18,9 +18,9 @@ class subdomain_hijack(BaseModule): scope_distance_modifier = 3 max_event_handlers = 5 - def setup(self): + async def setup(self): fingerprints_url = self.config.get("fingerprints") - fingerprints_file = self.helpers.wordlist(fingerprints_url) + fingerprints_file = await self.helpers.wordlist(fingerprints_url) with open(fingerprints_file) as f: fingerprints = json.load(f) self.fingerprints = [] @@ -40,8 +40,8 @@ def setup(self): self.debug(f"Successfully processed {len(self.fingerprints):,} fingerprints") return True - def handle_event(self, event): - hijackable, reason = self.check_subdomain(event) + async def handle_event(self, event): + hijackable, reason = await self.check_subdomain(event) if hijackable: source_hosts = [] e = event @@ -66,7 +66,7 @@ def handle_event(self, event): else: self.debug(reason) - def check_subdomain(self, event): + async def check_subdomain(self, event): for f in self.fingerprints: for domain in f.domains: self_matches = self.helpers.host_in_host(event.data, domain) @@ -81,25 +81,25 @@ def check_subdomain(self, event): return False, "Scan cancelled" # first, try base request url = f"{scheme}://{event.data}" - match, reason = self._verify_fingerprint(f, url, cache_for=60 * 60 * 24) + match, reason = await self._verify_fingerprint(f, url, cache_for=60 * 60 * 24) if match: return match, reason # next, try subdomain -[CNAME]-> other_domain url = f"{scheme}://{domain}" headers = {"Host": event.data} - match, reason = self._verify_fingerprint(f, url, headers=headers) + match, reason = await self._verify_fingerprint(f, url, headers=headers) if match: return match, reason return False, f'Subdomain "{event.data}" not hijackable' - def _verify_fingerprint(self, fingerprint, *args, **kwargs): + async def _verify_fingerprint(self, fingerprint, *args, **kwargs): kwargs["raise_error"] = True kwargs["timeout"] = 10 kwargs["retries"] = 0 if fingerprint.http_status is not None: kwargs["allow_redirects"] = False try: - r = self.helpers.request(*args, **kwargs) + r = await self.helpers.request(*args, **kwargs) if fingerprint.http_status is not None and r.status_code == fingerprint.http_status: return True, f"HTTP status == {fingerprint.http_status}" text = getattr(r, "text", "") @@ -109,7 +109,7 @@ def _verify_fingerprint(self, fingerprint, *args, **kwargs): and fingerprint.fingerprint_regex.findall(text) ): return True, "Fingerprint match" - except requests.exceptions.RequestException as e: + except httpx.RequestError as e: if fingerprint.nxdomain and "Name or service not known" in str(e): return True, f"NXDOMAIN" return False, "No match" diff --git a/bbot/modules/telerik.py b/bbot/modules/telerik.py index 2465ae875e..5166e45b73 100644 --- a/bbot/modules/telerik.py +++ b/bbot/modules/telerik.py @@ -1,6 +1,8 @@ -from bbot.modules.base import BaseModule -from urllib.parse import urlparse +import asyncio from sys import executable +from urllib.parse import urlparse + +from bbot.modules.base import BaseModule class telerik(BaseModule): @@ -156,12 +158,12 @@ class telerik(BaseModule): max_event_handlers = 5 - def setup(self): + async def setup(self): self.scanned_hosts = set() self.timeout = self.scan.config.get("httpx_timeout", 5) return True - def handle_event(self, event): + async def handle_event(self, event): host = f"{event.parsed.scheme}://{event.parsed.netloc}/" 
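        # hash the scheme://netloc base URL so each host is only probed once per scan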
host_hash = hash(host) if host_hash in self.scanned_hosts: @@ -171,7 +173,7 @@ def handle_event(self, event): self.scanned_hosts.add(host_hash) webresource = "Telerik.Web.UI.WebResource.axd?type=rau" - result = self.test_detector(event.data, webresource) + result, _ = await self.test_detector(event.data, webresource) if result: if "RadAsyncUpload handler is registered succesfully" in result.text: self.debug(f"Detected Telerik instance (Telerik.Web.UI.WebResource.axd?type=rau)") @@ -198,7 +200,7 @@ def handle_event(self, event): str(root_tool_path / "testfile.txt"), result.url, ] - output = self.helpers.run(command) + output = await self.helpers.run(command) description = f"[CVE-2017-11317] [{str(version)}] {webresource}" if "fileInfo" in output.stdout: self.debug(f"Confirmed Vulnerable Telerik (version: {str(version)}") @@ -214,15 +216,16 @@ def handle_event(self, event): ) break - futures = {} + tasks = [] for dh in self.DialogHandlerUrls: - future = self.submit_task(self.test_detector, event.data, f"{dh}?dp=1") - futures[future] = dh + tasks.append(self.helpers.create_task(self.test_detector(event.data, f"{dh}?dp=1"))) fail_count = 0 - for future in self.helpers.as_completed(futures): - dh = futures[future] - result = future.result() + for task in self.helpers.as_completed(tasks): + try: + result, dh = await task + except asyncio.CancelledError: + continue # cancel if we run into timeouts etc. if result is None: @@ -232,14 +235,11 @@ def handle_event(self, event): if fail_count < 2: continue self.debug(f"Cancelling run against {event.data} due to failed request") - for future in futures: - future.cancel() + self.helpers.cancel_tasks(tasks) break - if result: + else: if "Cannot deserialize dialog parameters" in result.text: - for future in futures: - future.cancel() - + self.helpers.cancel_tasks(tasks) self.debug(f"Detected Telerik UI instance ({dh})") description = f"Telerik DialogHandler detected" self.emit_event( @@ -247,16 +247,18 @@ def handle_event(self, event): "FINDING", event, ) - # Once we have a match we need to stop, because the basic handler (Telerik.Web.UI.DialogHandler.aspx) usually works with a path wildcard - break + # Once we have a match we need to stop, because the basic handler (Telerik.Web.UI.DialogHandler.aspx) usually works with a path wildcard + break + + self.helpers.cancel_tasks(tasks) spellcheckhandler = "Telerik.Web.UI.SpellCheckHandler.axd" - result = self.test_detector(event.data, spellcheckhandler) + result, _ = await self.test_detector(event.data, spellcheckhandler) try: # The standard behavior for the spellcheck handler without parameters is a 500 if result.status_code == 500: # Sometimes webapps will just return 500 for everything, so rule out the false positive - validate_result = self.test_detector(event.data, self.helpers.rand_string()) + validate_result, _ = await self.test_detector(event.data, self.helpers.rand_string()) self.debug(validate_result) if validate_result.status_code != 500: self.debug(f"Detected Telerik UI instance (Telerik.Web.UI.SpellCheckHandler.axd)") @@ -273,16 +275,16 @@ def handle_event(self, event): except Exception: pass - def test_detector(self, baseurl, detector): + async def test_detector(self, baseurl, detector): result = None if "/" != baseurl[-1]: url = f"{baseurl}/{detector}" else: url = f"{baseurl}{detector}" - result = self.helpers.request(url, timeout=self.timeout) - return result + result = await self.helpers.request(url, timeout=self.timeout) + return result, detector - def filter_event(self, event): + async def 
filter_event(self, event): if "endpoint" in event.tags: return False else: diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 65a123f3e4..377b690f32 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -182,9 +182,10 @@ async def _emit_event(self, event, *args, **kwargs): await self.scan.helpers.dns.handle_wildcard_event(event, dns_children) # now that the event is properly tagged, we can finally make decisions about it + abort_result = False if callable(abort_if): async with self.scan.acatch(context=abort_if): - abort_result = await self.helpers.execute_sync_or_async(abort_if, event) + abort_result = await self.scan.helpers.execute_sync_or_async(abort_if, event) msg = f"{event.module}: not raising event {event} due to custom criteria in abort_if()" with suppress(ValueError, TypeError): abort_result, reason = abort_result @@ -430,6 +431,17 @@ async def modules_status(self, _log=False): else: self.scan.info(f"{self.scan.name}: No events in queue") + if self.scan.log_level <= logging.DEBUG: + # log module memory usage + module_memory_usage = [] + for module in self.scan.modules.values(): + memory_usage = module.memory_usage + module_memory_usage.append((module.name, memory_usage)) + module_memory_usage.sort(key=lambda x: x[-1], reverse=True) + self.scan.debug(f"MODULE MEMORY USAGE:") + for module_name, usage in module_memory_usage: + self.scan.debug(f" - {module_name}: {self.scan.helpers.bytes_to_human(usage)}") + # Uncomment these lines to enable debugging of event queues # queued_events = self.incoming_event_queue.events diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index 80aae3e62b..c43f702a15 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -162,6 +162,9 @@ def __init__( self._cleanedup = False self._loop = asyncio.get_event_loop() + self.manager_worker_loop_tasks = [] + self.init_events_task = None + self.ticker_task = None def _on_keyboard_interrupt(self, loop, event): self.stop() @@ -182,7 +185,7 @@ async def prep(self): start_msg += f" ({', '.join(details)})" self.hugeinfo(start_msg) - self.load_modules() + await self.load_modules() self.info(f"Setting up modules...") await self.setup_modules() @@ -203,7 +206,7 @@ async def start(self): self.warning(f"No scan targets specified") # start status ticker - ticker_task = asyncio.create_task(self._status_ticker(self.status_frequency)) + self.ticker_task = asyncio.create_task(self._status_ticker(self.status_frequency)) scan_start_time = datetime.now() try: @@ -219,12 +222,12 @@ async def start(self): self.dispatcher.on_start(self) # start manager worker loops - manager_worker_loop_tasks = [ + self.manager_worker_loop_tasks = [ asyncio.create_task(self.manager._worker_loop()) for _ in range(self.max_workers) ] # distribute seed events - init_events_task = asyncio.create_task(self.manager.init_events()) + self.init_events_task = asyncio.create_task(self.manager.init_events()) self.status = "RUNNING" self.start_modules() @@ -271,10 +274,7 @@ async def start(self): self.critical(f"Unexpected error during scan:\n{traceback.format_exc()}") finally: - init_events_task.cancel() - with contextlib.suppress(asyncio.CancelledError): - await init_events_task - + await self.cancel_tasks() await self.report() await self.cleanup() @@ -288,15 +288,6 @@ async def start(self): else: self.status = "FINISHED" - ticker_task.cancel() - with contextlib.suppress(asyncio.CancelledError): - await ticker_task - - for t in manager_worker_loop_tasks: - t.cancel() - with 
contextlib.suppress(asyncio.CancelledError): - await t - scan_run_time = datetime.now() - scan_start_time scan_run_time = self.helpers.human_timedelta(scan_run_time) log_fn(f"Scan {self.name} completed in {scan_run_time} with status {self.status}") @@ -309,7 +300,7 @@ def start_modules(self): module.start() async def setup_modules(self, remove_failed=True): - self.load_modules() + await self.load_modules() self.verbose(f"Setting up modules") hard_failed = [] soft_failed = [] @@ -376,6 +367,24 @@ def drain_queues(self): self.manager.incoming_event_queue.get_nowait() self.debug("Finished draining queues") + async def cancel_tasks(self): + tasks = [] + # module workers + for m in self.modules.values(): + tasks += getattr(m, "_tasks", []) + # init events + if self.init_events_task: + tasks.append(self.init_events_task) + # ticker + if self.ticker_task: + tasks.append(self.ticker_task) + # manager worker loops + tasks += self.manager_worker_loop_tasks + for t in tasks: + t.cancel() + with contextlib.suppress(asyncio.CancelledError): + await t + async def report(self): for mod in self.modules.values(): async with self.acatch(context=mod.report): @@ -540,7 +549,7 @@ def _internal_modules(self): if self.config.get(modname, True): yield modname - def load_modules(self): + async def load_modules(self): if not self._modules_loaded: all_modules = list(set(self._scan_modules + self._output_modules + self._internal_modules)) if not all_modules: @@ -551,7 +560,7 @@ def load_modules(self): self.warning(f"No scan modules to load") # install module dependencies - succeeded, failed = self.helpers.depsinstaller.install( + succeeded, failed = await self.helpers.depsinstaller.install( *self._scan_modules, *self._output_modules, *self._internal_modules ) if failed: diff --git a/bbot/test/helpers.py b/bbot/test/helpers.py index 4654c036ca..fd457795b8 100644 --- a/bbot/test/helpers.py +++ b/bbot/test/helpers.py @@ -1,5 +1,4 @@ import logging -import requests_mock from abc import abstractmethod from omegaconf import OmegaConf @@ -13,11 +12,13 @@ class MockHelper: config_overrides = {} additional_modules = [] - def __init__(self, config, bbot_scanner, *args, **kwargs): + def __init__(self, request, **kwargs): self.name = kwargs.get("module_name", self.__class__.__name__.lower()) - self.config = OmegaConf.merge(config, OmegaConf.create(self.config_overrides)) + self.bbot_config = request.getfixturevalue("bbot_config") + self.bbot_scanner = request.getfixturevalue("bbot_scanner") + self.config = OmegaConf.merge(self.bbot_config, OmegaConf.create(self.config_overrides)) modules = [self.name] + self.additional_modules - self.scan = bbot_scanner( + self.scan = self.bbot_scanner( *self.targets, modules=modules, name=f"{self.name}_test", @@ -25,8 +26,6 @@ def __init__(self, config, bbot_scanner, *args, **kwargs): whitelist=self.whitelist, blacklist=self.blacklist, ) - self.patch_scan(self.scan) - self.setup() def patch_scan(self, scan): return @@ -34,10 +33,13 @@ def patch_scan(self, scan): def setup(self): pass - def run(self): - events = list(self.scan.start()) - events = [e for e in events if e.module == self.module] - assert self.check_events(events) + async def run(self): + await self.scan.prep() + self.setup() + self.patch_scan(self.scan) + self._after_scan_prep() + events = [e async for e in self.scan.start()] + self.check_events(events) @abstractmethod def check_events(self, events): @@ -47,29 +49,29 @@ def check_events(self, events): def module(self): return self.scan.modules[self.name] + def 
_after_scan_prep(self): + pass + class RequestMockHelper(MockHelper): + def __init__(self, request, **kwargs): + self.httpx_mock = request.getfixturevalue("httpx_mock") + super().__init__(request, **kwargs) + @abstractmethod def mock_args(self): raise NotImplementedError - def register_uri(self, uri, method="GET", **kwargs): - self.m.register_uri(method, uri, **kwargs) - - def run(self): - with requests_mock.Mocker() as m: - self.m = m - self.mock_args() - return super().run() + def _after_scan_prep(self): + self.mock_args() class HttpxMockHelper(MockHelper): targets = ["http://127.0.0.1:8888/"] - def __init__(self, config, bbot_scanner, bbot_httpserver, *args, **kwargs): - self.bbot_httpserver = bbot_httpserver - super().__init__(config, bbot_scanner, *args, **kwargs) - self.mock_args() + def __init__(self, request, **kwargs): + self.bbot_httpserver = request.getfixturevalue("bbot_httpserver") + super().__init__(request, **kwargs) @abstractmethod def mock_args(self): @@ -80,6 +82,9 @@ def set_expect_requests(self, expect_args={}, respond_args={}): expect_args["uri"] = "/" self.bbot_httpserver.expect_request(**expect_args).respond_with_data(**respond_args) + def _after_scan_prep(self): + self.mock_args() + def tempwordlist(content): tmp_path = "/tmp/.bbot_test/" diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py index c1bf5bf552..f763318bca 100644 --- a/bbot/test/modules_test_classes.py +++ b/bbot/test/modules_test_classes.py @@ -8,22 +8,30 @@ class Httpx(HttpxMockHelper): + targets = ["http://127.0.0.1:8888/url", "127.0.0.1:8888"] + def mock_args(self): - request_args = dict(headers={"test": "header"}) - respond_args = dict(response_data=json.dumps({"foo": "bar"})) + request_args = dict(uri="/", headers={"test": "header"}) + respond_args = dict(response_data=json.dumps({"open": "port"})) + self.set_expect_requests(request_args, respond_args) + request_args = dict(uri="/url", headers={"test": "header"}) + respond_args = dict(response_data=json.dumps({"url": "url"})) self.set_expect_requests(request_args, respond_args) - - async def run(self): - events = [e async for e in self.scan.start()] - assert self.check_events(events) def check_events(self, events): + url = False + open_port = False for e in events: if e.type == "HTTP_RESPONSE": j = json.loads(e.data["body"]) - if j.get("foo", "") == "bar": - return True - return False + if e.data["path"] == "/": + if j.get("open", "") == "port": + open_port = True + elif e.data["path"] == "/url": + if j.get("url", "") == "url": + url = True + assert url, "Failed to visit target URL" + assert open_port, "Failed to visit target OPEN_TCP_PORT" class Gowitness(HttpxMockHelper): @@ -63,7 +71,6 @@ def check_events(self, events): assert url, "No URL emitted" assert webscreenshot, "No WEBSCREENSHOT emitted" assert technology, "No TECHNOLOGY emitted" - return True class Excavate(HttpxMockHelper): @@ -158,7 +165,6 @@ def check_events(self, events): and "spider-danger" in e.tags for e in events ) - return True class Excavate_relativelinks(HttpxMockHelper): @@ -206,14 +212,10 @@ def check_events(self, events): if e.data == "http://127.0.0.1:8888/subdir/rootrelative.html": root_page_confusion_2 = True - if ( - root_relative_detection - and page_relative_detection - and not root_page_confusion_1 - and not root_page_confusion_2 - ): - return True - return False + assert root_relative_detection, "Failed to properly excavate root-relative URL" + assert page_relative_detection, "Failed to properly excavate page-relative URL" + assert 
not root_page_confusion_1, "Incorrectly detected page-relative URL" + assert not root_page_confusion_2, "Incorrectly detected root-relative URL" class Subdomain_Hijack(HttpxMockHelper): @@ -229,15 +231,13 @@ def mock_args(self): self.set_expect_requests(respond_args=respond_args) def check_events(self, events): - for event in events: - if ( - event.type == "FINDING" - and event.data["description"].startswith("Hijackable Subdomain") - and self.rand_subdomain in event.data["description"] - and event.data["host"] == self.rand_subdomain - ): - return True - return False, f"No hijackable subdomains in {events}" + assert any( + event.type == "FINDING" + and event.data["description"].startswith("Hijackable Subdomain") + and self.rand_subdomain in event.data["description"] + and event.data["host"] == self.rand_subdomain + for event in events + ), f"No hijackable subdomains in {events}" class Fingerprintx(HttpxMockHelper): @@ -247,22 +247,20 @@ def mock_args(self): pass def check_events(self, events): - for event in events: - if ( - event.type == "PROTOCOL" - and event.host == self.scan.helpers.make_ip_type("127.0.0.1") - and event.port == 8888 - and event.data["protocol"] == "HTTP" - ): - return True - return False + assert any( + event.type == "PROTOCOL" + and event.host == self.scan.helpers.make_ip_type("127.0.0.1") + and event.port == 8888 + and event.data["protocol"] == "HTTP" + for event in events + ), "HTTP protocol not detected" class Otx(RequestMockHelper): def mock_args(self): for t in self.targets: - self.register_uri( - f"https://otx.alienvault.com/api/v1/indicators/domain/{t}/passive_dns", + self.httpx_mock.add_response( + url=f"https://otx.alienvault.com/api/v1/indicators/domain/{t}/passive_dns", json={ "passive_dns": [ { @@ -282,10 +280,7 @@ def mock_args(self): ) def check_events(self, events): - for e in events: - if e.data == "asdf.blacklanternsecurity.com": - return True - return False + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" class Anubisdb(RequestMockHelper): @@ -294,16 +289,13 @@ def setup(self): def mock_args(self): for t in self.targets: - self.register_uri( - f"https://jldc.me/anubis/subdomains/{t}", + self.httpx_mock.add_response( + url=f"https://jldc.me/anubis/subdomains/{t}", json=["asdf.blacklanternsecurity.com", "zzzz.blacklanternsecurity.com"], ) def check_events(self, events): - for e in events: - if e.data == "asdf.blacklanternsecurity.com": - return True - return False + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" class SecretsDB(HttpxMockHelper): @@ -315,7 +307,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - return any(e.type == "FINDING" for e in events) + assert any(e.type == "FINDING" for e in events) class Badsecrets(HttpxMockHelper): @@ -421,9 +413,10 @@ def check_events(self, events): ): CookieBasedDetection_2 = True - if SecretFound and IdentifyOnly and CookieBasedDetection and CookieBasedDetection_2: - return True - return False + assert SecretFound, "No secret found" + assert IdentifyOnly, "No crypto product identified" + assert CookieBasedDetection, "No JWT cookie detected" + assert CookieBasedDetection_2, "No Express.js cookie detected" class Telerik(HttpxMockHelper): @@ -491,18 +484,14 @@ def check_events(self, events): telerik_spellcheck_detection = True continue - if ( - telerik_axd_detection - and telerik_axd_vulnerable - and 
telerik_spellcheck_detection - and telerik_dialoghandler_detection - ): - return True - return False + assert telerik_axd_detection, "Telerik AXD detection failed" + assert telerik_axd_vulnerable, "Telerik vulnerable AXD detection failed" + assert telerik_spellcheck_detection, "Telerik spellcheck detection failed" + assert telerik_dialoghandler_detection, "Telerik dialoghandler detection failed" -class Paramminer_getparams(HttpxMockHelper): - getparam_body = """ +class Paramminer_headers(HttpxMockHelper): + headers_body = """ the title @@ -511,7 +500,7 @@ class Paramminer_getparams(HttpxMockHelper): """ - getparam_body_match = """ + headers_body_match = """ the title @@ -521,7 +510,7 @@ class Paramminer_getparams(HttpxMockHelper): """ additional_modules = ["httpx"] - config_overrides = {"modules": {"paramminer_getparams": {"wordlist": tempwordlist(["canary", "id"])}}} + config_overrides = {"modules": {"paramminer_headers": {"wordlist": tempwordlist(["junkword1", "tracestate"])}}} def setup(self): from bbot.core.helpers import helper @@ -530,22 +519,26 @@ def setup(self): helper.HttpCompare.gen_cache_buster = lambda *args, **kwargs: {"AAAAAA": "1"} def mock_args(self): - expect_args = {"query_string": b"id=AAAAAAAAAAAAAA&AAAAAA=1"} - respond_args = {"response_data": self.getparam_body_match} + expect_args = dict(headers={"tracestate": "AAAAAAAAAAAAAA"}) + respond_args = {"response_data": self.headers_body_match} self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - respond_args = {"response_data": self.getparam_body} + respond_args = {"response_data": self.headers_body} self.set_expect_requests(respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [id] Reasons: [body]": - return True - return False + assert any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [tracestate] Reasons: [body]" + for e in events + ) + assert not any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [junkword1] Reasons: [body]" + for e in events + ) -class Paramminer_headers(HttpxMockHelper): - headers_body = """ +class Paramminer_getparams(HttpxMockHelper): + getparam_body = """ the title @@ -554,7 +547,7 @@ class Paramminer_headers(HttpxMockHelper): """ - headers_body_match = """ + getparam_body_match = """ the title @@ -564,7 +557,7 @@ class Paramminer_headers(HttpxMockHelper): """ additional_modules = ["httpx"] - config_overrides = {"modules": {"paramminer_headers": {"wordlist": tempwordlist(["junkword1", "tracestate"])}}} + config_overrides = {"modules": {"paramminer_getparams": {"wordlist": tempwordlist(["canary", "id"])}}} def setup(self): from bbot.core.helpers import helper @@ -573,18 +566,22 @@ def setup(self): helper.HttpCompare.gen_cache_buster = lambda *args, **kwargs: {"AAAAAA": "1"} def mock_args(self): - expect_args = dict(headers={"tracestate": "AAAAAAAAAAAAAA"}) - respond_args = {"response_data": self.headers_body_match} + expect_args = {"query_string": b"id=AAAAAAAAAAAAAA&AAAAAA=1"} + respond_args = {"response_data": self.getparam_body_match} self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - respond_args = {"response_data": self.headers_body} + respond_args = {"response_data": self.getparam_body} self.set_expect_requests(respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [tracestate] Reasons: 
[body]": - return True - return False + assert any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [id] Reasons: [body]" + for e in events + ) + assert not any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [canary] Reasons: [body]" + for e in events + ) class Paramminer_cookies(HttpxMockHelper): @@ -624,16 +621,20 @@ def mock_args(self): self.set_expect_requests(respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [admincookie] Reasons: [body]": - return True - return False + assert any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [admincookie] Reasons: [body]" + for e in events + ) + assert not any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [junkcookie] Reasons: [body]" + for e in events + ) class LeakIX(RequestMockHelper): def mock_args(self): - self.register_uri( - "https://leakix.net/api/subdomains/blacklanternsecurity.com", + self.httpx_mock.add_response( + url="https://leakix.net/api/subdomains/blacklanternsecurity.com", json=[ { "subdomain": "www.blacklanternsecurity.com", @@ -652,32 +653,33 @@ def check_events(self, events): www = False asdf = False for e in events: - if e.type in ("DNS_NAME", "DNS_NAME_UNRESOLVED"): + if e.type in ("DNS_NAME", "DNS_NAME_UNRESOLVED") and str(e.module) == "leakix": if e.data == "www.blacklanternsecurity.com": www = True elif e.data == "asdf.blacklanternsecurity.com": asdf = True - return www and asdf + assert www + assert asdf -class Massdns(MockHelper): +class Massdns(RequestMockHelper): subdomain_wordlist = tempwordlist(["www", "asdf"]) config_overrides = {"modules": {"massdns": {"wordlist": str(subdomain_wordlist)}}} - def __init__(self, *args, **kwargs): - with requests_mock.Mocker() as m: - m.register_uri( - "GET", - "https://raw.githubusercontent.com/blacklanternsecurity/public-dns-servers/master/nameservers.txt", - text="8.8.8.8\n8.8.4.4\n1.1.1.1", - ) - super().__init__(*args, **kwargs) + def __init__(self, request): + super().__init__(request) + self.httpx_mock.add_response( + url="https://raw.githubusercontent.com/blacklanternsecurity/public-dns-servers/master/nameservers.txt", + text="8.8.8.8\n8.8.4.4\n1.1.1.1", + ) + + def mock_args(self): + pass def check_events(self, events): - for e in events: - if e.type in ("DNS_NAME", "DNS_NAME_UNRESOLVED") and e.data == "www.blacklanternsecurity.com": - return True - return False + assert any( + e.type in ("DNS_NAME", "DNS_NAME_UNRESOLVED") and e.data == "www.blacklanternsecurity.com" for e in events + ) class Robots(HttpxMockHelper): @@ -700,7 +702,8 @@ def check_events(self, events): for e in events: if e.type == "URL_UNVERIFIED": - assert "spider-danger" in e.tags, f"{e} doesn't have spider-danger tag" + if str(e.module) != "TARGET": + assert "spider-danger" in e.tags, f"{e} doesn't have spider-danger tag" if e.data == "http://127.0.0.1:8888/allow/": allow_bool = True @@ -713,9 +716,10 @@ def check_events(self, events): if re.match(r"http://127\.0\.0\.1:8888/\w+/wildcard\.txt", e.data): wildcard_bool = True - if allow_bool and disallow_bool and sitemap_bool and wildcard_bool: - return True - return False + assert allow_bool + assert disallow_bool + assert sitemap_bool + assert wildcard_bool class Masscan(MockHelper): @@ -734,13 +738,12 @@ class Masscan(MockHelper): ports = range = 9.8.7.6""" - def __init__(self, config, bbot_scanner, *args, **kwargs): - super().__init__(config, 
bbot_scanner, *args, **kwargs) + def _after_scan_prep(self): self.scan.modules["masscan"].masscan_config = self.masscan_config - def setup_scan_2(): - config2 = OmegaConf.merge(config, OmegaConf.create(self.config_overrides_2)) - self.scan2 = bbot_scanner( + async def setup_scan_2(): + config2 = OmegaConf.merge(self.config, OmegaConf.create(self.config_overrides_2)) + self.scan2 = self.bbot_scanner( *self.targets, modules=[self.name] + self.additional_modules, name=f"{self.name}_test", @@ -749,35 +752,37 @@ def setup_scan_2(): blacklist=self.blacklist, ) self.patch_scan(self.scan2) - self.scan2.prep() + await self.scan2.prep() self.scan2.modules["masscan"].masscan_config = self.masscan_config self.setup_scan_2 = setup_scan_2 self.masscan_run = False - def run_masscan(self, command, *args, **kwargs): - if "masscan" in command[0]: - yield from self.masscan_output.splitlines() + async def run_masscan(self, command, *args, **kwargs): + log.critical(f"patched: {command}") + if "masscan" in command[:2]: + for l in self.masscan_output.splitlines(): + yield l self.masscan_run = True else: - yield from self.scan.helpers.run_live(command, *args, **kwargs) + async for l in self.scan.helpers.run_live(command, *args, **kwargs): + yield l def patch_scan(self, scan): scan.helpers.run_live = self.run_masscan - def run(self): - super().run() - self.setup_scan_2() + async def run(self): + await super().run() assert self.masscan_run == True, "masscan didn't run when it was supposed to" + await self.setup_scan_2() self.masscan_run = False - events = list(self.scan2.start()) + events = [e async for e in self.scan2.start()] self.check_events(events) assert self.masscan_run == False, "masscan ran when it wasn't supposed to" def check_events(self, events): assert any(e.type == "IP_ADDRESS" and e.data == "8.8.8.8" for e in events), "No IP_ADDRESS emitted" assert any(e.type == "OPEN_TCP_PORT" and e.data == "8.8.8.8:443" for e in events), "No OPEN_TCP_PORT emitted" - return True class Buckets(HttpxMockHelper, RequestMockHelper): diff --git a/bbot/test/test_step_1/test_modules_full.py b/bbot/test/test_step_1/test_modules_full.py index 8d1f58204b..3dea25d310 100644 --- a/bbot/test/test_step_1/test_modules_full.py +++ b/bbot/test/test_step_1/test_modules_full.py @@ -6,192 +6,229 @@ log = logging.getLogger(f"bbot.test") -def test_gowitness(bbot_config, bbot_scanner, bbot_httpserver): - x = Gowitness(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_httpx(request): + x = Httpx(request) + await x.run() @pytest.mark.asyncio -async def test_httpx(bbot_config, bbot_scanner, bbot_httpserver): - x = Httpx(bbot_config, bbot_scanner, bbot_httpserver) +async def test_gowitness(request): + x = Gowitness(request) await x.run() -def test_excavate(bbot_config, bbot_scanner, bbot_httpserver): - x = Excavate(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_excavate(request): + x = Excavate(request) + await x.run() -def test_excavate_relativelinks(bbot_config, bbot_scanner, bbot_httpserver): - x = Excavate_relativelinks(bbot_config, bbot_scanner, bbot_httpserver, module_name="excavate") - x.run() +@pytest.mark.asyncio +async def test_excavate_relativelinks(request): + x = Excavate_relativelinks(request, module_name="excavate") + await x.run() -def test_subdomain_hijack(bbot_config, bbot_scanner, bbot_httpserver): - x = Subdomain_Hijack(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_subdomain_hijack(request): 
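    # the helper now resolves its own fixtures (bbot_config, bbot_scanner, bbot_httpserver) from pytest's built-in `request` object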
+ x = Subdomain_Hijack(request) + await x.run() -def test_fingerprintx(bbot_config, bbot_scanner, bbot_httpserver): - x = Fingerprintx(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_fingerprintx(request): + x = Fingerprintx(request) + await x.run() -def test_otx(bbot_config, bbot_scanner, bbot_httpserver): - x = Otx(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_otx(request): + x = Otx(request) + await x.run() -def test_anubisdb(bbot_config, bbot_scanner, bbot_httpserver): - x = Anubisdb(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_anubisdb(request): + x = Anubisdb(request) + await x.run() -def test_paramminer_getparams(bbot_config, bbot_scanner, bbot_httpserver): - x = Paramminer_getparams(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_secretsdb(request): + x = SecretsDB(request) + await x.run() -def test_paramminer_headers(bbot_config, bbot_scanner, bbot_httpserver): - x = Paramminer_headers(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_badsecrets(request): + x = Badsecrets(request) + await x.run() -def test_paramminer_cookies(bbot_config, bbot_scanner, bbot_httpserver): - x = Paramminer_cookies(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_telerik(request): + x = Telerik(request) + await x.run() -def test_telerik(bbot_config, bbot_scanner, bbot_httpserver): - x = Telerik(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_paramminer_headers(request): + x = Paramminer_headers(request) + await x.run() -def test_leakix(bbot_config, bbot_scanner, bbot_httpserver): - x = LeakIX(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_paramminer_getparams(request): + x = Paramminer_getparams(request) + await x.run() -def test_massdns(bbot_config, bbot_scanner, bbot_httpserver): - x = Massdns(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_paramminer_cookies(request): + x = Paramminer_cookies(request) + await x.run() -def test_masscan(bbot_config, bbot_scanner, bbot_httpserver): - x = Masscan(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_leakix(request): + x = LeakIX(request) + await x.run() -def test_secretsdb(bbot_config, bbot_scanner, bbot_httpserver): - x = SecretsDB(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_massdns(request): + x = Massdns(request) + await x.run() -def test_badsecrets(bbot_config, bbot_scanner, bbot_httpserver): - x = Badsecrets(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_masscan(request): + x = Masscan(request) + await x.run() -def test_robots(bbot_config, bbot_scanner, bbot_httpserver): - x = Robots(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_robots(request): + x = Robots(request) + await x.run() -def test_buckets(bbot_config, bbot_scanner, bbot_httpserver): - x = Buckets(bbot_config, bbot_scanner, bbot_httpserver, module_name="excavate") - x.run() +@pytest.mark.asyncio +async def test_buckets(request): + x = Buckets(request, module_name="excavate") + await x.run() -def test_asn(bbot_config, bbot_scanner, bbot_httpserver): - x = ASN(bbot_config, bbot_scanner, bbot_httpserver) - x.run() 
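# Every migrated test below follows the same shape: mark the test async for
# pytest-asyncio, build the helper from pytest's `request` fixture, and await
# run(). A minimal sketch of the pattern (ExampleHelper and its module name are
# hypothetical stand-ins, not part of this patch):
@pytest.mark.asyncio
async def test_example_pattern(request):
    x = ExampleHelper(request, module_name="example")  # fixtures resolved internally via request.getfixturevalue()
    await x.run()  # preps the scan, applies mocks, starts it, then asserts inside check_events()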
+@pytest.mark.asyncio +async def test_asn(request): + x = ASN(request) + await x.run() -def test_wafw00f(bbot_config, bbot_scanner, bbot_httpserver): - x = Wafw00f(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_wafw00f(request): + x = Wafw00f(request) + await x.run() -def test_ffuf(bbot_config, bbot_scanner, bbot_httpserver): - x = Ffuf(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_ffuf(request): + x = Ffuf(request) + await x.run() -def test_ffuf_extensions(bbot_config, bbot_scanner, bbot_httpserver): - x = Ffuf_extensions(bbot_config, bbot_scanner, bbot_httpserver, module_name="ffuf") - x.run() +@pytest.mark.asyncio +async def test_ffuf_extensions(request): + x = Ffuf_extensions(request, module_name="ffuf") + await x.run() -def test_bypass403(bbot_config, bbot_scanner, bbot_httpserver): - x = Bypass403(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_bypass403(request): + x = Bypass403(request) + await x.run() -def test_bypass403_waf(bbot_config, bbot_scanner, bbot_httpserver): - x = Bypass403_waf(bbot_config, bbot_scanner, bbot_httpserver, module_name="bypass403") - x.run() +@pytest.mark.asyncio +async def test_bypass403_waf(request): + x = Bypass403_waf(request, module_name="bypass403") + await x.run() -def test_bypass403_aspnetcookieless(bbot_config, bbot_scanner, bbot_httpserver): - x = Bypass403_aspnetcookieless(bbot_config, bbot_scanner, bbot_httpserver, module_name="bypass403") - x.run() +@pytest.mark.asyncio +async def test_bypass403_aspnetcookieless(request): + x = Bypass403_aspnetcookieless(request, module_name="bypass403") + await x.run() -def test_ffuf_shortnames(bbot_config, bbot_scanner, bbot_httpserver): - x = Ffuf_shortnames(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_ffuf_shortnames(request): + x = Ffuf_shortnames(request) + await x.run() -def test_iis_shortnames(bbot_config, bbot_scanner, bbot_httpserver): - x = Iis_shortnames(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_iis_shortnames(request): + x = Iis_shortnames(request) + await x.run() -def test_nuclei_technology(bbot_config, bbot_scanner, bbot_httpserver, caplog): - x = Nuclei_technology(bbot_config, bbot_scanner, bbot_httpserver, caplog, module_name="nuclei") - x.run() +@pytest.mark.asyncio +async def test_nuclei_technology(request, caplog): + x = Nuclei_technology(request, caplog, module_name="nuclei") + await x.run() -def test_nuclei_manual(bbot_config, bbot_scanner, bbot_httpserver): - x = Nuclei_manual(bbot_config, bbot_scanner, bbot_httpserver, module_name="nuclei") - x.run() +@pytest.mark.asyncio +async def test_nuclei_manual(request): + x = Nuclei_manual(request, module_name="nuclei") + await x.run() -def test_nuclei_severe(bbot_config, bbot_scanner, bbot_httpserver): - x = Nuclei_severe(bbot_config, bbot_scanner, bbot_httpserver, module_name="nuclei") - x.run() +@pytest.mark.asyncio +async def test_nuclei_severe(request): + x = Nuclei_severe(request, module_name="nuclei") + await x.run() -def test_nuclei_budget(bbot_config, bbot_scanner, bbot_httpserver): - x = Nuclei_budget(bbot_config, bbot_scanner, bbot_httpserver, module_name="nuclei") - x.run() +@pytest.mark.asyncio +async def test_nuclei_budget(request): + x = Nuclei_budget(request, module_name="nuclei") + await x.run() -def test_url_manipulation(bbot_config, bbot_scanner, bbot_httpserver): - x = Url_manipulation(bbot_config, 
bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_url_manipulation(request): + x = Url_manipulation(request) + await x.run() -def test_naabu(bbot_config, bbot_scanner, bbot_httpserver): - x = Naabu(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_naabu(request): + x = Naabu(request) + await x.run() -def test_hunt(bbot_config, bbot_scanner, bbot_httpserver): - x = Hunt(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_hunt(request): + x = Hunt(request) + await x.run() -def test_vhost(bbot_config, bbot_scanner, bbot_httpserver): - x = Vhost(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_vhost(request): + x = Vhost(request) + await x.run() -def test_speculate_subdirectories(bbot_config, bbot_scanner, bbot_httpserver): - x = Speculate_subdirectories(bbot_config, bbot_scanner, bbot_httpserver, module_name="speculate") - x.run() +@pytest.mark.asyncio +async def test_speculate_subdirectories(request): + x = Speculate_subdirectories(request, module_name="speculate") + await x.run() -def test_social(bbot_config, bbot_scanner, bbot_httpserver): - x = Social(bbot_config, bbot_scanner, bbot_httpserver) - x.run() +@pytest.mark.asyncio +async def test_social(request): + x = Social(request) + await x.run() diff --git a/bbot/test/test_step_2/test_command.py b/bbot/test/test_step_2/test_command.py index 5f56d248b0..b45039c319 100644 --- a/bbot/test/test_step_2/test_command.py +++ b/bbot/test/test_step_2/test_command.py @@ -1,4 +1,5 @@ from ..bbot_fixtures import * +from subprocess import CalledProcessError @pytest.mark.asyncio @@ -7,10 +8,15 @@ async def test_command(bbot_scanner, bbot_config): # run assert "plumbus\n" == (await scan1.helpers.run(["echo", "plumbus"])).stdout + assert b"plumbus\n" == (await scan1.helpers.run(["echo", "plumbus"], text=False)).stdout result = (await scan1.helpers.run(["cat"], input="some\nrandom\nstdin")).stdout assert result.splitlines() == ["some", "random", "stdin"] + result = (await scan1.helpers.run(["cat"], input=b"some\nrandom\nstdin", text=False)).stdout + assert result.splitlines() == [b"some", b"random", b"stdin"] result = (await scan1.helpers.run(["cat"], input=["some", "random", "stdin"])).stdout assert result.splitlines() == ["some", "random", "stdin"] + result = (await scan1.helpers.run(["cat"], input=[b"some", b"random", b"stdin"], text=False)).stdout + assert result.splitlines() == [b"some", b"random", b"stdin"] # run_live lines = [] @@ -18,6 +24,10 @@ async def test_command(bbot_scanner, bbot_config): lines.append(line) assert lines == ["plumbus"] lines = [] + async for line in scan1.helpers.run_live(["echo", "plumbus"], text=False): + lines.append(line) + assert lines == [b"plumbus"] + lines = [] async for line in scan1.helpers.run_live(["cat"], input="some\nrandom\nstdin"): lines.append(line) assert lines == ["some", "random", "stdin"] @@ -26,6 +36,20 @@ async def test_command(bbot_scanner, bbot_config): lines.append(line) assert lines == ["some", "random", "stdin"] + # test check=True + with pytest.raises(CalledProcessError) as excinfo: + lines = [l async for line in scan1.helpers.run_live(["ls", "/aslkdjflasdkfsd"], check=True)] + assert "No such file or directory" in excinfo.value.stderr + with pytest.raises(CalledProcessError) as excinfo: + lines = [l async for line in scan1.helpers.run_live(["ls", "/aslkdjflasdkfsd"], check=True, text=False)] + assert b"No such file or directory" in 
excinfo.value.stderr + with pytest.raises(CalledProcessError) as excinfo: + await scan1.helpers.run(["ls", "/aslkdjflasdkfsd"], check=True) + assert "No such file or directory" in excinfo.value.stderr + with pytest.raises(CalledProcessError) as excinfo: + await scan1.helpers.run(["ls", "/aslkdjflasdkfsd"], check=True, text=False) + assert b"No such file or directory" in excinfo.value.stderr + # test piping lines = [] async for line in scan1.helpers.run_live( @@ -33,6 +57,12 @@ async def test_command(bbot_scanner, bbot_config): ): lines.append(line) assert lines == ["some", "random", "stdin"] + lines = [] + async for line in scan1.helpers.run_live( + ["cat"], input=scan1.helpers.run_live(["echo", "-en", r"some\nrandom\nstdin"], text=False), text=False + ): + lines.append(line) + assert lines == [b"some", b"random", b"stdin"] # test missing executable result = await scan1.helpers.run(["sgkjlskdfsdf"]) @@ -50,25 +80,25 @@ async def test_command(bbot_scanner, bbot_config): path_parts = os.environ.get("PATH", "").split(":") assert "/tmp/.bbot_test/tools" in path_parts run_lines = (await scan1.helpers.run(["env"])).stdout.splitlines() - assert f"BBOT_PLUMBUS=asdf" in run_lines + assert "BBOT_PLUMBUS=asdf" in run_lines for line in run_lines: if line.startswith("PATH="): path_parts = line.split("=", 1)[-1].split(":") assert "/tmp/.bbot_test/tools" in path_parts run_lines_sudo = (await scan1.helpers.run(["env"], sudo=True)).stdout.splitlines() - assert f"BBOT_PLUMBUS=asdf" in run_lines_sudo + assert "BBOT_PLUMBUS=asdf" in run_lines_sudo for line in run_lines_sudo: if line.startswith("PATH="): path_parts = line.split("=", 1)[-1].split(":") assert "/tmp/.bbot_test/tools" in path_parts run_live_lines = [l async for l in scan1.helpers.run_live(["env"])] - assert f"BBOT_PLUMBUS=asdf" in run_live_lines + assert "BBOT_PLUMBUS=asdf" in run_live_lines for line in run_live_lines: if line.startswith("PATH="): path_parts = line.strip().split("=", 1)[-1].split(":") assert "/tmp/.bbot_test/tools" in path_parts run_live_lines_sudo = [l async for l in scan1.helpers.run_live(["env"], sudo=True)] - assert f"BBOT_PLUMBUS=asdf" in run_live_lines_sudo + assert "BBOT_PLUMBUS=asdf" in run_live_lines_sudo for line in run_live_lines_sudo: if line.startswith("PATH="): path_parts = line.strip().split("=", 1)[-1].split(":") diff --git a/poetry.lock b/poetry.lock index 3141b7e3fc..146a03dd54 100644 --- a/poetry.lock +++ b/poetry.lock @@ -1230,6 +1230,25 @@ files = [ [package.dependencies] Werkzeug = ">=2.0.0" +[[package]] +name = "pytest-httpx" +version = "0.22.0" +description = "Send responses to httpx." 
+category = "dev" +optional = false +python-versions = ">=3.7" +files = [ + {file = "pytest_httpx-0.22.0-py3-none-any.whl", hash = "sha256:cefb7dcf66a4cb0601b0de05e576cca423b6081f3245e7912a4d84c58fa3eae8"}, + {file = "pytest_httpx-0.22.0.tar.gz", hash = "sha256:3a82797f3a9a14d51e8c6b7fa97524b68b847ee801109c062e696b4744f4431c"}, +] + +[package.dependencies] +httpx = ">=0.24.0,<0.25.0" +pytest = ">=6.0,<8.0" + +[package.extras] +testing = ["pytest-asyncio (>=0.20.0,<0.21.0)", "pytest-cov (>=4.0.0,<5.0.0)"] + [[package]] name = "pytest-rerunfailures" version = "11.1.2" @@ -1386,26 +1405,6 @@ files = [ requests = ">=1.0.0" six = "*" -[[package]] -name = "requests-mock" -version = "1.10.0" -description = "Mock out responses from the requests package" -category = "dev" -optional = false -python-versions = "*" -files = [ - {file = "requests-mock-1.10.0.tar.gz", hash = "sha256:59c9c32419a9fb1ae83ec242d98e889c45bd7d7a65d48375cc243ec08441658b"}, - {file = "requests_mock-1.10.0-py2.py3-none-any.whl", hash = "sha256:2fdbb637ad17ee15c06f33d31169e71bf9fe2bdb7bc9da26185be0dd8d842699"}, -] - -[package.dependencies] -requests = ">=2.3,<3" -six = "*" - -[package.extras] -fixture = ["fixtures"] -test = ["fixtures", "mock", "purl", "pytest", "requests-futures", "sphinx", "testrepository (>=0.0.18)", "testtools"] - [[package]] name = "resolvelib" version = "0.8.1" @@ -1705,4 +1704,4 @@ xmltodict = ">=0.12.0,<0.13.0" [metadata] lock-version = "2.0" python-versions = "^3.9" -content-hash = "5366646b07e8aa2c1189f64e976bab2ec624855eb5943bde2710376c8e115305" +content-hash = "e8bc6b97f09142c3d7099d7378d826270a470ee7b454bd39f8c52779d57153cf" diff --git a/pyproject.toml b/pyproject.toml index d8b6f50fc0..fb77583d86 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -35,11 +35,11 @@ pytest = "^7.2.2" flake8 = "^6.0.0" black = "^23.1.0" pytest-cov = "^4.0.0" -requests-mock = "^1.10.0" poetry-dynamic-versioning = "^0.21.4" pytest-httpserver = "^1.0.6" pytest-rerunfailures = "^11.1.2" pytest-asyncio = "^0.21.0" +pytest-httpx = "^0.22.0" [build-system] requires = ["poetry-core>=1.0.0", "poetry-dynamic-versioning"] From fc5ab4aba5134dd01b8fb6795652c3b1152eabbb Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 12 May 2023 16:57:33 -0400 Subject: [PATCH 013/387] asyncified more tests --- bbot/core/helpers/cloud/__init__.py | 8 +- bbot/core/helpers/cloud/base.py | 34 ++++- bbot/core/helpers/dns.py | 24 ++-- bbot/core/helpers/misc.py | 10 +- bbot/core/helpers/web.py | 20 ++- bbot/modules/bucket_aws.py | 50 ++++--- bbot/modules/bucket_azure.py | 6 +- bbot/modules/bucket_firebase.py | 8 +- bbot/modules/bucket_gcp.py | 10 +- bbot/modules/internal/excavate.py | 9 +- bbot/modules/internal/speculate.py | 14 +- bbot/modules/masscan.py | 1 - bbot/modules/report/asn.py | 36 +++--- bbot/modules/wafw00f.py | 13 +- bbot/scanner/scanner.py | 4 +- bbot/test/helpers.py | 25 ++-- bbot/test/modules_test_classes.py | 194 +++++++++++++--------------- 17 files changed, 253 insertions(+), 213 deletions(-) diff --git a/bbot/core/helpers/cloud/__init__.py b/bbot/core/helpers/cloud/__init__.py index 6c682d184a..e8fbf69e3b 100644 --- a/bbot/core/helpers/cloud/__init__.py +++ b/bbot/core/helpers/cloud/__init__.py @@ -25,9 +25,13 @@ def __init__(self, parent_helper): self.providers[provider_name] = provider setattr(self, provider_name, provider) - def excavate(self, event, http_body): + def excavate(self, *args, **kwargs): for provider in self.providers.values(): - provider.excavate(event, http_body) + provider.excavate(*args, **kwargs) + + def 
speculate(self, *args, **kwargs): + for provider in self.providers.values(): + provider.speculate(*args, **kwargs) def __iter__(self): yield from self.providers.values() diff --git a/bbot/core/helpers/cloud/base.py b/bbot/core/helpers/cloud/base.py index 0e7d26ee94..bd7b8b236a 100644 --- a/bbot/core/helpers/cloud/base.py +++ b/bbot/core/helpers/cloud/base.py @@ -41,6 +41,25 @@ def excavate(self, event, http_body): else: self.emit_event(**kwargs) + def speculate(self, event): + base_kwargs = dict(source=event, tags=self.base_tags) + + if event.type.startswith("DNS_NAME"): + # check for DNS_NAMEs that are buckets + for event_type, sigs in self.signatures.items(): + found = set() + for sig in sigs: + match = sig.match(event.data) + if match: + kwargs = dict(base_kwargs) + kwargs["event_type"] = event_type + if not event.data in found: + found.add(event.data) + if event_type == "STORAGE_BUCKET": + self.emit_bucket(match.groups(), **kwargs) + else: + self.emit_event(**kwargs) + def emit_bucket(self, match, **kwargs): bucket_name, bucket_domain = match kwargs["data"] = {"name": bucket_name, "url": f"https://{bucket_name}.{bucket_domain}"} @@ -61,11 +80,16 @@ def tag_event(self, event): # its host directly matches this cloud provider's domains if isinstance(event.host, str) and self.domain_match(event.host): event.tags.update(self.base_tags) - return - # or it has a CNAME that matches this cloud provider's domains - for rh in event.resolved_hosts: - if not self.parent_helper.is_ip(rh) and self.domain_match(rh): - event.tags.update(self.base_tags) + # tag as buckets, etc. + for event_type, sigs in self.signatures.items(): + for sig in sigs: + if sig.match(event.host): + event.add_tag(f"cloud-{event_type}") + else: + # or it has a CNAME that matches this cloud provider's domains + for rh in event.resolved_hosts: + if not self.parent_helper.is_ip(rh) and self.domain_match(rh): + event.tags.update(self.base_tags) def domain_match(self, s): for r in self.domain_regexes: diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 23fd8601f8..4f4b651199 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -219,7 +219,7 @@ async def handle_wildcard_event(self, event, children): event.add_tag(f"{rdtype.lower()}-{wildcard_tag}") # wildcard event modification (www.evilcorp.com --> _wildcard.evilcorp.com) - if not is_ip(event.host) and children and wildcard_rdtypes: + if not is_ip(event.host) and wildcard_rdtypes and children: # these are the rdtypes that successfully resolve resolved_rdtypes = set([c.upper() for c in children]) # these are the rdtypes that have wildcards @@ -228,16 +228,18 @@ async def handle_wildcard_event(self, event, children): event_is_wildcard = False if resolved_rdtypes: event_is_wildcard = all(r in wildcard_rdtypes_set for r in resolved_rdtypes) - if event_is_wildcard and event.type in ("DNS_NAME",) and not "_wildcard" in event.data.split("."): - wildcard_parent = self.parent_helper.parent_domain(event_host) - for rdtype, (_is_wildcard, _parent_domain) in wildcard_rdtypes.items(): - if _is_wildcard: - wildcard_parent = _parent_domain - break - wildcard_data = f"_wildcard.{wildcard_parent}" - if wildcard_data != event.data: - log.debug(f'Wildcard detected, changing event.data "{event.data}" --> "{wildcard_data}"') - event.data = wildcard_data + # if event_is_wildcard and event.type in ("DNS_NAME",) and not "_wildcard" in event.data.split("."): + if event_is_wildcard: + if event.type in ("DNS_NAME",) and not "_wildcard" in event.data.split("."): + 
wildcard_parent = self.parent_helper.parent_domain(event_host) + for rdtype, (_is_wildcard, _parent_domain) in wildcard_rdtypes.items(): + if _is_wildcard: + wildcard_parent = _parent_domain + break + wildcard_data = f"_wildcard.{wildcard_parent}" + if wildcard_data != event.data: + log.debug(f'Wildcard detected, changing event.data "{event.data}" --> "{wildcard_data}"') + event.data = wildcard_data async def resolve_event(self, event, minimal=False): """ diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index 243901231f..c2b39214a7 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -19,7 +19,6 @@ import traceback import subprocess as sp from pathlib import Path -from asyncio import sleep # noqa from itertools import islice from datetime import datetime from tabulate import tabulate @@ -28,6 +27,7 @@ import cloudcheck as _cloudcheck import tldextract as _tldextract from hashlib import sha1 as hashlib_sha1 +from asyncio import as_completed, create_task, sleep # noqa from urllib.parse import urlparse, quote, unquote, urlunparse # noqa F401 from .url import * # noqa F401 @@ -1056,14 +1056,6 @@ def get_traceback_details(e): return filename, lineno, funcname -def create_task(*args, **kwargs): - return asyncio.create_task(*args, **kwargs) - - -def as_completed(*args, **kwargs): - yield from asyncio.as_completed(*args, **kwargs) - - async def cancel_tasks(tasks): for task in tasks: task.cancel() diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index ba642d3554..606cca4d3f 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -44,19 +44,32 @@ class WebHelper: For making HTTP requests """ - client_options = ("auth", "params", "headers", "cookies", "timeout", "follow_redirects", "max_redirects") + client_options = ( + "auth", + "params", + "headers", + "retries", + "cookies", + "verify", + "timeout", + "follow_redirects", + "max_redirects", + ) def __init__(self, parent_helper): self.parent_helper = parent_helper + self.ssl_verify = self.parent_helper.config.get("ssl_verify", False) def AsyncClient(self, *args, **kwargs): kwargs["_bbot_scan"] = self.parent_helper.scan retries = kwargs.pop("retries", self.parent_helper.config.get("http_retries", 1)) - kwargs["transport"] = httpx.AsyncHTTPTransport(retries=retries) + kwargs["transport"] = httpx.AsyncHTTPTransport(retries=retries, verify=self.ssl_verify) return BBOTAsyncClient(*args, **kwargs) async def request(self, *args, **kwargs): raise_error = kwargs.pop("raise_error", False) + # TODO: use this + cache_for = kwargs.pop("cache_for", None) # noqa # in case of URL only, assume GET request if len(args) == 1: @@ -183,8 +196,7 @@ async def curl(self, *args, **kwargs): curl_command.append("--path-as-is") # respect global ssl verify settings - ssl_verify = self.parent_helper.config.get("ssl_verify") - if ssl_verify == False: + if self.ssl_verify == False: curl_command.append("-k") headers = kwargs.get("headers", {}) diff --git a/bbot/modules/bucket_aws.py b/bbot/modules/bucket_aws.py index 4d72ef611c..012bb6df6f 100644 --- a/bbot/modules/bucket_aws.py +++ b/bbot/modules/bucket_aws.py @@ -19,13 +19,13 @@ class bucket_aws(BaseModule): regions = [None] supports_open_check = True - def setup(self): + async def setup(self): self.buckets_tried = set() self.cloud_helper = getattr(self.helpers.cloud, self.cloud_helper_name) self.permutations = self.config.get("permutations", False) return True - def filter_event(self, event): + async def filter_event(self, event): if event.type == 
"DNS_NAME" and event.scope_distance > 0: return False, "only accepts in-scope DNS_NAMEs" if event.type == "STORAGE_BUCKET": @@ -33,13 +33,13 @@ def filter_event(self, event): return False, "bucket belongs to a different cloud provider" return True - def handle_event(self, event): + async def handle_event(self, event): if event.type == "DNS_NAME": - self.handle_dns_name(event) + await self.handle_dns_name(event) elif event.type == "STORAGE_BUCKET": - self.handle_storage_bucket(event) + await self.handle_storage_bucket(event) - def handle_dns_name(self, event): + async def handle_dns_name(self, event): buckets = set() base = event.data stem = self.helpers.domain_stem(base) @@ -47,24 +47,24 @@ def handle_dns_name(self, event): split = b.split(".") for d in self.delimiters: buckets.add(d.join(split)) - for bucket_name, url, tags in self.brute_buckets(buckets, permutations=self.permutations): + async for bucket_name, url, tags in self.brute_buckets(buckets, permutations=self.permutations): self.emit_event({"name": bucket_name, "url": url}, "STORAGE_BUCKET", source=event, tags=tags) - def handle_storage_bucket(self, event): + async def handle_storage_bucket(self, event): url = event.data["url"] bucket_name = event.data["name"] if self.supports_open_check: - description, tags = self._check_bucket_open(bucket_name, url) + description, tags = await self._check_bucket_open(bucket_name, url) if description: event_data = {"host": event.host, "url": url, "description": description} self.emit_event(event_data, "FINDING", source=event, tags=tags) - for bucket_name, url, tags in self.brute_buckets( + async for bucket_name, url, tags in self.brute_buckets( [bucket_name], permutations=self.permutations, omit_base=True ): self.emit_event({"name": bucket_name, "url": url}, "STORAGE_BUCKET", source=event, tags=tags) - def brute_buckets(self, buckets, permutations=False, omit_base=False): + async def brute_buckets(self, buckets, permutations=False, omit_base=False): buckets = set(buckets) new_buckets = set(buckets) if permutations: @@ -75,36 +75,34 @@ def brute_buckets(self, buckets, permutations=False, omit_base=False): if omit_base: new_buckets = new_buckets - buckets new_buckets = [b for b in new_buckets if self.valid_bucket_name(b)] - futures = {} + tasks = [] for base_domain in self.base_domains: for region in self.regions: for bucket_name in new_buckets: url = self.build_url(bucket_name, base_domain, region) - future = self.submit_task(self._check_bucket_exists, bucket_name, url) - futures[future] = (bucket_name, url) - for future in self.helpers.as_completed(futures): - bucket_name, url = futures[future] - existent_bucket, tags = future.result() + tasks.append(self.helpers.create_task(self._check_bucket_exists(bucket_name, url))) + for task in self.helpers.as_completed(tasks): + existent_bucket, tags, bucket_name, url = await task if existent_bucket: yield bucket_name, url, tags - def _check_bucket_exists(self, bucket_name, url): + async def _check_bucket_exists(self, bucket_name, url): self.debug(f'Checking if bucket exists: "{bucket_name}"') - return self.check_bucket_exists(bucket_name, url) + return await self.check_bucket_exists(bucket_name, url) - def check_bucket_exists(self, bucket_name, url): - response = self.helpers.request(url) + async def check_bucket_exists(self, bucket_name, url): + response = await self.helpers.request(url) tags = self.gen_tags_exists(response) status_code = getattr(response, "status_code", 404) existent_bucket = status_code != 404 - return (existent_bucket, tags) + 
return (existent_bucket, tags, bucket_name, url) - def _check_bucket_open(self, bucket_name, url): + async def _check_bucket_open(self, bucket_name, url): self.debug(f'Checking if bucket is misconfigured: "{bucket_name}"') - return self.check_bucket_open(bucket_name, url) + return await self.check_bucket_open(bucket_name, url) - def check_bucket_open(self, bucket_name, url): - response = self.helpers.request(url) + async def check_bucket_open(self, bucket_name, url): + response = await self.helpers.request(url) tags = self.gen_tags_exists(response) status_code = getattr(response, "status_code", 404) content = getattr(response, "text", "") diff --git a/bbot/modules/bucket_azure.py b/bbot/modules/bucket_azure.py index 64d20d1544..97d81fa231 100644 --- a/bbot/modules/bucket_azure.py +++ b/bbot/modules/bucket_azure.py @@ -18,9 +18,9 @@ class bucket_azure(bucket_aws): # Dirbusting is required to know whether a bucket is public supports_open_check = False - def check_bucket_exists(self, bucket_name, url): + async def check_bucket_exists(self, bucket_name, url): url = url.strip("/") + f"/{bucket_name}?restype=container" - response = self.helpers.request(url, retries=0) + response = await self.helpers.request(url, retries=0) status_code = getattr(response, "status_code", 0) existent_bucket = status_code != 0 - return (existent_bucket, set()) + return existent_bucket, set(), bucket_name, url diff --git a/bbot/modules/bucket_firebase.py b/bbot/modules/bucket_firebase.py index daab455dba..413457893a 100644 --- a/bbot/modules/bucket_firebase.py +++ b/bbot/modules/bucket_firebase.py @@ -16,13 +16,13 @@ class bucket_firebase(bucket_aws): delimiters = ("", "-") base_domains = ["firebaseio.com"] - def check_bucket_exists(self, bucket_name, url): + async def check_bucket_exists(self, bucket_name, url): url = url.strip("/") + "/.json" - return super().check_bucket_exists(bucket_name, url) + return await super().check_bucket_exists(bucket_name, url) - def check_bucket_open(self, bucket_name, url): + async def check_bucket_open(self, bucket_name, url): url = url.strip("/") + "/.json" - response = self.helpers.request(url) + response = await self.helpers.request(url) tags = self.gen_tags_exists(response) status_code = getattr(response, "status_code", 404) msg = "" diff --git a/bbot/modules/bucket_gcp.py b/bbot/modules/bucket_gcp.py index 5a2c2d7bc0..06cc588946 100644 --- a/bbot/modules/bucket_gcp.py +++ b/bbot/modules/bucket_gcp.py @@ -29,12 +29,12 @@ class bucket_gcp(bucket_aws): def build_url(self, bucket_name, base_domain, region): return f"https://www.googleapis.com/storage/v1/b/{bucket_name}" - def check_bucket_open(self, bucket_name, url): + async def check_bucket_open(self, bucket_name, url): bad_permissions = [] try: list_permissions = "&".join(["=".join(("permissions", p)) for p in self.bad_permissions]) url = f"https://www.googleapis.com/storage/v1/b/{bucket_name}/iam/testPermissions?" 
+ list_permissions - response = self.helpers.request(url) + response = await self.helpers.request(url) permissions = response.json() if isinstance(permissions, dict): bad_permissions = list(permissions.get("permissions", {})) @@ -46,8 +46,8 @@ def check_bucket_open(self, bucket_name, url): msg = f"Open permissions on storage bucket ({perms_str})" return (msg, set()) - def check_bucket_exists(self, bucket_name, url): - response = self.helpers.request(url) + async def check_bucket_exists(self, bucket_name, url): + response = await self.helpers.request(url) status_code = getattr(response, "status_code", 0) existent_bucket = status_code not in (0, 400, 404) - return existent_bucket, set() + return existent_bucket, set(), bucket_name, url diff --git a/bbot/modules/internal/excavate.py b/bbot/modules/internal/excavate.py index 6bf98a8604..25cef3d625 100644 --- a/bbot/modules/internal/excavate.py +++ b/bbot/modules/internal/excavate.py @@ -336,10 +336,11 @@ async def handle_event(self, event): if scheme in ("http", "https"): if num_redirects <= self.max_redirects: url_event = self.make_event(location, "URL_UNVERIFIED", event) - # inherit web spider distance from parent (don't increment) - source_web_spider_distance = getattr(event, "web_spider_distance", 0) - url_event.web_spider_distance = source_web_spider_distance - self.emit_event(url_event) + if url_event is not None: + # inherit web spider distance from parent (don't increment) + source_web_spider_distance = getattr(event, "web_spider_distance", 0) + url_event.web_spider_distance = source_web_spider_distance + self.emit_event(url_event) else: self.verbose(f"Exceeded max HTTP redirects ({self.max_redirects}): {location}") elif scheme: diff --git a/bbot/modules/internal/speculate.py b/bbot/modules/internal/speculate.py index 079f8076ed..b11bb60baf 100644 --- a/bbot/modules/internal/speculate.py +++ b/bbot/modules/internal/speculate.py @@ -10,7 +10,16 @@ class speculate(BaseInternalModule): in situations where e.g. a port scanner isn't enabled """ - watched_events = ["IP_RANGE", "URL", "URL_UNVERIFIED", "DNS_NAME", "IP_ADDRESS", "HTTP_RESPONSE", "STORAGE_BUCKET"] + watched_events = [ + "IP_RANGE", + "URL", + "URL_UNVERIFIED", + "DNS_NAME", + "DNS_NAME_UNRESOLVED", + "IP_ADDRESS", + "HTTP_RESPONSE", + "STORAGE_BUCKET", + ] produced_events = ["DNS_NAME", "OPEN_TCP_PORT", "IP_ADDRESS", "FINDING"] flags = ["passive"] meta = {"description": "Derive certain event types from others by common sense"} @@ -104,6 +113,9 @@ async def handle_event(self, event): quick=True, ) + # storage buckets etc. 
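
The `self.helpers.cloud.speculate(event)` call just below hands each event to every cloud provider helper, whose `speculate()` (added earlier in this patch) matches DNS names against per-provider regex signatures and derives `STORAGE_BUCKET` events. A rough sketch of that signature-matching idea, using one hypothetical S3-style signature (each real provider defines its own):

```python
import re

# hypothetical signature; real providers ship several of these
SIGNATURES = {
    "STORAGE_BUCKET": [
        re.compile(r"^(?P<name>[a-z0-9][a-z0-9._-]{1,61}[a-z0-9])\.(?P<domain>s3\.amazonaws\.com)$"),
    ],
}

def speculate_buckets(dns_name):
    # match a DNS name against each signature and derive bucket events
    derived = []
    for event_type, sigs in SIGNATURES.items():
        for sig in sigs:
            match = sig.match(dns_name)
            if match:
                name, domain = match.group("name"), match.group("domain")
                derived.append((event_type, {"name": name, "url": f"https://{name}.{domain}"}))
    return derived

print(speculate_buckets("acme-assets.s3.amazonaws.com"))
# [('STORAGE_BUCKET', {'name': 'acme-assets', 'url': 'https://acme-assets.s3.amazonaws.com'})]
```
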
+ self.helpers.cloud.speculate(event) + async def filter_event(self, event): # don't accept IP_RANGE --> IP_ADDRESS events from self if str(event.module) == "speculate": diff --git a/bbot/modules/masscan.py b/bbot/modules/masscan.py index 9e8282702f..e7f2507b6f 100644 --- a/bbot/modules/masscan.py +++ b/bbot/modules/masscan.py @@ -145,7 +145,6 @@ async def masscan(self, targets, result_callback, exclude=None, ping=False): stats_file = self.helpers.tempfile_tail(callback=self.verbose) try: with open(stats_file, "w") as stats_fh: - self.critical(f"masscan: {command}") async for line in self.helpers.run_live(command, sudo=True, stderr=stats_fh): self.process_output(line, result_callback=result_callback) finally: diff --git a/bbot/modules/report/asn.py b/bbot/modules/report/asn.py index 592ec1ff63..1844e67006 100644 --- a/bbot/modules/report/asn.py +++ b/bbot/modules/report/asn.py @@ -11,7 +11,7 @@ class asn(BaseReportModule): # because sometimes IP addresses are re-emitted with lower scope distances accept_dupes = True - def setup(self): + async def setup(self): self.asn_counts = {} self.asn_cache = {} self.sources = ["bgpview", "ripe"] @@ -24,15 +24,15 @@ def setup(self): } return True - def filter_event(self, event): + async def filter_event(self, event): if getattr(event.host, "is_private", False): return False return True - def handle_event(self, event): + async def handle_event(self, event): host = event.host if self.cache_get(host) == False: - asns = list(self.get_asn(host)) + asns = await self.get_asn(host) if not asns: self.cache_put(self.unknown_asn) else: @@ -81,7 +81,7 @@ def cache_get(self, ip): continue return ret - def get_asn(self, ip, retries=1): + async def get_asn(self, ip, retries=1): """ Takes in an IP returns a list of ASNs, e.g.: @@ -90,7 +90,7 @@ def get_asn(self, ip, retries=1): for attempt in range(retries + 1): for i, source in enumerate(list(self.sources)): get_asn_fn = getattr(self, f"get_asn_{source}") - res = get_asn_fn(ip) + res = await get_asn_fn(ip) if res == False: # demote the current source to lowest priority since it just failed self.sources.append(self.sources.pop(i)) @@ -100,9 +100,9 @@ def get_asn(self, ip, retries=1): self.warning(f"Error retrieving ASN via for {ip}") return [] - def get_asn_ripe(self, ip): + async def get_asn_ripe(self, ip): url = f"https://stat.ripe.net/data/network-info/data.json?resource={ip}" - response = self.get_url(url, "ASN") + response = await self.get_url(url, "ASN") asns = [] if response == False: return False @@ -116,19 +116,19 @@ def get_asn_ripe(self, ip): if not asn_numbers: asn_numbers = [] for number in asn_numbers: - asn = self.get_asn_metadata_ripe(number) + asn = await self.get_asn_metadata_ripe(number) asn["subnet"] = prefix asns.append(asn) return asns - def get_asn_metadata_ripe(self, asn_number): + async def get_asn_metadata_ripe(self, asn_number): metadata_keys = { "name": ["ASName", "OrgId"], "description": ["OrgName", "OrgTechName", "RTechName"], "country": ["Country"], } url = f"https://stat.ripe.net/data/whois/data.json?resource={asn_number}" - response = self.get_url(url, "ASN Metadata", cache=True) + response = await self.get_url(url, "ASN Metadata", cache=True) if response == False: return False data = response.get("data", {}) @@ -155,9 +155,9 @@ def get_asn_metadata_ripe(self, asn_number): asn["asn"] = str(asn_number) return asn - def get_asn_bgpview(self, ip): + async def get_asn_bgpview(self, ip): url = f"https://api.bgpview.io/ip/{ip}" - data = self.get_url(url, "ASN") + data = await 
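
The retry loop in `get_asn()` above implements a simple failover policy: a source that returns `False` is demoted to the back of `self.sources`, so healthier sources are tried first on later lookups. A standalone sketch of the same idea (the `fetch_*` coroutines are placeholders, not the module's real RIPE/BGPView clients):

```python
import asyncio

async def fetch_a(target):
    return False  # simulate a failing source

async def fetch_b(target):
    return {"asn": 15169, "target": target}

async def query_with_failover(sources, fetchers, target, retries=1):
    # try sources in priority order; a failing source is demoted to the
    # back of the list so it is deprioritized on subsequent lookups
    for _ in range(retries + 1):
        for source in list(sources):
            result = await fetchers[source](target)
            if result is False:
                sources.remove(source)
                sources.append(source)
                continue
            return result
    return None

sources = ["a", "b"]
print(asyncio.run(query_with_failover(sources, {"a": fetch_a, "b": fetch_b}, "8.8.8.8")))
print(sources)  # ['b', 'a'] -- the failing source is now last
```
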
self.get_url(url, "ASN") asns = [] asns_tried = set() if data == False: @@ -175,7 +175,7 @@ def get_asn_bgpview(self, ip): country = details.get("country_code") or prefix.get("country_code") or "" emails = [] if not asn in asns_tried: - emails = self.get_emails_bgpview(asn) + emails = await self.get_emails_bgpview(asn) if emails == False: return False asns_tried.add(asn) @@ -186,10 +186,10 @@ def get_asn_bgpview(self, ip): self.debug(f'No results for "{ip}"') return asns - def get_emails_bgpview(self, asn): + async def get_emails_bgpview(self, asn): contacts = [] url = f"https://api.bgpview.io/asn/{asn}" - data = self.get_url(url, "ASN metadata", cache=True) + data = await self.get_url(url, "ASN metadata", cache=True) if data == False: return False data = data.get("data", {}) @@ -201,11 +201,11 @@ def get_emails_bgpview(self, asn): contacts = [l.strip().lower() for l in email_contacts + abuse_contacts] return list(set(contacts)) - def get_url(self, url, data_type, cache=False): + async def get_url(self, url, data_type, cache=False): kwargs = {} if cache: kwargs["cache_for"] = 60 * 60 * 24 - r = self.helpers.request(url, **kwargs) + r = await self.helpers.request(url, **kwargs) data = {} try: j = r.json() diff --git a/bbot/modules/wafw00f.py b/bbot/modules/wafw00f.py index 29a0f0c1f2..788e9d6254 100644 --- a/bbot/modules/wafw00f.py +++ b/bbot/modules/wafw00f.py @@ -19,11 +19,11 @@ class wafw00f(BaseModule): in_scope_only = True - def setup(self): + async def setup(self): self.scanned_hosts = set() return True - def handle_event(self, event): + async def handle_event(self, event): parsed_host = event.parsed host = f"{parsed_host.scheme}://{parsed_host.netloc}/" host_hash = hash(host) @@ -33,14 +33,15 @@ def handle_event(self, event): else: self.scanned_hosts.add(host_hash) - WW = wafw00f_main.WAFW00F(host) - waf_detections = WW.identwaf() + WW = await self.scan.run_in_executor(wafw00f_main.WAFW00F, host) + waf_detections = await self.scan.run_in_executor(WW.identwaf) if waf_detections: - for waf in WW.identwaf(): + for waf in waf_detections: self.emit_event({"host": host, "WAF": waf}, "WAF", source=event) else: if self.config.get("generic_detect") == True: - if WW.genericdetect(): + generic = await self.scan.run_in_executor(WW.genericdetect) + if generic: self.emit_event( {"host": host, "WAF": "generic detection", "info": WW.knowledge["generic"]["reason"]}, "WAF", diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index c43f702a15..d66330819d 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -641,7 +641,6 @@ def _load_modules(self, modules): async def _status_ticker(self, interval=15): async with self.acatch(): - # while not self.stopped: while 1: await asyncio.sleep(interval) await self.manager.modules_status(_log=True) @@ -672,6 +671,9 @@ async def acatch(self, context="scan", finally_callback=None): except BaseException as e: self._handle_exception(e, context=context) + def run_in_executor(self, *args, **kwargs): + return self._loop.run_in_executor(None, *args, **kwargs) + def _handle_exception(self, e, context="scan", finally_callback=None): if callable(context): context = f"{context.__qualname__}()" diff --git a/bbot/test/helpers.py b/bbot/test/helpers.py index fd457795b8..0cfafafc99 100644 --- a/bbot/test/helpers.py +++ b/bbot/test/helpers.py @@ -18,7 +18,8 @@ def __init__(self, request, **kwargs): self.bbot_scanner = request.getfixturevalue("bbot_scanner") self.config = OmegaConf.merge(self.bbot_config, OmegaConf.create(self.config_overrides)) modules = 
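
The new `run_in_executor()` on the scanner is a thin wrapper around `loop.run_in_executor(None, ...)`; it lets synchronous, blocking libraries (wafw00f's `identwaf()` and `genericdetect()` here) run on the default thread pool without stalling the event loop. A minimal sketch, with a placeholder standing in for the real library call:

```python
import asyncio
import time

def fingerprint_waf(host):
    # stand-in for a synchronous third-party call (e.g. WAF detection)
    time.sleep(0.1)
    return f"no WAF detected on {host}"

async def main():
    loop = asyncio.get_running_loop()
    # None selects the default ThreadPoolExecutor; the event loop keeps
    # servicing other coroutines while the blocking call runs in a thread
    result = await loop.run_in_executor(None, fingerprint_waf, "example.com")
    print(result)

asyncio.run(main())
```
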
[self.name] + self.additional_modules - self.scan = self.bbot_scanner( + self.scans = [] + self.scan = self.add_scan( *self.targets, modules=modules, name=f"{self.name}_test", @@ -27,19 +28,25 @@ def __init__(self, request, **kwargs): blacklist=self.blacklist, ) - def patch_scan(self, scan): - return + def add_scan(self, *args, **kwargs): + scan = self.bbot_scanner(*args, **kwargs) + self.scans.append(scan) + return scan - def setup(self): + def setup(self, scan): pass async def run(self): - await self.scan.prep() - self.setup() - self.patch_scan(self.scan) + for i, scan in enumerate(self.scans): + if i == 0: + self.scan = scan + await scan.prep() + self.setup(scan) + self._after_scan_prep() - events = [e async for e in self.scan.start()] - self.check_events(events) + for i, scan in enumerate(self.scans): + events = [e async for e in scan.start()] + self.check_events(events) @abstractmethod def check_events(self, events): diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py index f763318bca..11a99fe914 100644 --- a/bbot/test/modules_test_classes.py +++ b/bbot/test/modules_test_classes.py @@ -79,7 +79,7 @@ class Excavate(HttpxMockHelper): config_overrides = {"web_spider_distance": 1, "web_spider_depth": 1} - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 404 def mock_args(self): @@ -172,7 +172,7 @@ class Excavate_relativelinks(HttpxMockHelper): targets = ["http://127.0.0.1:8888/", "test.notreal", "http://127.0.0.1:8888/subdir/"] config_overrides = {"web_spider_distance": 1, "web_spider_depth": 1} - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 404 def mock_args(self): @@ -284,7 +284,7 @@ def check_events(self, events): class Anubisdb(RequestMockHelper): - def setup(self): + def setup(self, scan): self.module.abort_if = lambda e: False def mock_args(self): @@ -512,7 +512,7 @@ class Paramminer_headers(HttpxMockHelper): config_overrides = {"modules": {"paramminer_headers": {"wordlist": tempwordlist(["junkword1", "tracestate"])}}} - def setup(self): + def setup(self, scan): from bbot.core.helpers import helper self.module.rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" @@ -559,7 +559,7 @@ class Paramminer_getparams(HttpxMockHelper): config_overrides = {"modules": {"paramminer_getparams": {"wordlist": tempwordlist(["canary", "id"])}}} - def setup(self): + def setup(self, scan): from bbot.core.helpers import helper self.module.rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" @@ -606,7 +606,7 @@ class Paramminer_cookies(HttpxMockHelper): config_overrides = {"modules": {"paramminer_cookies": {"wordlist": tempwordlist(["junkcookie", "admincookie"])}}} - def setup(self): + def setup(self, scan): from bbot.core.helpers import helper self.module.rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" @@ -738,28 +738,20 @@ class Masscan(MockHelper): ports = range = 9.8.7.6""" - def _after_scan_prep(self): - self.scan.modules["masscan"].masscan_config = self.masscan_config - - async def setup_scan_2(): - config2 = OmegaConf.merge(self.config, OmegaConf.create(self.config_overrides_2)) - self.scan2 = self.bbot_scanner( - *self.targets, - modules=[self.name] + self.additional_modules, - name=f"{self.name}_test", - config=config2, - whitelist=self.whitelist, - blacklist=self.blacklist, - ) - self.patch_scan(self.scan2) - await self.scan2.prep() - self.scan2.modules["masscan"].masscan_config = self.masscan_config - - self.setup_scan_2 = setup_scan_2 + def __init__(self, request): + 
super().__init__(request) + config2 = OmegaConf.merge(self.config, OmegaConf.create(self.config_overrides_2)) + self.add_scan( + *self.targets, + modules=[self.name] + self.additional_modules, + name=f"{self.name}_test", + config=config2, + whitelist=self.whitelist, + blacklist=self.blacklist, + ) self.masscan_run = False async def run_masscan(self, command, *args, **kwargs): - log.critical(f"patched: {command}") if "masscan" in command[:2]: for l in self.masscan_output.splitlines(): yield l @@ -768,26 +760,30 @@ async def run_masscan(self, command, *args, **kwargs): async for l in self.scan.helpers.run_live(command, *args, **kwargs): yield l - def patch_scan(self, scan): + def setup(self, scan): scan.helpers.run_live = self.run_masscan + scan.modules["masscan"].masscan_config = self.masscan_config async def run(self): - await super().run() - assert self.masscan_run == True, "masscan didn't run when it was supposed to" - await self.setup_scan_2() - self.masscan_run = False - events = [e async for e in self.scan2.start()] - self.check_events(events) - assert self.masscan_run == False, "masscan ran when it wasn't supposed to" + for i, scan in enumerate(self.scans): + await scan.prep() + self.setup(scan) + events = [e async for e in scan.start()] + self.check_events(events) + if i == 0: + assert self.masscan_run == True, "masscan didn't run when it was supposed to" + self.masscan_run = False + else: + assert self.masscan_run == False, "masscan ran when it wasn't supposed to" def check_events(self, events): assert any(e.type == "IP_ADDRESS" and e.data == "8.8.8.8" for e in events), "No IP_ADDRESS emitted" assert any(e.type == "OPEN_TCP_PORT" and e.data == "8.8.8.8:443" for e in events), "No OPEN_TCP_PORT emitted" -class Buckets(HttpxMockHelper, RequestMockHelper): +class Buckets(HttpxMockHelper): providers = ["aws", "gcp", "azure", "digitalocean", "firebase"] - # providers = ["aws"] + # providers = ["azure"] additional_modules = ["excavate", "speculate", "httpx"] + [f"bucket_{p}" for p in providers] config_overrides = { "modules": { @@ -817,7 +813,11 @@ class Buckets(HttpxMockHelper, RequestMockHelper): ] }""" - def patch_scan(self, scan): + def __init__(self, request, **kwargs): + self.httpx_mock = request.getfixturevalue("httpx_mock") + super().__init__(request, **kwargs) + + def setup(self, scan): scan.helpers.word_cloud.mutations = lambda b, cloud=False: [ (b, "dev"), ] @@ -839,56 +839,43 @@ def mock_args(self): """ self.set_expect_requests(expect_args=expect_args, respond_args={"response_data": body}) - def mock_args_requests(self): - self.m.register_uri("GET", requests_mock.ANY, text="", status_code=404) - self.register_uri( - f"https://{self.random_bucket_name_2}.s3-ap-southeast-2.amazonaws.com/", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}.s3-ap-southeast-2.amazonaws.com", text=self.open_aws_bucket, ) - self.register_uri( - f"https://{self.random_bucket_name_2}.fra1.digitaloceanspaces.com/", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}.fra1.digitaloceanspaces.com", text=self.open_digitalocean_bucket, ) - self.register_uri( - f"https://{self.random_bucket_name_2}.blob.core.windows.net/{self.random_bucket_name_2}?restype=container", - text="", - ) - self.register_uri( - f"https://www.googleapis.com/storage/v1/b/{self.random_bucket_name_2}/iam/testPermissions?permissions=storage.buckets.setIamPolicy&permissions=storage.objects.list&permissions=storage.objects.get&permissions=storage.objects.create", + 
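
These test changes swap `requests_mock` for an `httpx_mock` fixture that intercepts requests at the httpx transport layer; judging by the `add_response(url=..., text=..., status_code=...)` signature this is the pytest-httpx plugin, though that is an assumption. A tiny self-contained test in the same style (the bucket URL is made up):

```python
import httpx

# assumes the pytest-httpx plugin is installed; it supplies the httpx_mock fixture
def test_nonexistent_bucket(httpx_mock):
    httpx_mock.add_response(
        url="https://somebucket.s3.amazonaws.com",
        status_code=404,
        text="",
    )
    response = httpx.get("https://somebucket.s3.amazonaws.com")
    assert response.status_code == 404
```
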
self.httpx_mock.add_response( + url=f"https://www.googleapis.com/storage/v1/b/{self.random_bucket_name_2}/iam/testPermissions?permissions=storage.buckets.setIamPolicy&permissions=storage.objects.list&permissions=storage.objects.get&permissions=storage.objects.create", text=self.open_gcp_bucket, ) - self.register_uri( - f"https://{self.random_bucket_name_2}.firebaseio.com/.json", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}.firebaseio.com/.json", text="", ) - - self.register_uri( - f"https://{self.random_bucket_name_2}-dev.s3.amazonaws.com/", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}-dev.s3.amazonaws.com", text="", ) - self.register_uri( - f"https://{self.random_bucket_name_2}-dev.fra1.digitaloceanspaces.com/", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}-dev.fra1.digitaloceanspaces.com", text="", ) - self.register_uri( - f"https://{self.random_bucket_name_2}-dev.blob.core.windows.net/{self.random_bucket_name_2}-dev?restype=container", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}-dev.blob.core.windows.net/{self.random_bucket_name_2}-dev?restype=container", text="", ) - self.register_uri( - f"https://www.googleapis.com/storage/v1/b/{self.random_bucket_name_2}-dev", + self.httpx_mock.add_response( + url=f"https://www.googleapis.com/storage/v1/b/{self.random_bucket_name_2}-dev", text="", ) - self.register_uri( - f"https://{self.random_bucket_name_2}-dev.firebaseio.com/.json", + self.httpx_mock.add_response( + url=f"https://{self.random_bucket_name_2}-dev.firebaseio.com/.json", text="", ) - - def run(self): - with requests_mock.Mocker() as m: - self.m = m - self.mock_args_requests() - events = list(self.scan.start()) - self.check_events(events) + self.httpx_mock.add_response(url=re.compile(".*"), text="", status_code=404) def check_events(self, events): for provider in self.providers: @@ -906,6 +893,7 @@ def check_events(self, events): url = e.data.get("url", "") assert self.random_bucket_name_2 in url assert not self.random_bucket_name_1 in url + assert not f"{self.random_bucket_name_2}-dev" in url # make sure bucket mutations were found assert any( e.type == "STORAGE_BUCKET" @@ -915,7 +903,7 @@ def check_events(self, events): ), f'bucket (dev mutation) not found for provider "{provider}"' -class ASN(RequestMockHelper): +class ASN(HttpxMockHelper): targets = ["8.8.8.8"] response_get_asn_ripe = { "messages": [], @@ -1115,39 +1103,41 @@ class ASN(RequestMockHelper): } config_overrides = {"scope_report_distance": 2} - def __init__(self, config, bbot_scanner, *args): - super().__init__(config, bbot_scanner, *args) - self.scan2 = bbot_scanner( + def __init__(self, request, **kwargs): + super().__init__(request, **kwargs) + self.scan2 = self.add_scan( *self.targets, modules=[self.name] + self.additional_modules, name=f"{self.name}_test_2", config=self.config, ) - self.scan2.prep() - self.module2 = self.scan2.modules[self.name] def mock_args(self): - pass + self.httpx_mock.add_response( + url="https://stat.ripe.net/data/network-info/data.json?resource=8.8.8.8", + text=json.dumps(self.response_get_asn_ripe), + ) + self.httpx_mock.add_response( + url="https://stat.ripe.net/data/whois/data.json?resource=15169", + text=json.dumps(self.response_get_asn_metadata_ripe), + ) + self.httpx_mock.add_response( + url="https://api.bgpview.io/ip/8.8.8.8", text=json.dumps(self.response_get_asn_bgpview) + ) + self.httpx_mock.add_response( + url="https://api.bgpview.io/asn/15169", 
text=json.dumps(self.response_get_emails_bgpview) + ) - def run(self): - with requests_mock.Mocker() as m: - self.m = m - self.register_uri( - "https://stat.ripe.net/data/network-info/data.json?resource=8.8.8.8", - text=json.dumps(self.response_get_asn_ripe), - ) - self.register_uri( - "https://stat.ripe.net/data/whois/data.json?resource=15169", - text=json.dumps(self.response_get_asn_metadata_ripe), - ) - self.register_uri("https://api.bgpview.io/ip/8.8.8.8", text=json.dumps(self.response_get_asn_bgpview)) - self.register_uri("https://api.bgpview.io/asn/15169", text=json.dumps(self.response_get_emails_bgpview)) - self.module.sources = ["bgpview", "ripe"] - events = list(e for e in self.scan.start() if e.module == self.module) - assert self.check_events(events) - self.module2.sources = ["ripe", "bgpview"] - events2 = list(e for e in self.scan2.start() if e.module == self.module2) - assert self.check_events(events2) + async def run(self): + await self.scan.prep() + self.module.sources = ["bgpview", "ripe"] + events = [e async for e in self.scan.start() if e.module == self.module] + assert self.check_events(events) + await self.scan2.prep() + self.module2 = self.scan2.modules["asn"] + self.module2.sources = ["ripe", "bgpview"] + events2 = [e async for e in self.scan2.start() if e.module == self.module2] + assert self.check_events(events2) def check_events(self, events): asn = False @@ -1169,11 +1159,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "WAF": - if "LiteSpeed" in e.data["WAF"]: - return True - return False + assert any(e.type == "WAF" and "LiteSpeed" in e.data["WAF"] for e in events) class Ffuf(HttpxMockHelper): @@ -1310,7 +1296,7 @@ class Ffuf_shortnames(HttpxMockHelper): } } - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 404 seed_events = [] @@ -1509,7 +1495,7 @@ class Iis_shortnames(HttpxMockHelper): config_overrides = {"modules": {"iis_shortnames": {"detect_only": False}}} - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 404 def mock_args(self): @@ -1792,7 +1778,7 @@ class Bypass403(HttpxMockHelper): targets = ["http://127.0.0.1:8888/test"] - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 403 def mock_args(self): @@ -1812,7 +1798,7 @@ class Bypass403_aspnetcookieless(HttpxMockHelper): targets = ["http://127.0.0.1:8888/admin.aspx"] - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 403 def mock_args(self): @@ -1832,7 +1818,7 @@ class Bypass403_waf(HttpxMockHelper): targets = ["http://127.0.0.1:8888/test"] - def setup(self): + def setup(self, scan): self.bbot_httpserver.no_handler_status_code = 403 def mock_args(self): From 0a37a8e0095d0e0b353c57726333334e32bfb2fb Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 12 May 2023 16:59:48 -0400 Subject: [PATCH 014/387] better error handling in speculate --- bbot/modules/internal/speculate.py | 9 +++++---- 1 file changed, 5 insertions(+), 4 deletions(-) diff --git a/bbot/modules/internal/speculate.py b/bbot/modules/internal/speculate.py index b11bb60baf..1e00d1bdb7 100644 --- a/bbot/modules/internal/speculate.py +++ b/bbot/modules/internal/speculate.py @@ -90,10 +90,11 @@ async def handle_event(self, event): url_parents = self.helpers.url_parents(event.data) for up in url_parents: url_event = self.make_event(f"{up}/", "URL_UNVERIFIED", 
source=event) - # inherit web spider distance from parent (don't increment) - source_web_spider_distance = getattr(event, "web_spider_distance", 0) - url_event.web_spider_distance = source_web_spider_distance - self.emit_event(url_event) + if url_event is not None: + # inherit web spider distance from parent (don't increment) + source_web_spider_distance = getattr(event, "web_spider_distance", 0) + url_event.web_spider_distance = source_web_spider_distance + self.emit_event(url_event) # from hosts if emit_open_ports: From 6286cc30b941ee5c85f0c6f526fe5a06eaa6b9d8 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 12 May 2023 16:59:54 -0400 Subject: [PATCH 015/387] better error handling in speculate --- bbot/core/helpers/web.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index 606cca4d3f..cd351b8dc9 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -69,7 +69,7 @@ def AsyncClient(self, *args, **kwargs): async def request(self, *args, **kwargs): raise_error = kwargs.pop("raise_error", False) # TODO: use this - cache_for = kwargs.pop("cache_for", None) # noqa + cache_for = kwargs.pop("cache_for", None) # noqa # in case of URL only, assume GET request if len(args) == 1: From 65e8263f5b136dd7b589d54ff07daa123ae5d761 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 12 May 2023 17:07:39 -0400 Subject: [PATCH 016/387] update readme --- README.md | 36 ++++++++++++++++++++---------------- 1 file changed, 20 insertions(+), 16 deletions(-) diff --git a/README.md b/README.md index 9b9c96e3eb..9b9e05f446 100644 --- a/README.md +++ b/README.md @@ -149,17 +149,26 @@ bbot -f subdomain-enum -t evilcorp.com --output-modules neo4j # Usage ~~~ $ bbot --help -usage: bbot [-h] [--help-all] [-t TARGET [TARGET ...]] [-w WHITELIST [WHITELIST ...]] [-b BLACKLIST [BLACKLIST ...]] [--strict-scope] [-n SCAN_NAME] [-m MODULE [MODULE ...]] [-l] [-em MODULE [MODULE ...]] - [-f FLAG [FLAG ...]] [-rf FLAG [FLAG ...]] [-ef FLAG [FLAG ...]] [-om MODULE [MODULE ...]] [-o DIR] [-c [CONFIG ...]] [--allow-deadly] [-v] [-d] [-s] [--force] [-y] [--dry-run] [--current-config] - [--save-wordcloud FILE] [--load-wordcloud FILE] [--no-deps | --force-deps | --retry-deps | --ignore-failed-deps | --install-all-deps] [-a] [--version] +usage: bbot [-h] [--help-all] [-t TARGET [TARGET ...]] [-w WHITELIST [WHITELIST ...]] [-b BLACKLIST [BLACKLIST ...]] [--strict-scope] [-m MODULE [MODULE ...]] [-l] [-em MODULE [MODULE ...]] [-f FLAG [FLAG ...]] [-rf FLAG [FLAG ...]] [-ef FLAG [FLAG ...]] + [-om MODULE [MODULE ...]] [--allow-deadly] [-n SCAN_NAME] [-o DIR] [-c [CONFIG ...]] [-v] [-d] [-s] [--force] [-y] [--dry-run] [--current-config] [--save-wordcloud FILE] [--load-wordcloud FILE] + [--no-deps | --force-deps | --retry-deps | --ignore-failed-deps | --install-all-deps] [-a] [--version] Bighuge BLS OSINT Tool options: -h, --help show this help message and exit --help-all Display full help including module config options - -n SCAN_NAME, --name SCAN_NAME - Name of scan (default: random) + +Target: + -t TARGET [TARGET ...], --targets TARGET [TARGET ...] + Targets to seed the scan + -w WHITELIST [WHITELIST ...], --whitelist WHITELIST [WHITELIST ...] + What's considered in-scope (by default it's the same as --targets) + -b BLACKLIST [BLACKLIST ...], --blacklist BLACKLIST [BLACKLIST ...] 
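
For context on the speculate hunk above: `url_parents()` walks a URL upward one path segment at a time so each parent directory can be emitted as its own `URL_UNVERIFIED`. A hypothetical reimplementation of the helper's apparent behavior (the real helper may differ in details such as trailing slashes):

```python
from urllib.parse import urlparse, urlunparse

def url_parents(url):
    # return each parent directory of a URL, deepest first
    parsed = urlparse(url)
    path = parsed.path.rstrip("/")
    parents = []
    while "/" in path and path:
        path = path.rsplit("/", 1)[0]
        parents.append(urlunparse(parsed._replace(path=path or "/", query="", fragment="")))
    return parents

print(url_parents("https://example.com/a/b/c?x=1"))
# ['https://example.com/a/b', 'https://example.com/a', 'https://example.com/']
```
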
+ Don't touch these things + --strict-scope Don't consider subdomains of target/whitelist to be in-scope + +Modules: -m MODULE [MODULE ...], --modules MODULE [MODULE ...] Modules to enable. Choices: affiliates,anubisdb,asn,azure_tenant,badsecrets,bevigil,binaryedge,bucket_aws,bucket_azure,bucket_digitalocean,bucket_firebase,bucket_gcp,builtwith,bypass403,c99,censys,certspotter,crobat,crt,dnscommonsrv,dnsdumpster,dnszonetransfer,emailformat,ffuf,ffuf_shortnames,fingerprintx,fullhunt,generic_ssrf,github,gowitness,hackertarget,host_header,httpx,hunt,hunterio,iis_shortnames,ipneighbor,ipstack,leakix,masscan,massdns,naabu,ntlm,nuclei,otx,paramminer_cookies,paramminer_getparams,paramminer_headers,passivetotal,pgp,rapiddns,riddler,robots,secretsdb,securitytrails,shodan_dns,skymem,smuggler,social,sslcert,subdomain_hijack,sublist3r,telerik,threatminer,url_manipulation,urlscan,vhost,viewdns,virustotal,wafw00f,wappalyzer,wayback,zoomeye -l, --list-modules List available modules. @@ -168,15 +177,19 @@ options: -f FLAG [FLAG ...], --flags FLAG [FLAG ...] Enable modules by flag. Choices: active,affiliates,aggressive,cloud-enum,deadly,email-enum,iis-shortnames,passive,portscan,report,safe,service-enum,slow,social-enum,subdomain-enum,subdomain-hijack,web-basic,web-paramminer,web-screenshots,web-thorough -rf FLAG [FLAG ...], --require-flags FLAG [FLAG ...] - Disable modules that don't have these flags (e.g. -rf passive) + Only enable modules with these flags (e.g. -rf passive) -ef FLAG [FLAG ...], --exclude-flags FLAG [FLAG ...] Disable modules with these flags. (e.g. -ef aggressive) -om MODULE [MODULE ...], --output-modules MODULE [MODULE ...] Output module(s). Choices: asset_inventory,csv,http,human,json,neo4j,python,web_report,websocket + --allow-deadly Enable the use of highly aggressive modules + +Scan: + -n SCAN_NAME, --name SCAN_NAME + Name of scan (default: random) -o DIR, --output-dir DIR -c [CONFIG ...], --config [CONFIG ...] custom config file, or configuration options in key=value format: 'modules.shodan.api_key=1234' - --allow-deadly Enable the use of highly aggressive modules -v, --verbose Be more verbose -d, --debug Enable debugging -s, --silent Be quiet @@ -185,15 +198,6 @@ options: --dry-run Abort before executing scan --current-config Show current config in YAML format -Target: - -t TARGET [TARGET ...], --targets TARGET [TARGET ...] - Targets to seed the scan - -w WHITELIST [WHITELIST ...], --whitelist WHITELIST [WHITELIST ...] - What's considered in-scope (by default it's the same as --targets) - -b BLACKLIST [BLACKLIST ...], --blacklist BLACKLIST [BLACKLIST ...] 
- Don't touch these things - --strict-scope Don't consider subdomains of target/whitelist to be in-scope - Word cloud: Save/load wordlist of common words gathered during a scan From 245e6a425281949911b0feac638989203d1e88c4 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sat, 13 May 2023 21:41:28 -0400 Subject: [PATCH 017/387] all module tests passing --- bbot/core/helpers/misc.py | 8 +- bbot/core/helpers/web.py | 5 + bbot/modules/bucket_gcp.py | 2 +- bbot/modules/bypass403.py | 6 +- bbot/modules/deadly/ffuf.py | 33 +++-- bbot/modules/deadly/nuclei.py | 22 ++-- bbot/modules/deadly/vhost.py | 57 +++------ bbot/modules/ffuf_shortnames.py | 32 ++--- bbot/modules/hunt.py | 2 +- bbot/modules/iis_shortnames.py | 54 ++++---- bbot/modules/social.py | 4 +- bbot/modules/url_manipulation.py | 6 +- bbot/scanner/manager.py | 1 + bbot/test/modules_test_classes.py | 142 +++++++-------------- bbot/test/test_step_1/test_modules_full.py | 40 +++--- bbot/test/test_step_2/test_threadpool.py | 17 --- 16 files changed, 180 insertions(+), 251 deletions(-) delete mode 100644 bbot/test/test_step_2/test_threadpool.py diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index c2b39214a7..7a6391a768 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -45,6 +45,7 @@ def is_domain(d): "evilcorp.co.uk" --> True "www.evilcorp.co.uk" --> False """ + d, _ = split_host_port(d) extracted = tldextract(d) if extracted.domain and not extracted.subdomain: return True @@ -56,6 +57,7 @@ def is_subdomain(d): "www.evilcorp.co.uk" --> True "evilcorp.co.uk" --> False """ + d, _ = split_host_port(d) extracted = tldextract(d) if extracted.domain and extracted.subdomain: return True @@ -126,8 +128,9 @@ def parent_domain(d): "www.evilcorp.co.uk" --> "evilcorp.co.uk" "evilcorp.co.uk" --> "evilcorp.co.uk" """ + host, port = split_host_port(d) if is_subdomain(d): - return ".".join(str(d).split(".")[1:]) + return make_netloc(".".join(str(host).split(".")[1:]), port) return d @@ -534,10 +537,13 @@ def gen_numbers(n, padding=2): def make_netloc(host, port): """ + ("192.168.1.1", None) --> "192.168.1.1" ("192.168.1.1", 443) --> "192.168.1.1:443" ("evilcorp.com", 80) --> "evilcorp.com:80" ("dead::beef", 443) --> "[dead::beef]:443" """ + if port is None: + return host if is_ip(host, version=6): host = f"[{host}]" return f"{host}:{port}" diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index cd351b8dc9..6ed9fe8427 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -71,6 +71,11 @@ async def request(self, *args, **kwargs): # TODO: use this cache_for = kwargs.pop("cache_for", None) # noqa + # allow vs follow, httpx why?? 
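
Two small helpers in the surrounding hunks lend themselves to quick sketches: the requests-to-httpx keyword shim that follows this comment, and `make_netloc()` from the misc.py hunk above, whose docstring examples show IPv6 bracketing. A sketch of both under those documented behaviors (not the exact helpers):

```python
import ipaddress

def normalize_redirect_kwargs(kwargs):
    # accept requests-style allow_redirects but speak httpx's follow_redirects
    allow_redirects = kwargs.pop("allow_redirects", None)
    if allow_redirects is not None and "follow_redirects" not in kwargs:
        kwargs["follow_redirects"] = allow_redirects
    return kwargs

def make_netloc(host, port=None):
    # rejoin host and optional port, bracketing IPv6 literals
    if port is None:
        return host
    try:
        if ipaddress.ip_address(host).version == 6:
            host = f"[{host}]"
    except ValueError:
        pass  # hostname, not an IP literal
    return f"{host}:{port}"

assert normalize_redirect_kwargs({"allow_redirects": False}) == {"follow_redirects": False}
assert make_netloc("192.168.1.1", None) == "192.168.1.1"
assert make_netloc("dead::beef", 443) == "[dead::beef]:443"
assert make_netloc("evilcorp.com", 80) == "evilcorp.com:80"
```
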
+ allow_redirects = kwargs.pop("allow_redirects", None) + if allow_redirects is not None and "follow_redirects" not in kwargs: + kwargs["follow_redirects"] = allow_redirects + # in case of URL only, assume GET request if len(args) == 1: kwargs["url"] = args[0] diff --git a/bbot/modules/bucket_gcp.py b/bbot/modules/bucket_gcp.py index 06cc588946..b7e96d5b1d 100644 --- a/bbot/modules/bucket_gcp.py +++ b/bbot/modules/bucket_gcp.py @@ -39,7 +39,7 @@ async def check_bucket_open(self, bucket_name, url): if isinstance(permissions, dict): bad_permissions = list(permissions.get("permissions", {})) except Exception as e: - self.warning(f'Failed to enumerate permissions for bucket "{bucket_name}": {e}') + self.info(f'Failed to enumerate permissions for bucket "{bucket_name}": {e}') msg = "" if bad_permissions: perms_str = ",".join(bad_permissions) diff --git a/bbot/modules/bypass403.py b/bbot/modules/bypass403.py index b1205cec33..d798c03441 100644 --- a/bbot/modules/bypass403.py +++ b/bbot/modules/bypass403.py @@ -81,7 +81,7 @@ class bypass403(BaseModule): meta = {"description": "Check 403 pages for common bypasses"} in_scope_only = True - def handle_event(self, event): + async def handle_event(self, event): try: compare_helper = self.helpers.http_compare(event.data, allow_redirects=True) except HttpCompareError as e: @@ -94,7 +94,7 @@ def handle_event(self, event): headers = dict(sig[2]) else: headers = None - match, reasons, reflection, subject_response = compare_helper.compare( + match, reasons, reflection, subject_response = await compare_helper.compare( sig[1], headers=headers, method=sig[0], allow_redirects=True ) @@ -121,7 +121,7 @@ def handle_event(self, event): else: self.debug(f"Status code changed to {str(subject_response.status_code)}, ignoring") - def filter_event(self, event): + async def filter_event(self, event): if ("status-403" in event.tags) or ("status-401" in event.tags): return True return False diff --git a/bbot/modules/deadly/ffuf.py b/bbot/modules/deadly/ffuf.py index a034261490..709b1d1be6 100644 --- a/bbot/modules/deadly/ffuf.py +++ b/bbot/modules/deadly/ffuf.py @@ -46,20 +46,18 @@ class ffuf(BaseModule): in_scope_only = True - def setup(self): + async def setup(self): self.canary = "".join(random.choice(string.ascii_lowercase) for i in range(10)) wordlist_url = self.config.get("wordlist", "") self.debug(f"Using wordlist [{wordlist_url}]") - self.wordlist = self.helpers.wordlist(wordlist_url) - f = open(self.wordlist, "r") - self.wordlist_lines = f.readlines() - f.close() + self.wordlist = await self.helpers.wordlist(wordlist_url) + self.wordlist_lines = list(self.helpers.read_file(self.wordlist)) self.tempfile, tempfile_len = self.generate_templist() self.verbose(f"Generated dynamic wordlist with length [{str(tempfile_len)}]") - self.extensions = self.config.get("extensions") + self.extensions = self.config.get("extensions", "") return True - def handle_event(self, event): + async def handle_event(self, event): if self.helpers.url_depth(event.data) > self.config.get("max_depth"): self.debug(f"Exceeded max depth, aborting event") return @@ -77,17 +75,17 @@ def handle_event(self, event): for ext in self.extensions.split(","): exts.append(f".{ext}") - filters = self.baseline_ffuf(fixed_url, exts=exts) - for r in self.execute_ffuf(self.tempfile, fixed_url, exts=exts, filters=filters): + filters = await self.baseline_ffuf(fixed_url, exts=exts) + async for r in self.execute_ffuf(self.tempfile, fixed_url, exts=exts, filters=filters): self.emit_event(r["url"], "URL_UNVERIFIED", 
source=event, tags=[f"status-{r['status']}"]) - def filter_event(self, event): + async def filter_event(self, event): if "endpoint" in event.tags: self.debug(f"rejecting URL [{event.data}] because we don't ffuf endpoints") return False return True - def baseline_ffuf(self, url, exts=[""], prefix="", suffix="", mode="normal"): + async def baseline_ffuf(self, url, exts=[""], prefix="", suffix="", mode="normal"): filters = {} for ext in exts: self.debug(f"running baseline for URL [{url}] with ext [{ext}]") @@ -102,7 +100,7 @@ def baseline_ffuf(self, url, exts=[""], prefix="", suffix="", mode="normal"): canary_length += 2 canary_temp_file = self.helpers.tempfile(canary_list, pipe=False) - for canary_r in self.execute_ffuf( + async for canary_r in self.execute_ffuf( canary_temp_file, url, prefix=prefix, @@ -194,7 +192,7 @@ def baseline_ffuf(self, url, exts=[""], prefix="", suffix="", mode="normal"): return filters - def execute_ffuf( + async def execute_ffuf( self, tempfile, url, @@ -261,7 +259,7 @@ def execute_ffuf( command.append("-mc") command.append("all") - for found in self.helpers.run_live(command): + async for found in self.helpers.run_live(command): try: found_json = json.loads(found) input_json = found_json.get("input", {}) @@ -280,8 +278,9 @@ def execute_ffuf( if mode == "normal": # before emitting, we are going to send another baseline. This will immediately catch things like a WAF flipping blocking on us mid-scan if baseline == False: - pre_emit_temp_canary = list( - self.execute_ffuf( + pre_emit_temp_canary = [ + f + async for f in self.execute_ffuf( self.helpers.tempfile( ["".join(random.choice(string.ascii_lowercase) for i in range(4))], pipe=False, @@ -294,7 +293,7 @@ def execute_ffuf( baseline=True, filters=filters, ) - ) + ] if len(pre_emit_temp_canary) == 0: yield found_json else: diff --git a/bbot/modules/deadly/nuclei.py b/bbot/modules/deadly/nuclei.py index 9a36387162..f7c7ee2c86 100644 --- a/bbot/modules/deadly/nuclei.py +++ b/bbot/modules/deadly/nuclei.py @@ -13,7 +13,7 @@ class nuclei(BaseModule): batch_size = 25 options = { - "version": "2.8.9", + "version": "2.9.4", "tags": "", "templates": "", "severity": "", @@ -50,11 +50,11 @@ class nuclei(BaseModule): deps_pip = ["pyyaml~=6.0"] in_scope_only = True - def setup(self): + async def setup(self): # attempt to update nuclei templates self.nuclei_templates_dir = self.helpers.tools_dir / "nuclei-templates" self.info("Updating Nuclei templates") - update_results = self.helpers.run( + update_results = await self.helpers.run( ["nuclei", "-update-template-dir", self.nuclei_templates_dir, "-update-templates"] ) if update_results.stderr: @@ -127,10 +127,10 @@ def setup(self): return True - def handle_batch(self, *events): + async def handle_batch(self, *events): temp_target = self.helpers.make_target(events) nuclei_input = [str(e.data) for e in events] - for severity, template, host, url, name, extracted_results in self.execute_nuclei(nuclei_input): + async for severity, template, host, url, name, extracted_results in self.execute_nuclei(nuclei_input): # this is necessary because sometimes nuclei is inconsistent about the data returned in the host field cleaned_host = temp_target.get(host) source_event = self.correlate_event(events, cleaned_host) @@ -170,10 +170,10 @@ def correlate_event(self, events, host): return event self.warning("Failed to correlate nuclei result with event") - def execute_nuclei(self, nuclei_input): + async def execute_nuclei(self, nuclei_input): command = [ "nuclei", - "-json", + "-jsonl", 
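
The `canary` value set up in ffuf's `setup()` above drives a baseline check: random tokens that should never exist on a healthy target are requested first, and any hits mean the server wildcards responses, so results need filtering. A toy version of that idea (the `probe` callable stands in for real HTTP requests):

```python
import random
import string

def make_canaries(n=3, length=10):
    # random tokens that should never exist on a healthy target;
    # hits on these indicate wildcard responses that need filtering
    return ["".join(random.choices(string.ascii_lowercase, k=length)) for _ in range(n)]

def baseline_is_clean(probe, canaries):
    # probe() returns a status code for a candidate path
    return all(probe(c) == 404 for c in canaries)

# usage: a fake target that answers 200 to everything (a wildcard)
probe = lambda path: 200
print(baseline_is_clean(probe, make_canaries()))  # False -> add filters or abort
```
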
"-update-template-dir", self.nuclei_templates_dir, "-rate-limit", @@ -207,7 +207,7 @@ def execute_nuclei(self, nuclei_input): stats_file = self.helpers.tempfile_tail(callback=self.log_nuclei_status) try: with open(stats_file, "w") as stats_fh: - for line in self.helpers.run_live(command, input=nuclei_input, stderr=stats_fh): + async for line in self.helpers.run_live(command, input=nuclei_input, stderr=stats_fh): try: j = json.loads(line) except json.decoder.JSONDecodeError: @@ -258,11 +258,11 @@ def log_nuclei_status(self, line): status = f"[{duration}] | Templates: {templates} | Hosts: {hosts} | RPS: {rps} | Matched: {matched} | Errors: {errors} | Requests: {requests}/{total} ({percent}%)" self.info(status) - def cleanup(self): + async def cleanup(self): resume_file = self.helpers.current_dir / "resume.cfg" resume_file.unlink(missing_ok=True) - def filter_event(self, event): + async def filter_event(self, event): if self.config.get("directory_only", True): if "endpoint" in event.tags: self.debug( @@ -299,7 +299,7 @@ def find_budget_paths(self, budget): def get_yaml_request_attr(self, yf, attr): p = self.parse_yaml(yf) - requests = p.get("requests", []) + requests = p.get("http", []) for r in requests: raw = r.get("raw") if not raw: diff --git a/bbot/modules/deadly/vhost.py b/bbot/modules/deadly/vhost.py index 3c0a5c27a8..f4675e10fe 100644 --- a/bbot/modules/deadly/vhost.py +++ b/bbot/modules/deadly/vhost.py @@ -1,9 +1,7 @@ -from bbot.modules.deadly.ffuf import ffuf - -from urllib.parse import urlparse -import random -import string import base64 +from urllib.parse import urlparse + +from bbot.modules.deadly.ffuf import ffuf class vhost(ffuf): @@ -38,29 +36,12 @@ class vhost(ffuf): in_scope_only = True - def setup(self): - self.canary = "".join(random.choice(string.ascii_lowercase) for i in range(10)) + async def setup(self): self.scanned_hosts = {} self.wordcloud_tried_hosts = set() - self.wordlist = self.helpers.wordlist(self.config.get("wordlist")) - f = open(self.wordlist, "r") - self.wordlist_lines = f.readlines() - f.close() - self.ignore_redirects = True - self.tempfile, tempfile_len = self.generate_templist() - return True - - @staticmethod - def get_parent_domain(domain): - domain_parts = domain.split(".") - - if len(domain_parts) >= 3: - parent_domain = ".".join(domain_parts[1:]) - return parent_domain - else: - return domain - - def handle_event(self, event): + return await super().setup() + + async def handle_event(self, event): if not self.helpers.is_ip(event.host) or self.config.get("force_basehost"): host = f"{event.parsed.scheme}://{event.parsed.netloc}" if host in self.scanned_hosts.keys(): @@ -73,24 +54,24 @@ def handle_event(self, event): if self.config.get("force_basehost"): basehost = self.config.get("force_basehost") else: - basehost = self.get_parent_domain(event.parsed.netloc) + basehost = self.helpers.parent_domain(event.parsed.netloc) self.debug(f"Using basehost: {basehost}") - for vhost in self.ffuf_vhost(host, f".{basehost}", event): + async for vhost in self.ffuf_vhost(host, f".{basehost}", event): self.verbose(f"Starting mutations check for {vhost}") - for vhost in self.ffuf_vhost(host, f".{basehost}", event, wordlist=self.mutations_check(vhost)): + async for vhost in self.ffuf_vhost(host, f".{basehost}", event, wordlist=self.mutations_check(vhost)): pass # check existing host for mutations self.verbose("Checking for vhost mutations on main host") - for vhost in self.ffuf_vhost( + async for vhost in self.ffuf_vhost( host, f".{basehost}", event, 
wordlist=self.mutations_check(event.parsed.netloc.split(".")[0]) ): pass # special vhost list self.verbose("Checking special vhost list") - for vhost in self.ffuf_vhost( + async for vhost in self.ffuf_vhost( host, "", event, @@ -99,13 +80,15 @@ def handle_event(self, event): ): pass - def ffuf_vhost(self, host, basehost, event, wordlist=None, skip_dns_host=False): - filters = self.baseline_ffuf(f"{host}/", exts=[""], suffix=basehost, mode="hostheader") + async def ffuf_vhost(self, host, basehost, event, wordlist=None, skip_dns_host=False): + filters = await self.baseline_ffuf(f"{host}/", exts=[""], suffix=basehost, mode="hostheader") self.debug(f"Baseline completed and returned these filters:") self.debug(filters) if not wordlist: wordlist = self.tempfile - for r in self.execute_ffuf(wordlist, host, exts=[""], suffix=basehost, filters=filters, mode="hostheader"): + async for r in self.execute_ffuf( + wordlist, host, exts=[""], suffix=basehost, filters=filters, mode="hostheader" + ): found_vhost_b64 = r["input"]["FUZZ"] vhost_dict = {"host": str(event.host), "url": host, "vhost": base64.b64decode(found_vhost_b64).decode()} if f"{vhost_dict['vhost']}{basehost}" != event.parsed.netloc: @@ -123,7 +106,7 @@ def mutations_check(self, vhost): mutations_list_file = self.helpers.tempfile(mutations_list, pipe=False) return mutations_list_file - def finish(self): + async def finish(self): # check existing hosts with wordcloud tempfile = self.helpers.tempfile(list(self.helpers.word_cloud.keys()), pipe=False) @@ -135,9 +118,9 @@ def finish(self): if self.config.get("force_basehost"): basehost = self.config.get("force_basehost") else: - basehost = self.get_parent_domain(event.parsed.netloc) + basehost = self.helpers.parent_domain(event.parsed.netloc) - for vhost in self.ffuf_vhost(host, f".{basehost}", event, wordlist=tempfile): + async for vhost in self.ffuf_vhost(host, f".{basehost}", event, wordlist=tempfile): pass self.wordcloud_tried_hosts.add(host) diff --git a/bbot/modules/ffuf_shortnames.py b/bbot/modules/ffuf_shortnames.py index 513f61267b..d181319f03 100644 --- a/bbot/modules/ffuf_shortnames.py +++ b/bbot/modules/ffuf_shortnames.py @@ -72,22 +72,20 @@ class ffuf_shortnames(ffuf): in_scope_only = True - def setup(self): + async def setup(self): self.canary = "".join(random.choice(string.ascii_lowercase) for i in range(10)) wordlist = self.config.get("wordlist", "") if not wordlist: wordlist = f"{self.helpers.wordlist_dir}/ffuf_shortname_candidates.txt" self.debug(f"Using [{wordlist}] for shortname candidate list") - self.wordlist = self.helpers.wordlist(wordlist) - f = open(self.wordlist, "r") - self.wordlist_lines = f.readlines() - f.close() + self.wordlist = await self.helpers.wordlist(wordlist) + self.wordlist_lines = list(self.helpers.read_file(self.wordlist)) wordlist_extensions = self.config.get("wordlist_extensions", "") if not wordlist_extensions: wordlist_extensions = f"{self.helpers.wordlist_dir}/raft-small-extensions-lowercase_CLEANED.txt" self.debug(f"Using [{wordlist_extensions}] for shortname candidate extension list") - self.wordlist_extensions = self.helpers.wordlist(wordlist_extensions) + self.wordlist_extensions = await self.helpers.wordlist(wordlist_extensions) self.extensions = self.config.get("extensions") self.ignore_redirects = self.config.get("ignore_redirects") @@ -116,10 +114,10 @@ def find_delimeter(self, hint): return d, hint.split(d)[0], hint.split(d)[1] return None - def filter_event(self, event): + async def filter_event(self, event): return True - def 
handle_event(self, event): + async def handle_event(self, event): if event.source.type == "URL": filename_hint = re.sub(r"~\d", "", event.parsed.path.rsplit(".", 1)[0].split("/")[-1]).lower() @@ -151,11 +149,11 @@ def handle_event(self, event): if tempfile_len > 0: if "shortname-file" in event.tags: for ext in used_extensions: - for r in self.execute_ffuf(tempfile, root_url, suffix=f".{ext}"): + async for r in self.execute_ffuf(tempfile, root_url, suffix=f".{ext}"): self.emit_event(r["url"], "URL_UNVERIFIED", source=event, tags=[f"status-{r['status']}"]) elif "shortname-directory" in event.tags: - for r in self.execute_ffuf(tempfile, root_url, exts=["/"]): + async for r in self.execute_ffuf(tempfile, root_url, exts=["/"]): r_url = f"{r['url'].rstrip('/')}/" self.emit_event(r_url, "URL_UNVERIFIED", source=event, tags=[f"status-{r['status']}"]) @@ -166,7 +164,9 @@ def handle_event(self, event): delimeter, prefix, partial_hint = delimeter_r self.verbose(f"Detected delimeter [{delimeter}] in hint [{filename_hint}]") tempfile, tempfile_len = self.generate_templist(prefix=partial_hint) - for r in self.execute_ffuf(tempfile, root_url, prefix=f"{prefix}{delimeter}", exts=["/"]): + async for r in self.execute_ffuf( + tempfile, root_url, prefix=f"{prefix}{delimeter}", exts=["/"] + ): self.emit_event(r["url"], "URL_UNVERIFIED", source=event, tags=[f"status-{r['status']}"]) elif "shortname-file" in event.tags: @@ -176,14 +176,14 @@ def handle_event(self, event): delimeter, prefix, partial_hint = delimeter_r self.verbose(f"Detected delimeter [{delimeter}] in hint [{filename_hint}]") tempfile, tempfile_len = self.generate_templist(prefix=partial_hint) - for r in self.execute_ffuf( + async for r in self.execute_ffuf( tempfile, root_url, prefix=f"{prefix}{delimeter}", suffix=f".{ext}" ): self.emit_event( r["url"], "URL_UNVERIFIED", source=event, tags=[f"status-{r['status']}"] ) - def finish(self): + async def finish(self): if self.config.get("find_common_prefixes"): per_host_collection = dict(self.per_host_collection) self.per_host_collection.clear() @@ -208,7 +208,7 @@ def finish(self): f"Running common prefix check for URL_HINT: {hint} with prefix: {prefix} and partial_hint: {partial_hint}" ) - for r in self.execute_ffuf(tempfile, url, prefix=prefix, exts=["/"]): + async for r in self.execute_ffuf(tempfile, url, prefix=prefix, exts=["/"]): self.emit_event( r["url"], "URL_UNVERIFIED", @@ -222,7 +222,9 @@ def finish(self): self.verbose( f"Running common prefix check for URL_HINT: {hint} with prefix: {prefix}, extension: .{ext}, and partial_hint: {partial_hint}" ) - for r in self.execute_ffuf(tempfile, url, prefix=prefix, suffix=f".{ext}"): + async for r in self.execute_ffuf( + tempfile, url, prefix=prefix, suffix=f".{ext}" + ): self.emit_event( r["url"], "URL_UNVERIFIED", diff --git a/bbot/modules/hunt.py b/bbot/modules/hunt.py index 8f61a5a2af..64abd181eb 100644 --- a/bbot/modules/hunt.py +++ b/bbot/modules/hunt.py @@ -326,7 +326,7 @@ def extract_params(self, body): self.debug(f"FOUND PARAM ({s}) IN A TAG GET PARAMS") yield s - def handle_event(self, event): + async def handle_event(self, event): body = event.data.get("body", "") for p in self.extract_params(body): for k in hunt_param_dict.keys(): diff --git a/bbot/modules/iis_shortnames.py b/bbot/modules/iis_shortnames.py index 779781f52a..3ee204321f 100644 --- a/bbot/modules/iis_shortnames.py +++ b/bbot/modules/iis_shortnames.py @@ -24,7 +24,7 @@ class iis_shortnames(BaseModule): max_event_handlers = 8 - def detect(self, target): + async def 
detect(self, target): technique = None detections = [] random_string = self.helpers.rand_string(8) @@ -32,8 +32,8 @@ def detect(self, target): test_url = f"{target}*~1*/a.aspx" for method in ["GET", "POST", "OPTIONS", "DEBUG", "HEAD", "TRACE"]: - control = self.helpers.request(method=method, url=control_url, allow_redirects=False, timeout=10) - test = self.helpers.request(method=method, url=test_url, allow_redirects=False, timeout=10) + control = await self.helpers.request(method=method, url=control_url, allow_redirects=False, timeout=10) + test = await self.helpers.request(method=method, url=test_url, allow_redirects=False, timeout=10) if (control != None) and (test != None): if control.status_code != test.status_code: technique = f"{str(control.status_code)}/{str(test.status_code)} HTTP Code" @@ -46,7 +46,7 @@ def detect(self, target): technique = "HTTP Body Error Message" return detections - def setup(self): + async def setup(self): self.scanned_tracker_lock = Lock() self.scanned_tracker = set() return True @@ -55,10 +55,10 @@ def setup(self): def normalize_url(url): return str(url.rstrip("/") + "/").lower() - def directory_confirm(self, target, method, url_hint, affirmative_status_code): + async def directory_confirm(self, target, method, url_hint, affirmative_status_code): payload = encode_all(f"{url_hint}") url = f"{target}{payload}" - directory_confirm_result = self.helpers.request( + directory_confirm_result = await self.helpers.request( method=method, url=url, allow_redirects=False, retries=2, timeout=10 ) @@ -67,7 +67,7 @@ def directory_confirm(self, target, method, url_hint, affirmative_status_code): else: return False - def duplicate_check(self, target, method, url_hint, affirmative_status_code): + async def duplicate_check(self, target, method, url_hint, affirmative_status_code): duplicates = [] count = 2 base_hint = re.sub(r"~\d", "", url_hint) @@ -77,7 +77,7 @@ def duplicate_check(self, target, method, url_hint, affirmative_status_code): payload = encode_all(f"{base_hint}~{str(count)}*") url = f"{target}{payload}{suffix}" - duplicate_check_results = self.helpers.request( + duplicate_check_results = await self.helpers.request( method=method, url=url, allow_redirects=False, retries=2, timeout=10 ) if duplicate_check_results.status_code != affirmative_status_code: @@ -92,30 +92,30 @@ def duplicate_check(self, target, method, url_hint, affirmative_status_code): return duplicates - def threaded_request(self, method, url, affirmative_status_code): - r = self.helpers.request(method=method, url=url, allow_redirects=False, retries=2, timeout=10) + async def threaded_request(self, method, url, affirmative_status_code, c): + r = await self.helpers.request(method=method, url=url, allow_redirects=False, retries=2, timeout=10) if r is not None: if r.status_code == affirmative_status_code: - return True + return True, c + return None, c - def solve_shortname_recursive( + async def solve_shortname_recursive( self, method, target, prefix, affirmative_status_code, extension_mode=False, node_count=0 ): url_hint_list = [] found_results = False - futures = {} + tasks = [] for c in valid_chars: suffix = "\\a.aspx" wildcard = "*" if extension_mode else "*~1*" payload = encode_all(f"{prefix}{c}{wildcard}") url = f"{target}{payload}{suffix}" - future = self.submit_task(self.threaded_request, method, url, affirmative_status_code) - futures[future] = c + task = self.helpers.create_task(self.threaded_request(method, url, affirmative_status_code, c)) + tasks.append(task) - for future in 
self.helpers.as_completed(futures): - c = futures[future] - result = future.result() + for task in self.helpers.as_completed(tasks): + result, c = await task if result: found_results = True node_count += 1 @@ -130,12 +130,12 @@ def solve_shortname_recursive( wildcard = "~1*" payload = encode_all(f"{prefix}{c}{wildcard}") url = f"{target}{payload}{suffix}" - r = self.helpers.request(method=method, url=url, allow_redirects=False, retries=2, timeout=10) + r = await self.helpers.request(method=method, url=url, allow_redirects=False, retries=2, timeout=10) if r is not None: if r.status_code == affirmative_status_code: url_hint_list.append(f"{prefix}{c}") - url_hint_list += self.solve_shortname_recursive( + url_hint_list += await self.solve_shortname_recursive( method, target, f"{prefix}{c}", affirmative_status_code, extension_mode, node_count=node_count ) if len(prefix) > 0 and found_results == False: @@ -143,12 +143,12 @@ def solve_shortname_recursive( self.verbose(f"Found new (possibly partial) URL_HINT: {prefix} from node {target}") return url_hint_list - def handle_event(self, event): + async def handle_event(self, event): normalized_url = self.normalize_url(event.data) with self.scanned_tracker_lock: self.scanned_tracker.add(normalized_url) - detections = self.detect(normalized_url) + detections = await self.detect(normalized_url) technique_strings = [] if detections: @@ -171,7 +171,7 @@ def handle_event(self, event): break file_name_hints = list( - set(self.solve_shortname_recursive(method, normalized_url, "", affirmative_status_code)) + set(await self.solve_shortname_recursive(method, normalized_url, "", affirmative_status_code)) ) if len(file_name_hints) == 0: continue @@ -184,19 +184,19 @@ def handle_event(self, event): file_name_hints_dedupe = file_name_hints[:] for x in file_name_hints_dedupe: - duplicates = self.duplicate_check(normalized_url, method, x, affirmative_status_code) + duplicates = await self.duplicate_check(normalized_url, method, x, affirmative_status_code) if duplicates: file_name_hints += duplicates # check for the case of a folder and file with the same filename for d in file_name_hints: - if self.directory_confirm(normalized_url, method, d, affirmative_status_code): + if await self.directory_confirm(normalized_url, method, d, affirmative_status_code): self.verbose(f"Confirmed Directory URL_HINT: {d} from node {normalized_url}") url_hint_list.append(d) for y in file_name_hints: - file_name_extension_hints = self.solve_shortname_recursive( + file_name_extension_hints = await self.solve_shortname_recursive( method, normalized_url, f"{y}.", affirmative_status_code, extension_mode=True ) for z in file_name_extension_hints: @@ -212,7 +212,7 @@ def handle_event(self, event): hint_type = "shortname-directory" self.emit_event(f"{normalized_url}/{url_hint}", "URL_HINT", event, tags=[hint_type]) - def filter_event(self, event): + async def filter_event(self, event): if "dir" in event.tags: with self.scanned_tracker_lock: if self.normalize_url(event.data) not in self.scanned_tracker: diff --git a/bbot/modules/social.py b/bbot/modules/social.py index ed890daf2e..14af427d1b 100644 --- a/bbot/modules/social.py +++ b/bbot/modules/social.py @@ -22,11 +22,11 @@ class social(BaseModule): scope_distance_modifier = 1 - def setup(self): + async def setup(self): self.compiled_regexes = {k: re.compile(v) for k, v in self.social_media_regex.items()} return True - def handle_event(self, event): + async def handle_event(self, event): for platform, regex in self.compiled_regexes.items(): for 
match in regex.findall(event.data): social_media_links = {"platform": platform, "url": match} diff --git a/bbot/modules/url_manipulation.py b/bbot/modules/url_manipulation.py index 91eb4c5c50..851761dc2a 100644 --- a/bbot/modules/url_manipulation.py +++ b/bbot/modules/url_manipulation.py @@ -14,7 +14,7 @@ class url_manipulation(BaseModule): "allow_redirects": "Allowing redirects will sometimes create false positives. Disallowing will sometimes create false negatives. Allowed by default." } - def setup(self): + async def setup(self): # ([string]method,[string]path,[bool]strip trailing slash) self.signatures = [] @@ -38,7 +38,7 @@ def setup(self): self.allow_redirects = self.config.get("allow_redirects", True) return True - def handle_event(self, event): + async def handle_event(self, event): try: compare_helper = self.helpers.http_compare( event.data, allow_redirects=self.allow_redirects, include_cache_buster=False @@ -53,7 +53,7 @@ def handle_event(self, event): for sig in self.signatures: sig = self.format_signature(sig, event) - match, reasons, reflection, subject_response = compare_helper.compare( + match, reasons, reflection, subject_response = await compare_helper.compare( sig[1], method=sig[0], allow_redirects=self.allow_redirects ) diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 377b690f32..7538bb89c2 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -39,6 +39,7 @@ async def init_events(self): for event in sorted_events: self.scan.verbose(f"Target: {event}") self.queue_event(event) + await asyncio.sleep(0.1) self.scan._finished_init = True async def emit_event(self, event, *args, **kwargs): diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py index 11a99fe914..30088c65cf 100644 --- a/bbot/test/modules_test_classes.py +++ b/bbot/test/modules_test_classes.py @@ -1184,11 +1184,8 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "URL_UNVERIFIED": - if "admin" in e.data: - return True - return False + assert any(e.type == "URL_UNVERIFIED" and "admin" in e.data for e in events) + assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events) class Ffuf_extensions(HttpxMockHelper): @@ -1207,11 +1204,8 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "URL_UNVERIFIED": - if "console" in e.data: - return True - return False + assert any(e.type == "URL_UNVERIFIED" and "console" in e.data for e in events) + assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events) class Vhost(HttpxMockHelper): @@ -1273,15 +1267,11 @@ def check_events(self, events): if e.data["vhost"] == "secret": wordcloud_detection = True - if ( - basic_detection - and mutaton_of_detected - and basehost_mutation - and special_vhost_list - and wordcloud_detection - ): - return True - return False + assert basic_detection + assert mutaton_of_detected + assert basehost_mutation + assert special_vhost_list + assert wordcloud_detection class Ffuf_shortnames(HttpxMockHelper): @@ -1477,17 +1467,13 @@ def check_events(self, events): if e.data == "http://127.0.0.1:8888/short.pl": short_extensions_detection = True - if ( - basic_detection - and directory_detection - and prefix_detection - and delimeter_detection - and directory_delimeter_detection - and prefix_delimeter_detection - and 
short_extensions_detection - ): - return True - return False + assert basic_detection + assert directory_detection + assert prefix_detection + assert delimeter_detection + assert directory_delimeter_detection + assert prefix_delimeter_detection + assert short_extensions_detection class Iis_shortnames(HttpxMockHelper): @@ -1540,9 +1526,8 @@ def check_events(self, events): if e.type == "URL_HINT" and e.data == "http://127.0.0.1:8888/BLSHAX~1": url_hintEmitted = True - if vulnerabilityEmitted and url_hintEmitted: - return True - return False + assert vulnerabilityEmitted + assert url_hintEmitted class Nuclei_manual(HttpxMockHelper): @@ -1568,10 +1553,11 @@ class Nuclei_manual(HttpxMockHelper): "web_spider_depth": 1, "modules": { "nuclei": { + "version": "2.9.4", "mode": "manual", "concurrency": 2, "ratelimit": 10, - "templates": "/tmp/.bbot_test/tools/nuclei-templates/miscellaneous/", + "templates": "/tmp/.bbot_test/tools/nuclei-templates/http/miscellaneous/", "interactsh_disable": True, "directory_only": False, } @@ -1596,9 +1582,8 @@ def check_events(self, events): first_run_detect = True elif "Copyright" in e.data["description"]: second_run_detect = True - if first_run_detect and second_run_detect: - return True - return False + assert first_run_detect + assert second_run_detect class Nuclei_severe(HttpxMockHelper): @@ -1621,11 +1606,10 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "VULNERABILITY": - if "Generic Linux - Local File Inclusion" in e.data["description"]: - return True - return False + assert any( + e.type == "VULNERABILITY" and "Generic Linux - Local File Inclusion" in e.data["description"] + for e in events + ) class Nuclei_technology(HttpxMockHelper): @@ -1636,9 +1620,9 @@ class Nuclei_technology(HttpxMockHelper): "modules": {"nuclei": {"mode": "technology", "concurrency": 2, "tags": "apache"}}, } - def __init__(self, config, bbot_scanner, bbot_httpserver, caplog, *args, **kwargs): + def __init__(self, request, caplog, **kwargs): self.caplog = caplog - super().__init__(config, bbot_scanner, bbot_httpserver, *args, **kwargs) + super().__init__(request, **kwargs) def mock_args(self): expect_args = {"method": "GET", "uri": "/"} @@ -1651,12 +1635,7 @@ def mock_args(self): def check_events(self, events): if "Using Interactsh Server" in self.caplog.text: return False - - for e in events: - if e.type == "FINDING": - if "apache" in e.data["description"]: - return True - return False + assert any(e.type == "FINDING" and "apache" in e.data["description"] for e in events) class Nuclei_budget(HttpxMockHelper): @@ -1680,11 +1659,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING": - if "SpiderFoot" in e.data["description"]: - return True - return False + assert any(e.type == "FINDING" and "SpiderFoot" in e.data["description"] for e in events) class Url_manipulation(HttpxMockHelper): @@ -1716,14 +1691,12 @@ def mock_args(self): self.set_expect_requests(respond_args=respond_args) def check_events(self, events): - for e in events: - if ( - e.type == "FINDING" - and e.data["description"] - == f"Url Manipulation: [body] Sig: [Modified URL: http://127.0.0.1:8888/?{self.module.rand_string}=.xml]" - ): - return True - return False + assert any( + e.type == "FINDING" + and e.data["description"] + == f"Url Manipulation: [body] Sig: [Modified URL: 
http://127.0.0.1:8888/?{self.module.rand_string}=.xml]" + for e in events + ) class Naabu(HttpxMockHelper): @@ -1733,10 +1706,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "OPEN_TCP_PORT": - return True - return False + assert any(e.type == "OPEN_TCP_PORT" for e in events) class Social(HttpxMockHelper): @@ -1748,11 +1718,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "SOCIAL": - if e.data["platform"] == "discord": - return True - return False + assert any(e.type == "SOCIAL" and e.data["platform"] == "discord" for e in events) class Hunt(HttpxMockHelper): @@ -1764,13 +1730,10 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if ( - e.type == "FINDING" - and e.data["description"] == "Found potential INSECURE CRYPTOGRAPHY parameter [cipher]" - ): - return True - return False + assert any( + e.type == "FINDING" and e.data["description"] == "Found potential INSECURE CRYPTOGRAPHY parameter [cipher]" + for e in events + ) class Bypass403(HttpxMockHelper): @@ -1787,10 +1750,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING": - return True - return False + assert any(e.type == "FINDING" for e in events) class Bypass403_aspnetcookieless(HttpxMockHelper): @@ -1807,10 +1767,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING": - return True - return False + assert any(e.type == "FINDING" for e in events) class Bypass403_waf(HttpxMockHelper): @@ -1827,10 +1784,7 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "FINDING": - return False - return True + assert not any(e.type == "FINDING" for e in events) class Speculate_subdirectories(HttpxMockHelper): @@ -1851,8 +1805,4 @@ def mock_args(self): self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) def check_events(self, events): - for e in events: - if e.type == "URL_UNVERIFIED": - if e.data == "http://127.0.0.1:8888/subdir1/": - return True - return False + assert any(e.type == "URL_UNVERIFIED" and e.data == "http://127.0.0.1:8888/subdir1/" for e in events) diff --git a/bbot/test/test_step_1/test_modules_full.py b/bbot/test/test_step_1/test_modules_full.py index 3dea25d310..5c6ec38651 100644 --- a/bbot/test/test_step_1/test_modules_full.py +++ b/bbot/test/test_step_1/test_modules_full.py @@ -145,44 +145,50 @@ async def test_ffuf_extensions(request): @pytest.mark.asyncio -async def test_bypass403(request): - x = Bypass403(request) +async def test_vhost(request): + x = Vhost(request) await x.run() @pytest.mark.asyncio -async def test_bypass403_waf(request): - x = Bypass403_waf(request, module_name="bypass403") +async def test_ffuf_shortnames(request): + x = Ffuf_shortnames(request) await x.run() @pytest.mark.asyncio -async def test_bypass403_aspnetcookieless(request): - x = Bypass403_aspnetcookieless(request, module_name="bypass403") +async def test_iis_shortnames(request): + x = Iis_shortnames(request) await x.run() 
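A note on the check_events refactor above: returning a bare True/False from a scanning loop collapses every expectation into one opaque result, while separate assert any(...) / assert not any(...) checks let pytest report exactly which condition failed. A minimal, self-contained sketch of the pattern follows (the Event dataclass is a simplified stand-in for BBOT's event type, not the real class):

```python
# Sketch of the assert-based check_events pattern, using a hypothetical Event stand-in.
from dataclasses import dataclass


@dataclass
class Event:
    type: str
    data: str


def check_events(events):
    # each expectation is asserted on its own, so a failure names the exact condition
    assert any(e.type == "URL_UNVERIFIED" and "admin" in e.data for e in events)
    assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events)


check_events([Event("URL_UNVERIFIED", "http://127.0.0.1:8888/admin")])
```
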
@pytest.mark.asyncio -async def test_ffuf_shortnames(request): - x = Ffuf_shortnames(request) +async def test_nuclei_manual(request): + x = Nuclei_manual(request, module_name="nuclei") await x.run() @pytest.mark.asyncio -async def test_iis_shortnames(request): - x = Iis_shortnames(request) +async def test_bypass403(request): + x = Bypass403(request) await x.run() @pytest.mark.asyncio -async def test_nuclei_technology(request, caplog): - x = Nuclei_technology(request, caplog, module_name="nuclei") +async def test_bypass403_waf(request): + x = Bypass403_waf(request, module_name="bypass403") await x.run() @pytest.mark.asyncio -async def test_nuclei_manual(request): - x = Nuclei_manual(request, module_name="nuclei") +async def test_bypass403_aspnetcookieless(request): + x = Bypass403_aspnetcookieless(request, module_name="bypass403") + await x.run() + + +@pytest.mark.asyncio +async def test_nuclei_technology(request, caplog): + x = Nuclei_technology(request, caplog, module_name="nuclei") await x.run() @@ -216,12 +222,6 @@ async def test_hunt(request): await x.run() -@pytest.mark.asyncio -async def test_vhost(request): - x = Vhost(request) - await x.run() - - @pytest.mark.asyncio async def test_speculate_subdirectories(request): x = Speculate_subdirectories(request, module_name="speculate") diff --git a/bbot/test/test_step_2/test_threadpool.py b/bbot/test/test_step_2/test_threadpool.py deleted file mode 100644 index d4238b0062..0000000000 --- a/bbot/test/test_step_2/test_threadpool.py +++ /dev/null @@ -1,17 +0,0 @@ -def test_threadpool(): - from bbot.core.helpers.threadpool import BBOTThreadPoolExecutor, ThreadPoolWrapper, NamedLock, as_completed - - with BBOTThreadPoolExecutor(max_workers=3) as executor: - pool = ThreadPoolWrapper(executor) - add_one = lambda x: x + 1 - futures = [pool.submit_task(add_one, y) for y in [0, 1, 2, 3, 4]] - results = [] - for f in as_completed(futures): - results.append(f.result()) - assert tuple(sorted(results)) == (1, 2, 3, 4, 5) - - nl = NamedLock(max_size=5) - for i in range(50): - nl.get_lock(str(i)) - assert len(nl._cache) == 5 - assert tuple(nl._cache.keys()) == tuple(hash(str(x)) for x in [45, 46, 47, 48, 49]) From 530c5e20b123c907d9d18b9da934c5e0aa1bb20e Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sat, 13 May 2023 22:01:54 -0400 Subject: [PATCH 018/387] fixing more tests --- bbot/core/helpers/misc.py | 1 + bbot/test/test_step_2/test_helpers.py | 38 +- bbot/test/test_step_2/test_modules_basic.py | 451 ++++++++++---------- bbot/test/test_step_2/test_web.py | 14 + 4 files changed, 246 insertions(+), 258 deletions(-) diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index 7a6391a768..fda9cc8f2a 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -125,6 +125,7 @@ def split_host_port(d): def parent_domain(d): """ "www.internal.evilcorp.co.uk" --> "internal.evilcorp.co.uk" + "www.internal.evilcorp.co.uk:8080" --> "internal.evilcorp.co.uk:8080" "www.evilcorp.co.uk" --> "evilcorp.co.uk" "evilcorp.co.uk" --> "evilcorp.co.uk" """ diff --git a/bbot/test/test_step_2/test_helpers.py b/bbot/test/test_step_2/test_helpers.py index e3f9bc1d3b..2d9c6809df 100644 --- a/bbot/test/test_step_2/test_helpers.py +++ b/bbot/test/test_step_2/test_helpers.py @@ -1,12 +1,12 @@ import re import datetime import ipaddress -import requests_mock from ..bbot_fixtures import * -def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver): +@pytest.mark.asyncio +async def test_helpers(helpers, scan, bbot_scanner, bbot_config, 
bbot_httpserver): ### URL ### bad_urls = ( "http://e.co/index.html", @@ -46,17 +46,6 @@ def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver): assert helpers.url_depth("http://evilcorp.com/") == 0 assert helpers.url_depth("http://evilcorp.com") == 0 - ### HTTP COMPARE ### - with requests_mock.Mocker() as m: - m.get(re.compile(r"http://www.example.com.*"), text="wat") - compare_helper = helpers.http_compare("http://www.example.com") - compare_helper.compare("http://www.example.com", headers={"asdf": "asdf"}) - compare_helper.compare("http://www.example.com", cookies={"asdf": "asdf"}) - compare_helper.compare("http://www.example.com", check_reflection=True) - compare_helper.compare_body({"asdf": "fdsa"}, {"fdsa": "asdf"}) - for mode in ("getparam", "header", "cookie"): - compare_helper.canary_check("http://www.example.com", mode=mode) == True - ### MISC ### assert helpers.is_domain("evilcorp.co.uk") assert not helpers.is_domain("www.evilcorp.co.uk") @@ -382,12 +371,12 @@ def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver): for i in range(100): f.write(f"{i}\n") assert len(list(open(test_file).readlines())) == 100 - assert helpers.wordlist(test_file).is_file() - truncated_file = helpers.wordlist(test_file, lines=10) + assert (await helpers.wordlist(test_file)).is_file() + truncated_file = await helpers.wordlist(test_file, lines=10) assert truncated_file.is_file() assert len(list(open(truncated_file).readlines())) == 10 with pytest.raises(WordlistError): - helpers.wordlist("/tmp/a9pseoysadf/asdkgjaosidf") + await helpers.wordlist("/tmp/a9pseoysadf/asdkgjaosidf") test_file.unlink() # misc DNS helpers @@ -406,21 +395,6 @@ def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver): with pytest.raises(NTLMError): helpers.ntlm.ntlmdecode("asdf") - # interact.sh - with requests_mock.Mocker() as m: - from bbot.core.helpers.interactsh import server_list - - for server in server_list: - m.post(re.compile(rf"https://{server}/.*"), text="nope") - - interactsh_client = helpers.interactsh() - with pytest.raises(InteractshError): - interactsh_client.register() - with pytest.raises(InteractshError): - list(interactsh_client.poll()) - with pytest.raises(InteractshError): - interactsh_client.deregister() - test_filesize = Path("/tmp/test_filesize") test_filesize.touch() assert test_filesize.is_file() @@ -435,7 +409,7 @@ def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver): assert helpers.human_to_bytes("428.24GB") == 459819198709 scan1 = bbot_scanner(modules="ipneighbor") - scan1.load_modules() + await scan1.load_modules() assert int(helpers.get_size(scan1.modules["ipneighbor"])) > 0 diff --git a/bbot/test/test_step_2/test_modules_basic.py b/bbot/test/test_step_2/test_modules_basic.py index 7ab5de917b..301ca2ce16 100644 --- a/bbot/test/test_step_2/test_modules_basic.py +++ b/bbot/test/test_step_2/test_modules_basic.py @@ -1,242 +1,241 @@ import re -import requests_mock from contextlib import suppress from ..bbot_fixtures import * -def test_modules_basic(patch_commands, patch_ansible, scan, helpers, events, bbot_config, bbot_scanner): +@pytest.mark.asyncio +async def test_modules_basic(patch_commands, patch_ansible, scan, helpers, events, bbot_config, bbot_scanner, httpx_mock): fallback_nameservers = scan.helpers.temp_dir / "nameservers.txt" with open(fallback_nameservers, "w") as f: f.write("8.8.8.8\n") - with requests_mock.Mocker() as m: - for http_method in ("GET", "CONNECT", "HEAD", "POST", "PUT", "TRACE", "DEBUG", 
"PATCH", "DELETE", "OPTIONS"): - m.request(http_method, re.compile(r".*"), text='{"test": "test"}') - - # event filtering - from bbot.modules.base import BaseModule - from bbot.modules.output.base import BaseOutputModule - from bbot.modules.report.base import BaseReportModule - from bbot.modules.internal.base import BaseInternalModule - - # output module specific event filtering tests - base_output_module = BaseOutputModule(scan) - base_output_module.watched_events = ["IP_ADDRESS"] - localhost = scan.make_event("127.0.0.1", source=scan.root_event) - assert base_output_module._event_precheck(localhost)[0] == True - localhost._internal = True - assert base_output_module._event_precheck(localhost)[0] == False - localhost._force_output = True - assert base_output_module._event_precheck(localhost)[0] == True - localhost._omit = True - assert base_output_module._event_precheck(localhost)[0] == False - - # common event filtering tests - for module_class in (BaseModule, BaseOutputModule, BaseReportModule, BaseInternalModule): - base_module = module_class(scan) - localhost2 = scan.make_event("127.0.0.2", source=events.subdomain) - localhost2.make_in_scope() - # base cases - base_module._watched_events = None - base_module.watched_events = ["*"] - assert base_module._event_precheck(events.emoji)[0] == True - base_module._watched_events = None - base_module.watched_events = ["IP_ADDRESS"] - assert base_module._event_precheck(events.ipv4)[0] == True - assert base_module._event_precheck(events.domain)[0] == False - assert base_module._event_precheck(events.localhost)[0] == True - assert base_module._event_precheck(localhost2)[0] == True - # target only - base_module.target_only = True - assert base_module._event_precheck(localhost2)[0] == False - localhost2.add_tag("target") - assert base_module._event_precheck(localhost2)[0] == True - base_module.target_only = False - # special case for IPs and ranges - base_module.watched_events = ["IP_ADDRESS", "IP_RANGE"] - ip_range = scan.make_event("127.0.0.0/24", dummy=True) - localhost4 = scan.make_event("127.0.0.1", source=ip_range) - localhost4.make_in_scope() - localhost4.module = "plumbus" - assert base_module._event_precheck(localhost4)[0] == True - localhost4.module = "speculate" - assert base_module._event_precheck(localhost4)[0] == False - - # in scope only - base_module.in_scope_only = True - localhost3 = scan.make_event("127.0.0.2", source=events.subdomain) - valid, reason = base_module._event_postcheck(localhost3) - if base_module._type == "output": - assert valid - else: - assert not valid - assert reason == "it did not meet in_scope_only filter criteria" - base_module.in_scope_only = False - base_module.scope_distance_modifier = 0 - localhost4 = scan.make_event("127.0.0.1", source=events.subdomain) - valid, reason = base_module._event_postcheck(events.localhost) + for http_method in ("GET", "CONNECT", "HEAD", "POST", "PUT", "TRACE", "DEBUG", "PATCH", "DELETE", "OPTIONS"): + httpx_mock.add_response(method=http_method, url=re.compile(r".*"), json={"test": "test"}) + + # event filtering + from bbot.modules.base import BaseModule + from bbot.modules.output.base import BaseOutputModule + from bbot.modules.report.base import BaseReportModule + from bbot.modules.internal.base import BaseInternalModule + + # output module specific event filtering tests + base_output_module = BaseOutputModule(scan) + base_output_module.watched_events = ["IP_ADDRESS"] + localhost = scan.make_event("127.0.0.1", source=scan.root_event) + assert 
base_output_module._event_precheck(localhost)[0] == True + localhost._internal = True + assert base_output_module._event_precheck(localhost)[0] == False + localhost._force_output = True + assert base_output_module._event_precheck(localhost)[0] == True + localhost._omit = True + assert base_output_module._event_precheck(localhost)[0] == False + + # common event filtering tests + for module_class in (BaseModule, BaseOutputModule, BaseReportModule, BaseInternalModule): + base_module = module_class(scan) + localhost2 = scan.make_event("127.0.0.2", source=events.subdomain) + localhost2.make_in_scope() + # base cases + base_module._watched_events = None + base_module.watched_events = ["*"] + assert base_module._event_precheck(events.emoji)[0] == True + base_module._watched_events = None + base_module.watched_events = ["IP_ADDRESS"] + assert base_module._event_precheck(events.ipv4)[0] == True + assert base_module._event_precheck(events.domain)[0] == False + assert base_module._event_precheck(events.localhost)[0] == True + assert base_module._event_precheck(localhost2)[0] == True + # target only + base_module.target_only = True + assert base_module._event_precheck(localhost2)[0] == False + localhost2.add_tag("target") + assert base_module._event_precheck(localhost2)[0] == True + base_module.target_only = False + # special case for IPs and ranges + base_module.watched_events = ["IP_ADDRESS", "IP_RANGE"] + ip_range = scan.make_event("127.0.0.0/24", dummy=True) + localhost4 = scan.make_event("127.0.0.1", source=ip_range) + localhost4.make_in_scope() + localhost4.module = "plumbus" + assert base_module._event_precheck(localhost4)[0] == True + localhost4.module = "speculate" + assert base_module._event_precheck(localhost4)[0] == False + + # in scope only + base_module.in_scope_only = True + localhost3 = scan.make_event("127.0.0.2", source=events.subdomain) + valid, reason = await base_module._event_postcheck(localhost3) + if base_module._type == "output": assert valid - - base_output_module = BaseOutputModule(scan) - base_output_module.watched_events = ["IP_ADDRESS"] - - scan2 = bbot_scanner( - modules=list(set(available_modules + available_internal_modules)), - output_modules=list(available_output_modules), - config=bbot_config, - ) - scan2.helpers.dns.fallback_nameservers_file = fallback_nameservers - patch_commands(scan2) - patch_ansible(scan2) - scan2.load_modules() - scan2.status = "RUNNING" - - # attributes, descriptions, etc. 
- for module_name, module in scan2.modules.items(): - # flags - assert module._type in ("internal", "output", "scan") - - # module preloading - all_preloaded = module_loader.preloaded() - assert "massdns" in all_preloaded - assert "DNS_NAME" in all_preloaded["massdns"]["watched_events"] - assert "DNS_NAME" in all_preloaded["massdns"]["produced_events"] - assert "subdomain-enum" in all_preloaded["massdns"]["flags"] - assert "wordlist" in all_preloaded["massdns"]["config"] - assert type(all_preloaded["massdns"]["config"]["max_resolvers"]) == int - assert all_preloaded["sslcert"]["deps"]["pip"] - assert all_preloaded["sslcert"]["deps"]["apt"] - assert all_preloaded["massdns"]["deps"]["ansible"] - - for module_name, preloaded in all_preloaded.items(): - # either active or passive and never both - flags = preloaded.get("flags", []) - if preloaded["type"] == "scan": - assert ("active" in flags and not "passive" in flags) or ( - not "active" in flags and "passive" in flags - ), f'module "{module_name}" must have either "active" or "passive" flag' - assert preloaded.get("meta", {}).get("description", ""), f"{module_name} must have a description" - - # attribute checks - watched_events = preloaded.get("watched_events") - produced_events = preloaded.get("produced_events") - - assert type(watched_events) == list - assert type(produced_events) == list - if not preloaded.get("type", "") in ("internal",): - assert watched_events, f"{module_name}.watched_events must not be empty" - assert type(watched_events) == list, f"{module_name}.watched_events must be of type list" - assert type(produced_events) == list, f"{module_name}.produced_events must be of type list" - assert all( - [type(t) == str for t in watched_events] - ), f"{module_name}.watched_events entries must be of type string" - assert all( - [type(t) == str for t in produced_events] - ), f"{module_name}.produced_events entries must be of type string" - - assert type(preloaded.get("deps_pip", [])) == list, f"{module_name}.deps_pip must be of type list" - assert ( - type(preloaded.get("deps_pip_constraints", [])) == list - ), f"{module_name}.deps_pip_constraints must be of type list" - assert type(preloaded.get("deps_apt", [])) == list, f"{module_name}.deps_apt must be of type list" - assert type(preloaded.get("deps_shell", [])) == list, f"{module_name}.deps_shell must be of type list" - assert type(preloaded.get("config", None)) == dict, f"{module_name}.options must be of type list" + else: + assert not valid + assert reason == "it did not meet in_scope_only filter criteria" + base_module.in_scope_only = False + base_module.scope_distance_modifier = 0 + localhost4 = scan.make_event("127.0.0.1", source=events.subdomain) + valid, reason = await base_module._event_postcheck(events.localhost) + assert valid + + base_output_module = BaseOutputModule(scan) + base_output_module.watched_events = ["IP_ADDRESS"] + + scan2 = bbot_scanner( + modules=list(set(available_modules + available_internal_modules)), + output_modules=list(available_output_modules), + config=bbot_config, + ) + scan2.helpers.dns.fallback_nameservers_file = fallback_nameservers + patch_commands(scan2) + patch_ansible(scan2) + scan2.load_modules() + scan2.status = "RUNNING" + + # attributes, descriptions, etc. 
+ for module_name, module in scan2.modules.items(): + # flags + assert module._type in ("internal", "output", "scan") + + # module preloading + all_preloaded = module_loader.preloaded() + assert "massdns" in all_preloaded + assert "DNS_NAME" in all_preloaded["massdns"]["watched_events"] + assert "DNS_NAME" in all_preloaded["massdns"]["produced_events"] + assert "subdomain-enum" in all_preloaded["massdns"]["flags"] + assert "wordlist" in all_preloaded["massdns"]["config"] + assert type(all_preloaded["massdns"]["config"]["max_resolvers"]) == int + assert all_preloaded["sslcert"]["deps"]["pip"] + assert all_preloaded["sslcert"]["deps"]["apt"] + assert all_preloaded["massdns"]["deps"]["ansible"] + + for module_name, preloaded in all_preloaded.items(): + # either active or passive and never both + flags = preloaded.get("flags", []) + if preloaded["type"] == "scan": + assert ("active" in flags and not "passive" in flags) or ( + not "active" in flags and "passive" in flags + ), f'module "{module_name}" must have either "active" or "passive" flag' + assert preloaded.get("meta", {}).get("description", ""), f"{module_name} must have a description" + + # attribute checks + watched_events = preloaded.get("watched_events") + produced_events = preloaded.get("produced_events") + + assert type(watched_events) == list + assert type(produced_events) == list + if not preloaded.get("type", "") in ("internal",): + assert watched_events, f"{module_name}.watched_events must not be empty" + assert type(watched_events) == list, f"{module_name}.watched_events must be of type list" + assert type(produced_events) == list, f"{module_name}.produced_events must be of type list" + assert all( + [type(t) == str for t in watched_events] + ), f"{module_name}.watched_events entries must be of type string" + assert all( + [type(t) == str for t in produced_events] + ), f"{module_name}.produced_events entries must be of type string" + + assert type(preloaded.get("deps_pip", [])) == list, f"{module_name}.deps_pip must be of type list" + assert ( + type(preloaded.get("deps_pip_constraints", [])) == list + ), f"{module_name}.deps_pip_constraints must be of type list" + assert type(preloaded.get("deps_apt", [])) == list, f"{module_name}.deps_apt must be of type list" + assert type(preloaded.get("deps_shell", [])) == list, f"{module_name}.deps_shell must be of type list" + assert type(preloaded.get("config", None)) == dict, f"{module_name}.options must be of type list" + assert ( + type(preloaded.get("options_desc", None)) == dict + ), f"{module_name}.options_desc must be of type list" + # options must have descriptions + assert set(preloaded.get("config", {})) == set( + preloaded.get("options_desc", {}) + ), f"{module_name}.options do not match options_desc" + # descriptions most not be blank + assert all( + o for o in preloaded.get("options_desc", {}).values() + ), f"{module_name}.options_desc descriptions must not be blank" + + # setups + futures = {} + for module_name, module in scan2.modules.items(): + log.info(f"Testing {module_name}.setup()") + future = scan2._thread_pool.submit(module.setup) + futures[future] = module + for future in helpers.as_completed(futures): + module = futures[future] + result = future.result() + if type(result) == tuple: + assert len(result) == 2, f"if tuple, {module.name}.setup() return value must have length of 2" + status, msg = result + assert status in ( + True, + False, + None, + ), f"if tuple, the first element of {module.name}.setup()'s return value must be either True, False, or None" assert 
( - type(preloaded.get("options_desc", None)) == dict - ), f"{module_name}.options_desc must be of type list" - # options must have descriptions - assert set(preloaded.get("config", {})) == set( - preloaded.get("options_desc", {}) - ), f"{module_name}.options do not match options_desc" - # descriptions most not be blank - assert all( - o for o in preloaded.get("options_desc", {}).values() - ), f"{module_name}.options_desc descriptions must not be blank" - - # setups - futures = {} - for module_name, module in scan2.modules.items(): - log.info(f"Testing {module_name}.setup()") - future = scan2._thread_pool.submit(module.setup) + type(msg) == str + ), f"if tuple, the second element of {module.name}.setup()'s return value must be a message of type str" + else: + assert result in ( + True, + False, + None, + ), f"{module.name}.setup() must return a status of either True, False, or None" + if result == False: + module.set_error_state() + + futures.clear() + + # handle_event / handle_batch + futures = {} + for module_name, module in scan2.modules.items(): + module.emit_event = lambda *args, **kwargs: None + module._filter = lambda *args, **kwargs: True, "" + events_to_submit = [e for e in events.all if e.type in module.watched_events] + if module.batch_size > 1: + log.info(f"Testing {module_name}.handle_batch()") + future = scan2._thread_pool.submit(module.handle_batch, *events_to_submit) futures[future] = module - for future in helpers.as_completed(futures): - module = futures[future] - result = future.result() - if type(result) == tuple: - assert len(result) == 2, f"if tuple, {module.name}.setup() return value must have length of 2" - status, msg = result - assert status in ( - True, - False, - None, - ), f"if tuple, the first element of {module.name}.setup()'s return value must be either True, False, or None" - assert ( - type(msg) == str - ), f"if tuple, the second element of {module.name}.setup()'s return value must be a message of type str" - else: - assert result in ( - True, - False, - None, - ), f"{module.name}.setup() must return a status of either True, False, or None" - if result == False: - module.set_error_state() - - futures.clear() - - # handle_event / handle_batch - futures = {} - for module_name, module in scan2.modules.items(): - module.emit_event = lambda *args, **kwargs: None - module._filter = lambda *args, **kwargs: True, "" - events_to_submit = [e for e in events.all if e.type in module.watched_events] - if module.batch_size > 1: - log.info(f"Testing {module_name}.handle_batch()") - future = scan2._thread_pool.submit(module.handle_batch, *events_to_submit) + else: + for e in events_to_submit: + log.info(f"Testing {module_name}.handle_event()") + future = scan2._thread_pool.submit(module.handle_event, e) futures[future] = module - else: - for e in events_to_submit: - log.info(f"Testing {module_name}.handle_event()") - future = scan2._thread_pool.submit(module.handle_event, e) - futures[future] = module - for future in helpers.as_completed(futures): - try: - assert future.result() == None - except Exception as e: - import traceback - - module = futures[future] - assert module.errored == True, f'Error in module "{module}": {e}\n{traceback.format_exc()}' - futures.clear() - - # finishes - futures = {} - for module_name, module in scan2.modules.items(): - log.info(f"Testing {module_name}.finish()") - future = scan2._thread_pool.submit(module.finish) - futures[future] = module - for future in helpers.as_completed(futures): + for future in helpers.as_completed(futures): + try: 
assert future.result() == None - futures.clear() + except Exception as e: + import traceback - # cleanups - futures = {} - for module_name, module in scan2.modules.items(): - log.info(f"Testing {module_name}.cleanup()") - future = scan2._thread_pool.submit(module.cleanup) - futures[future] = module - for future in helpers.as_completed(futures): - assert future.result() == None - futures.clear() - - # event filters - for module_name, module in scan2.modules.items(): - log.info(f"Testing {module_name}.filter_event()") - result = module.filter_event(events.emoji) - with suppress(ValueError, TypeError): - result, reason = result - assert result in ( - True, - False, - ), f"{module_name}.filter_event() must return either True or False" + module = futures[future] + assert module.errored == True, f'Error in module "{module}": {e}\n{traceback.format_exc()}' + futures.clear() + + # finishes + futures = {} + for module_name, module in scan2.modules.items(): + log.info(f"Testing {module_name}.finish()") + future = scan2._thread_pool.submit(module.finish) + futures[future] = module + for future in helpers.as_completed(futures): + assert future.result() == None + futures.clear() + + # cleanups + futures = {} + for module_name, module in scan2.modules.items(): + log.info(f"Testing {module_name}.cleanup()") + future = scan2._thread_pool.submit(module.cleanup) + futures[future] = module + for future in helpers.as_completed(futures): + assert future.result() == None + futures.clear() + + # event filters + for module_name, module in scan2.modules.items(): + log.info(f"Testing {module_name}.filter_event()") + result = module.filter_event(events.emoji) + with suppress(ValueError, TypeError): + result, reason = result + assert result in ( + True, + False, + ), f"{module_name}.filter_event() must return either True or False" diff --git a/bbot/test/test_step_2/test_web.py b/bbot/test/test_step_2/test_web.py index 323abf8c6f..92fcfa1afe 100644 --- a/bbot/test/test_step_2/test_web.py +++ b/bbot/test/test_step_2/test_web.py @@ -1,3 +1,5 @@ +import re + from ..bbot_fixtures import * @@ -139,3 +141,15 @@ async def test_web_curl(bbot_scanner, bbot_config, bbot_httpserver): headers_url = bbot_httpserver.url_for("/test-custom-http-headers-curl") curl_result = await helpers.curl(url=headers_url) assert curl_result == "curl_yep_headers" + + +@pytest.mark.asyncio +async def test_web_http_compare(httpx_mock, helpers): + httpx_mock.add_response(re.compile(r"http://www.example.com.*"), text="wat") + compare_helper = helpers.http_compare("http://www.example.com") + await compare_helper.compare("http://www.example.com", headers={"asdf": "asdf"}) + await compare_helper.compare("http://www.example.com", cookies={"asdf": "asdf"}) + await compare_helper.compare("http://www.example.com", check_reflection=True) + compare_helper.compare_body({"asdf": "fdsa"}, {"fdsa": "asdf"}) + for mode in ("getparam", "header", "cookie"): + assert await compare_helper.canary_check("http://www.example.com", mode=mode) == True From 7a737f92fde2afbd5aa50164d01a217e40f2276c Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sat, 13 May 2023 22:02:46 -0400 Subject: [PATCH 019/387] blacked --- bbot/test/test_step_2/test_helpers.py | 1 - bbot/test/test_step_2/test_modules_basic.py | 8 ++++---- 2 files changed, 4 insertions(+), 5 deletions(-) diff --git a/bbot/test/test_step_2/test_helpers.py b/bbot/test/test_step_2/test_helpers.py index 2d9c6809df..9639f6110c 100644 --- a/bbot/test/test_step_2/test_helpers.py +++ b/bbot/test/test_step_2/test_helpers.py 
@@ -1,4 +1,3 @@ -import re import datetime import ipaddress diff --git a/bbot/test/test_step_2/test_modules_basic.py b/bbot/test/test_step_2/test_modules_basic.py index 301ca2ce16..5c5285ad2c 100644 --- a/bbot/test/test_step_2/test_modules_basic.py +++ b/bbot/test/test_step_2/test_modules_basic.py @@ -5,7 +5,9 @@ @pytest.mark.asyncio -async def test_modules_basic(patch_commands, patch_ansible, scan, helpers, events, bbot_config, bbot_scanner, httpx_mock): +async def test_modules_basic( + patch_commands, patch_ansible, scan, helpers, events, bbot_config, bbot_scanner, httpx_mock +): fallback_nameservers = scan.helpers.temp_dir / "nameservers.txt" with open(fallback_nameservers, "w") as f: f.write("8.8.8.8\n") @@ -141,9 +143,7 @@ async def test_modules_basic(patch_commands, patch_ansible, scan, helpers, event assert type(preloaded.get("deps_apt", [])) == list, f"{module_name}.deps_apt must be of type list" assert type(preloaded.get("deps_shell", [])) == list, f"{module_name}.deps_shell must be of type list" assert type(preloaded.get("config", None)) == dict, f"{module_name}.options must be of type list" - assert ( - type(preloaded.get("options_desc", None)) == dict - ), f"{module_name}.options_desc must be of type list" + assert type(preloaded.get("options_desc", None)) == dict, f"{module_name}.options_desc must be of type list" # options must have descriptions assert set(preloaded.get("config", {})) == set( preloaded.get("options_desc", {}) From 92b3a886a718aff0b68da4a408733a296c5d478a Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 15 May 2023 13:41:09 -0400 Subject: [PATCH 020/387] agent tests --- bbot/agent/agent.py | 176 ++++++++++++-------- bbot/agent/messages.py | 4 +- bbot/cli.py | 8 +- bbot/core/configurator/environ.py | 17 +- bbot/core/helpers/misc.py | 4 +- bbot/modules/base.py | 1 + bbot/modules/ipneighbor.py | 6 +- bbot/scanner/dispatcher.py | 19 ++- bbot/scanner/scanner.py | 32 ++-- bbot/test/bbot_fixtures.py | 24 +-- bbot/test/test.conf | 2 +- bbot/test/test_step_2/test_agent.py | 149 +++++++++++++++-- bbot/test/test_step_2/test_cloud_helpers.py | 5 +- bbot/test/test_step_2/test_config.py | 5 +- 14 files changed, 313 insertions(+), 139 deletions(-) diff --git a/bbot/agent/agent.py b/bbot/agent/agent.py index 3076119bef..f2a98b0cd1 100644 --- a/bbot/agent/agent.py +++ b/bbot/agent/agent.py @@ -1,15 +1,16 @@ import json +import asyncio import logging -import threading import traceback -import websocket -from time import sleep +import websockets from omegaconf import OmegaConf from . 
import messages
 import bbot.core.errors
 from bbot.scanner import Scanner
 from bbot.scanner.dispatcher import Dispatcher
+from bbot.core.helpers.misc import urlparse, split_host_port
+from bbot.core.configurator.environ import prepare_environment
 
 log = logging.getLogger("bbot.core.agent")
 
@@ -17,55 +18,97 @@ class Agent:
     def __init__(self, config):
         self.config = config
+        prepare_environment(self.config)
         self.url = self.config.get("agent_url", "")
+        self.parsed_url = urlparse(self.url)
+        self.host, self.port = split_host_port(self.parsed_url.netloc)
         self.token = self.config.get("agent_token", "")
         self.scan = None
-        self.thread = None
-        self._scan_lock = threading.Lock()
+        self.task = None
+        self._ws = None
+        self._scan_lock = asyncio.Lock()
         self.dispatcher = Dispatcher()
         self.dispatcher.on_status = self.on_scan_status
         self.dispatcher.on_finish = self.on_scan_finish
 
     def setup(self):
-        websocket.enableTrace(False)
         if not self.url:
             log.error(f"Must specify agent_url")
             return False
         if not self.token:
             log.error(f"Must specify agent_token")
             return False
-        self.ws = websocket.WebSocketApp(
-            f"{self.url}/control/",
-            on_open=self.on_open,
-            on_message=self.on_message,
-            on_error=self.on_error,
-            on_close=self.on_close,
-            header={"Authorization": f"Bearer {self.token}"},
-        )
         return True
 
-    def start(self):
-        not_keyboardinterrupt = False
+    async def ws(self, rebuild=False):
+        if self._ws is None or rebuild:
+            kwargs = {"close_timeout": 0.5}
+            if self.token:
+                kwargs.update({"extra_headers": {"Authorization": f"Bearer {self.token}"}})
+            verbs = ("Building", "Built")
+            if rebuild:
+                verbs = ("Rebuilding", "Rebuilt")
+            log.debug(f"{verbs[0]} websocket connection to {self.url}")
+            self._ws = await websockets.connect(self.url, **kwargs)
+            log.debug(f"{verbs[1]} websocket connection to {self.url}")
+        return self._ws
+
+    async def start(self):
+        rebuild = False
         while 1:
-            not_keyboardinterrupt = self.ws.run_forever()
-            if not not_keyboardinterrupt:
-                break
-            sleep(1)
+            ws = await self.ws(rebuild=rebuild)
+            rebuild = False
+            try:
+                message = await ws.recv()
+                log.debug(f"Got message: {message}")
+                try:
+                    message = json.loads(message)
+                    message = messages.Message(**message)
+
+                    if message.command == "ping":
+                        if self.scan is None:
+                            await self.send({"conversation": str(message.conversation), "message_type": "pong"})
+                        continue
+                    command_type = getattr(messages, message.command, None)
+                    if command_type is None:
+                        log.warning(f'Invalid command: "{message.command}"')
+                        continue
+
+                    command_args = command_type(**message.arguments)
+                    command_fn = getattr(self, message.command)
+                    response = await self.err_handle(command_fn, **command_args.dict())
+                    log.info(str(response))
+                    await self.send({"conversation": str(message.conversation), "message": response})
+
+                except json.decoder.JSONDecodeError as e:
+                    log.warning(f'Failed to decode message "{message}": {e}')
+                    log.trace(traceback.format_exc())
+                    continue
+            except Exception as e:
+                log.debug(f"Error receiving message: {e}")
+                log.debug(traceback.format_exc())
+                await asyncio.sleep(1)
+                rebuild = True
 
-    def send(self, message):
+    async def send(self, message):
+        rebuild = False
         while 1:
             try:
-                self.ws.send(json.dumps(message))
+                ws = await self.ws(rebuild=rebuild)
+                j = json.dumps(message)
+                log.debug(f"Sending message of length {len(j)}")
+                await ws.send(j)
+                rebuild = False
                 break
             except Exception as e:
-                if getattr(self.scan, "stopping", True):
-                    break
                 log.warning(f"Error sending message: {e}, retrying")
                 log.trace(traceback.format_exc())
-            sleep(1)
+                await asyncio.sleep(1)
+            # rebuild = True
 
-    def on_message(self, ws, message):
+    async def on_message(self, websocket, path):
+        message = await websocket.recv()
         try:
             message = json.loads(message)
         except Exception as e:
@@ -75,8 +118,10 @@ def on_message(self, ws, message):
 
         if message.command == "ping":
             if self.scan is None:
-                self.send({"conversation": str(message.conversation), "message_type": "pong"})
-            return
+                await self.send({"conversation": str(message.conversation), "message_type": "pong"})
+            return
+        else:
+            log.debug(f'Received command: "{message.command}"')
 
         command_type = None
         try:
@@ -86,21 +131,13 @@ def on_message(self, ws, message):
 
         command_args = command_type(**message.arguments)
         command_fn = getattr(self, message.command)
-        response = self.err_handle(command_fn, **command_args.dict())
-        log.info(str(response))
-        self.send({"conversation": str(message.conversation), "message": response})
-
-    def on_error(self, ws, error):
-        log.warning(f"on_error: {error}")
-
-    def on_close(self, ws, close_status_code, close_msg):
-        log.warning("Closed connection")
+        # run the requested command and report the result back over the websocket
+        response = await self.err_handle(command_fn, **command_args.dict())
+        log.info(str(response))
+        await self.send({"conversation": str(message.conversation), "message": response})
 
-    def on_open(self, ws):
-        log.success("Opened connection")
-
-    def start_scan(self, scan_id="", targets=[], modules=[], output_modules=[], config={}):
-        with self._scan_lock:
+    async def start_scan(self, scan_id="", name=None, targets=[], modules=[], output_modules=[], config={}):
+        async with self._scan_lock:
             if self.scan is None:
                 log.success(
                     f"Starting scan with targets={targets}, modules={modules}, output_modules={output_modules}"
@@ -111,27 +148,40 @@ def start_scan(self, scan_id="", targets=[], modules=[], output_modules=[], conf
                 config = OmegaConf.create(config)
                 config = OmegaConf.merge(self.config, config, output_module_config)
                 output_modules = list(set(output_modules + ["websocket"]))
-                self.scan = Scanner(
+                scan = Scanner(
                     *targets,
                     scan_id=scan_id,
+                    name=name,
                     modules=modules,
                     output_modules=output_modules,
                     config=config,
                     dispatcher=self.dispatcher,
                 )
-                self.thread = threading.Thread(target=self._start_scan, args=(self.scan,), daemon=True)
-                self.thread.start()
+                self.task = asyncio.create_task(self._start_scan_task(scan))
 
-                return {"success": f"Started scan", "scan_id": self.scan.id}
+                return {"success": f"Started scan", "scan_id": scan.id}
             else:
                 msg = f"Scan {self.scan.id} already in progress"
                 log.warning(msg)
                 return {"error": msg, "scan_id": self.scan.id}
 
-    def stop_scan(self):
+    async def _start_scan_task(self, scan):
+        self.scan = scan
+        try:
+            await scan.start_without_generator()
+        except bbot.core.errors.ScanError as e:
+            log.error(f"Scan error: {e}")
+            log.trace(traceback.format_exc())
+        except Exception:
+            log.critical(f"Encountered error: {traceback.format_exc()}")
+            await self.on_scan_status("FAILED", scan.id)
+        finally:
+            self.task = None
+
+    async def stop_scan(self):
         log.warning("Stopping scan")
         try:
-            with self._scan_lock:
+            async with self._scan_lock:
                 if self.scan is None:
                     msg = "Scan not in progress"
                     log.warning(msg)
@@ -147,40 +197,28 @@ def stop_scan(self):
             log.trace(traceback.format_exc())
         finally:
             self.scan = None
-            self.thread = None
+            self.task = None
 
-    def scan_status(self):
-        with self._scan_lock:
+    async def scan_status(self):
+        async with self._scan_lock:
             if self.scan is None:
-                self.thread = None
                 msg = "Scan not in progress"
                 log.warning(msg)
                 return {"error": msg}
             return {"success": "Polled scan", 
"scan_status": self.scan.status} - def on_scan_status(self, status, scan_id): - self.send({"message_type": "scan_status_change", "status": str(status), "scan_id": scan_id}) + async def on_scan_status(self, status, scan_id): + await self.send({"message_type": "scan_status_change", "status": str(status), "scan_id": scan_id}) - def on_scan_finish(self, scan): + async def on_scan_finish(self, scan): self.scan = None - self.thread = None + self.task = None - @staticmethod - def err_handle(callback, *args, **kwargs): + async def err_handle(self, callback, *args, **kwargs): try: - return callback(*args, **kwargs) + return await callback(*args, **kwargs) except Exception as e: msg = f"Error in {callback.__qualname__}(): {e}" log.error(msg) log.trace(traceback.format_exc()) return {"error": msg} - - def _start_scan(self, scan): - try: - scan.start_without_generator() - except bbot.core.errors.ScanError as e: - log.error(f"Scan error: {e}") - log.trace(traceback.format_exc()) - except Exception: - log.critical(f"Encountered error: {traceback.format_exc()}") - self.on_scan_status("FAILED", scan.id) diff --git a/bbot/agent/messages.py b/bbot/agent/messages.py index 3530fed114..34fd2c15c9 100644 --- a/bbot/agent/messages.py +++ b/bbot/agent/messages.py @@ -1,11 +1,12 @@ from uuid import UUID +from typing import Optional from pydantic import BaseModel class Message(BaseModel): conversation: UUID command: str - arguments: dict + arguments: Optional[dict] = {} ### COMMANDS ### @@ -17,6 +18,7 @@ class start_scan(BaseModel): modules: list output_modules: list = [] config: dict = {} + name: Optional[str] = None class stop_scan(BaseModel): diff --git a/bbot/cli.py b/bbot/cli.py index 8538e269d2..bc292f7c75 100755 --- a/bbot/cli.py +++ b/bbot/cli.py @@ -20,7 +20,7 @@ from bbot.modules import module_loader from bbot.core.configurator.args import parser from bbot.core.helpers.logger import log_to_stderr -from bbot.core.configurator import ensure_config_files, check_cli_args +from bbot.core.configurator import ensure_config_files, check_cli_args, environ log = logging.getLogger("bbot.cli") sys.stdout.reconfigure(line_buffering=True) @@ -39,6 +39,7 @@ async def _main(): global err global scan_name + environ.cli_execution = True ensure_config_files() @@ -70,7 +71,7 @@ async def _main(): agent = Agent(config) success = agent.setup() if success: - agent.start() + await agent.start() else: from bbot.scanner import Scanner @@ -293,9 +294,6 @@ def keyboard_listen(): log_to_stderr(str(e), level="ERROR") except Exception: raise - finally: - with suppress(NameError): - await scanner.cleanup() except bbot.core.errors.BBOTError as e: log_to_stderr(f"{e} (--debug for details)", level="ERROR") diff --git a/bbot/core/configurator/environ.py b/bbot/core/configurator/environ.py index c405037b14..23c7e78627 100644 --- a/bbot/core/configurator/environ.py +++ b/bbot/core/configurator/environ.py @@ -8,6 +8,10 @@ from ..helpers.misc import cpu_architecture, os_platform, os_platform_friendly +# keep track of whether BBOT is being executed via the CLI +cli_execution = False + + def flatten_config(config, base="bbot"): """ Flatten a JSON-like config into a list of environment variables: @@ -76,7 +80,7 @@ def prepare_environment(bbot_config): os.environ["BBOT_CPU_ARCH"] = cpu_architecture() # exchange certain options between CLI args and config - if args.cli_options is not None: + if cli_execution and args.cli_options is not None: # deps bbot_config["retry_deps"] = args.cli_options.retry_deps bbot_config["force_deps"] = 
args.cli_options.force_deps @@ -88,6 +92,17 @@ def prepare_environment(bbot_config): if args.cli_options.output_dir: bbot_config["output_dir"] = args.cli_options.output_dir + import logging + + log = logging.getLogger() + if bbot_config.get("debug", False): + global _log_level_override + bbot_config["silent"] = False + _log_level_override = logging.DEBUG + log = logging.getLogger("bbot") + log.setLevel(logging.DEBUG) + logging.getLogger("asyncio").setLevel(logging.DEBUG) + # copy config to environment bbot_environ = flatten_config(bbot_config) os.environ.update(bbot_environ) diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index fda9cc8f2a..4f5bc3d615 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -111,9 +111,9 @@ def split_host_port(d): host = None with suppress(ValueError): if parsed.port is None: - if parsed.scheme == "https": + if parsed.scheme in ("https", "wss"): port = 443 - elif parsed.scheme == "http": + elif parsed.scheme in ("http", "ws"): port = 80 else: port = int(parsed.port) diff --git a/bbot/modules/base.py b/bbot/modules/base.py index 4d1f626541..2e06ae3381 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -297,6 +297,7 @@ async def _setup(self): self.debug(f"Finished setting up module {self.name}") except Exception as e: self.set_error_state() + # soft-fail if it's only a wordlist error if isinstance(e, WordlistError): status = None msg = f"{e}" diff --git a/bbot/modules/ipneighbor.py b/bbot/modules/ipneighbor.py index 3cfe82ea77..207bbe99cb 100644 --- a/bbot/modules/ipneighbor.py +++ b/bbot/modules/ipneighbor.py @@ -13,17 +13,17 @@ class ipneighbor(BaseModule): scope_distance_modifier = 1 _scope_shepherding = False - def setup(self): + async def setup(self): self.processed = set() self.num_bits = max(1, int(self.config.get("num_bits", 4))) return True - def filter_event(self, event): + async def filter_event(self, event): if str(event.module) in ("speculate", "ipneighbor"): return False return True - def handle_event(self, event): + async def handle_event(self, event): main_ip = event.host netmask = main_ip.max_prefixlen - min(main_ip.max_prefixlen, self.num_bits) network = ipaddress.ip_network(f"{main_ip}/{netmask}", strict=False) diff --git a/bbot/scanner/dispatcher.py b/bbot/scanner/dispatcher.py index 763da4c62e..a9c56c2b72 100644 --- a/bbot/scanner/dispatcher.py +++ b/bbot/scanner/dispatcher.py @@ -1,3 +1,9 @@ +import logging +import traceback + +log = logging.getLogger("bbot.scanner.dispatcher") + + class Dispatcher: """ Enables custom hooks/callbacks on certain scan events @@ -6,14 +12,21 @@ class Dispatcher: def set_scan(self, scan): self.scan = scan - def on_start(self, scan): + async def on_start(self, scan): return - def on_finish(self, scan): + async def on_finish(self, scan): return - def on_status(self, status, scan_id): + async def on_status(self, status, scan_id): """ Execute an event when the scan's status is updated """ self.scan.debug(f"Setting scan status to {status}") + + async def catch(self, callback, *args, **kwargs): + try: + return await callback(*args, **kwargs) + except Exception as e: + log.error(f"Error in {callback.__qualname__}(): {e}") + log.trace(traceback.format_exc()) diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index d66330819d..c2459ad1cd 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -21,10 +21,10 @@ from bbot.core.event import make_event from bbot.core.helpers.misc import sha1, rand_string from bbot.core.helpers.helper import 
ConfigAwareHelper -from bbot.core.logger import init_logging, get_log_level from bbot.core.helpers.names_generator import random_name from bbot.core.configurator.environ import prepare_environment from bbot.core.errors import BBOTError, ScanError, ValidationError +from bbot.core.logger import init_logging, get_log_level, set_log_level log = logging.getLogger("bbot.scanner") @@ -74,6 +74,8 @@ def __init__( config = OmegaConf.create(config) self.config = OmegaConf.merge(bbot_config, config) prepare_environment(self.config) + if self.config.get("debug", False): + set_log_level(logging.DEBUG) self.strict_scope = strict_scope self.force_start = force_start @@ -198,18 +200,17 @@ async def start_without_generator(self): pass async def start(self): - await self.prep() - failed = True + scan_start_time = datetime.now() + try: + await self.prep() - if not self.target: - self.warning(f"No scan targets specified") + if not self.target: + self.warning(f"No scan targets specified") - # start status ticker - self.ticker_task = asyncio.create_task(self._status_ticker(self.status_frequency)) + # start status ticker + self.ticker_task = asyncio.create_task(self._status_ticker(self.status_frequency)) - scan_start_time = datetime.now() - try: self.status = "STARTING" if not self.modules: @@ -219,7 +220,7 @@ async def start(self): else: self.hugesuccess(f"Starting scan {self.name}") - self.dispatcher.on_start(self) + await self.dispatcher.on_start(self) # start manager worker loops self.manager_worker_loop_tasks = [ @@ -292,7 +293,7 @@ async def start(self): scan_run_time = self.helpers.human_timedelta(scan_run_time) log_fn(f"Scan {self.name} completed in {scan_run_time} with status {self.status}") - self.dispatcher.on_finish(self) + await self.dispatcher.on_finish(self) def start_modules(self): self.verbose(f"Starting module worker loops") @@ -455,9 +456,12 @@ def status(self, status): if self.status == "ABORTING" and not status == "ABORTED": self.debug(f'Attempt to set invalid status "{status}" on aborted scan') else: - self._status = status - self._status_code = self._status_codes[status] - self.dispatcher.on_status(self._status, self.id) + if status != self._status: + self._status = status + self._status_code = self._status_codes[status] + asyncio.create_task(self.dispatcher.catch(self.dispatcher.on_status, self._status, self.id)) + else: + self.debug(f'Scan status is already "{status}"') else: self.debug(f'Attempt to set invalid status "{status}" on scan') diff --git a/bbot/test/bbot_fixtures.py b/bbot/test/bbot_fixtures.py index 6ad61b914b..0306b3819b 100644 --- a/bbot/test/bbot_fixtures.py +++ b/bbot/test/bbot_fixtures.py @@ -298,36 +298,14 @@ class bbot_events: @pytest.fixture -def agent(monkeypatch, websocketapp, bbot_config): +def agent(monkeypatch, bbot_config): from bbot import agent - from bbot.modules.output.websocket import Websocket - - monkeypatch.setattr(Websocket, "send", lambda *args, **kwargs: True) test_agent = agent.Agent(bbot_config) test_agent.setup() - monkeypatch.setattr(test_agent, "ws", websocketapp()) return test_agent -@pytest.fixture -def websocketapp(): - class WebSocketApp: - def __init__(*args, **kwargs): - return - - def send(self, message): - assert type(message) == str - - def run_forever(*args, **kwargs): - return False - - def close(self): - return - - return WebSocketApp - - # bbot config from bbot import config as default_config diff --git a/bbot/test/test.conf b/bbot/test/test.conf index 5e534f5067..80daae5a53 100644 --- a/bbot/test/test.conf +++ b/bbot/test/test.conf 
@@ -33,7 +33,7 @@ dns_debug: true user_agent: "BBOT Test User-Agent" http_debug: false keep_scans: 1 -agent_url: test +agent_url: ws://127.0.0.1:8765 agent_token: test dns_resolution: false speculate: false diff --git a/bbot/test/test_step_2/test_agent.py b/bbot/test/test_step_2/test_agent.py index e64d3ed162..d5fc2b35ba 100644 --- a/bbot/test/test_step_2/test_agent.py +++ b/bbot/test/test_step_2/test_agent.py @@ -1,17 +1,140 @@ -from time import sleep +import json +import asyncio from ..bbot_fixtures import * # noqa: F401 -def test_agent(agent): - agent.start() - agent.on_error(agent.ws, "test") - agent.on_close(agent.ws, "test", "test") - agent.on_open(agent.ws) - agent.on_message( - agent.ws, - '{"conversation": "90196cc1-299f-4555-82a0-bc22a4247590", "command": "start_scan", "arguments": {"scan_id": "90196cc1-299f-4555-82a0-bc22a4247590", "targets": ["www.blacklanternsecurity.com"], "modules": ["ipneighbor"], "output_modules": ["human"]}}', - ) - sleep(0.5) - agent.scan_status() - agent.stop_scan() +_first_run = True +success = False +scan_done = asyncio.Event() + + +async def websocket_handler(websocket, path): + # whether this is the first run + global _first_run + first_run = int(_first_run) + # whether the test succeeded + global success + # test phase + phase = "ping" + # control channel or event channel? + control = True + + if path == "/" and first_run: + # test ping + await websocket.send(json.dumps({"conversation": "90196cc1-299f-4555-82a0-bc22a4247590", "command": "ping"})) + _first_run = False + else: + control = False + + # Bearer token + assert websocket.request_headers["Authorization"] == "Bearer test" + + async for message in websocket: + log.debug(f"PHASE: {phase}, MESSAGE: {message}") + if not control or not first_run: + continue + m = json.loads(message) + # ping + if phase == "ping": + assert json.loads(message)["message_type"] == "pong" + phase = "start_scan_bad" + if phase == "start_scan_bad": + await websocket.send( + json.dumps( + { + "conversation": "90196cc1-299f-4555-82a0-bc22a4247590", + "command": "start_scan", + "arguments": { + "scan_id": "90196cc1-299f-4555-82a0-bc22a4247590", + "targets": ["127.0.0.2"], + "modules": ["asdf"], + "output_modules": ["human"], + "name": "agent_test_scan_bad", + }, + } + ) + ) + phase = "success" + continue + # scan start success + if phase == "success": + assert m["message"]["success"] == "Started scan" + phase = "cleaning_up" + continue + # CLEANING_UP status message + if phase == "cleaning_up": + assert m["message_type"] == "scan_status_change" + assert m["status"] == "CLEANING_UP" + phase = "failed" + continue + # FAILED status message + if phase == "failed": + assert m["message_type"] == "scan_status_change" + assert m["status"] == "FAILED" + phase = "start_scan" + # start good scan + if phase == "start_scan": + await websocket.send( + json.dumps( + { + "conversation": "90196cc1-299f-4555-82a0-bc22a4247590", + "command": "start_scan", + "arguments": { + "scan_id": "90196cc1-299f-4555-82a0-bc22a4247590", + "targets": ["127.0.0.2"], + "modules": ["ipneighbor"], + "output_modules": ["human"], + "name": "agent_test_scan", + }, + } + ) + ) + phase = "success_2" + continue + # scan start success + if phase == "success_2": + assert m["message"]["success"] == "Started scan" + phase = "starting" + continue + # STARTING status message + if phase == "starting": + assert m["message_type"] == "scan_status_change" + assert m["status"] == "STARTING" + phase = "running" + continue + # RUNNING status message + if phase == "running": + 
assert m["message_type"] == "scan_status_change" + assert m["status"] == "RUNNING" + phase = "finishing" + continue + # FINISHING status message + if phase == "finishing": + assert m["message_type"] == "scan_status_change" + assert m["status"] == "FINISHING" + phase = "cleaning_up_2" + continue + # CLEANING_UP status message + if phase == "cleaning_up_2": + assert m["message_type"] == "scan_status_change" + assert m["status"] == "CLEANING_UP" + phase = "finished_2" + continue + # FINISHED status message + if phase == "finished_2": + assert m["message_type"] == "scan_status_change" + assert m["status"] == "FINISHED" + success = True + scan_done.set() + break + + +@pytest.mark.asyncio +async def test_agent(agent): + global success + async with websockets.serve(websocket_handler, "127.0.0.1", 8765): + asyncio.create_task(agent.start()) + # wait for 30 seconds + await asyncio.wait_for(scan_done.wait(), 10) + assert success diff --git a/bbot/test/test_step_2/test_cloud_helpers.py b/bbot/test/test_step_2/test_cloud_helpers.py index 49f5a74109..c4494037bc 100644 --- a/bbot/test/test_step_2/test_cloud_helpers.py +++ b/bbot/test/test_step_2/test_cloud_helpers.py @@ -1,9 +1,10 @@ from ..bbot_fixtures import * # noqa: F401 -def test_cloud_helpers(monkeypatch, bbot_scanner, bbot_config): +@pytest.mark.asyncio +async def test_cloud_helpers(monkeypatch, bbot_scanner, bbot_config): scan1 = bbot_scanner("127.0.0.1", config=bbot_config) - scan1.load_modules() + await scan1.load_modules() aws_event1 = scan1.make_event("amazonaws.com", source=scan1.root_event) aws_event2 = scan1.make_event("asdf.amazonaws.com", source=scan1.root_event) aws_event3 = scan1.make_event("asdfamazonaws.com", source=scan1.root_event) diff --git a/bbot/test/test_step_2/test_config.py b/bbot/test/test_step_2/test_config.py index 3fa7961f27..2d9980a2c7 100644 --- a/bbot/test/test_step_2/test_config.py +++ b/bbot/test/test_step_2/test_config.py @@ -1,9 +1,10 @@ from ..bbot_fixtures import * # noqa: F401 -def test_config(bbot_config, bbot_scanner): +@pytest.mark.asyncio +async def test_config(bbot_config, bbot_scanner): scan1 = bbot_scanner("127.0.0.1", modules=["ipneighbor", "speculate"], config=bbot_config) - scan1.load_modules() + await scan1.load_modules() assert scan1.config.plumbus == "asdf" assert scan1.modules["ipneighbor"].config.test_option == "ipneighbor" assert scan1.modules["python"].config.test_option == "asdf" From b8ee5ad561587434e63da422c704a11db448b1cb Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 15 May 2023 14:20:47 -0400 Subject: [PATCH 021/387] fix NameError --- bbot/test/test_step_2/test_agent.py | 1 + 1 file changed, 1 insertion(+) diff --git a/bbot/test/test_step_2/test_agent.py b/bbot/test/test_step_2/test_agent.py index d5fc2b35ba..63121d6d19 100644 --- a/bbot/test/test_step_2/test_agent.py +++ b/bbot/test/test_step_2/test_agent.py @@ -1,5 +1,6 @@ import json import asyncio +import websockets from ..bbot_fixtures import * # noqa: F401 From 8683f042f0c5c2cf583494e5976e880a7fa8562f Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 15 May 2023 15:12:23 -0400 Subject: [PATCH 022/387] manager tests passing --- bbot/scanner/manager.py | 1 + bbot/test/bbot_fixtures.py | 12 +++- bbot/test/test_step_2/test_agent.py | 1 - bbot/test/test_step_2/test_events.py | 3 +- bbot/test/test_step_2/test_manager.py | 74 +++++++++++++++--------- bbot/test/test_step_2/test_python_api.py | 1 + bbot/test/test_step_2/test_scan.py | 3 +- bbot/test/test_step_2/test_scope.py | 10 ++-- 8 files changed, 67 insertions(+), 
38 deletions(-) diff --git a/bbot/scanner/manager.py b/bbot/scanner/manager.py index 7538bb89c2..d61fa5b14b 100644 --- a/bbot/scanner/manager.py +++ b/bbot/scanner/manager.py @@ -237,6 +237,7 @@ async def _emit_event(self, event, *args, **kwargs): if self.dns_resolution: emit_children = -1 < event.scope_distance < self.scan.dns_search_distance if emit_children: + # only emit DNS children once for each unique host host_hash = hash(str(event.host)) if host_hash in self.events_accepted: emit_children = False diff --git a/bbot/test/bbot_fixtures.py b/bbot/test/bbot_fixtures.py index 0306b3819b..5b8d2ffe0e 100644 --- a/bbot/test/bbot_fixtures.py +++ b/bbot/test/bbot_fixtures.py @@ -1,6 +1,7 @@ import os import sys import pytest +import asyncio # noqa import logging import subprocess import tldextract @@ -71,6 +72,8 @@ def patch_commands(): # ffuf """{"input":{"FUZZ":"L2luZGV4Lmh0bWw="},"position":1,"status":200,"length":1256,"words":298,"lines":47,"content-type":"text/html;charset=UTF-8","redirectlocation":"","url":"http://example.com:80//index.html","duration":101243249,"resultfile":"","host":"example.com:80"}""", "https://api.publicapis.org:443/health", + # fingerprintx + """{"ip":"8.8.8.8","port":443,"protocol":"https","tls":true,"transport":"tcp","version":"HTTP server (unknown)","metadata":{"status":"302 Found","statusCode":302,"responseHeaders":{"Access-Control-Allow-Origin":["*"],"Alt-Svc":["h3=\":443\"; ma=2592000,h3-29=\":443\"; ma=2592000"],"Content-Length":["216"],"Content-Type":["text/html; charset=UTF-8"],"Date":["Mon, 15 May 2023 18:34:49 GMT"],"Location":["https://dns.google/"],"Server":["HTTP server (unknown)"],"X-Content-Type-Options":["nosniff"],"X-Frame-Options":["SAMEORIGIN"],"X-Xss-Protection":["0"]},"technologies":["HTTP/3"]}}""", # open port "api.publicapis.org:443", # host @@ -80,10 +83,11 @@ def patch_commands(): ] def patch_scan_commands(scanner): - def run(*args, **kwargs): + async def run(*args, **kwargs): log.debug(f"helpers.command.run(args={args}, kwargs={kwargs})") text = kwargs.get("text", True) - return subprocess.run(["echo", "\n".join(sample_output)], text=text, stdout=subprocess.PIPE) + output = "\n".join(sample_output) + return subprocess.run(["echo", output], text=text) def run_live(*args, **kwargs): log.debug(f"helpers.command.run_live(args={args}, kwargs={kwargs})") @@ -156,7 +160,6 @@ def scan(monkeypatch, patch_ansible, patch_commands, bbot_config): bbot_scan = Scanner("127.0.0.1", modules=["ipneighbor"], config=bbot_config) patch_commands(bbot_scan) patch_ansible(bbot_scan) - bbot_scan.status = "RUNNING" fallback_nameservers_file = bbot_scan.helpers.bbot_home / "fallback_nameservers.txt" with open(fallback_nameservers_file, "w") as f: @@ -312,6 +315,9 @@ def agent(monkeypatch, bbot_config): test_config = OmegaConf.load(Path(__file__).parent / "test.conf") test_config = OmegaConf.merge(default_config, test_config) +if test_config.get("debug", False): + logging.getLogger("bbot").setLevel(logging.DEBUG) + @pytest.fixture def bbot_config(): diff --git a/bbot/test/test_step_2/test_agent.py b/bbot/test/test_step_2/test_agent.py index 63121d6d19..a673effeae 100644 --- a/bbot/test/test_step_2/test_agent.py +++ b/bbot/test/test_step_2/test_agent.py @@ -1,5 +1,4 @@ import json -import asyncio import websockets from ..bbot_fixtures import * # noqa: F401 diff --git a/bbot/test/test_step_2/test_events.py b/bbot/test/test_step_2/test_events.py index f184f91b60..03ebde6354 100644 --- a/bbot/test/test_step_2/test_events.py +++ b/bbot/test/test_step_2/test_events.py @@ 
-5,7 +5,8 @@ from ..bbot_fixtures import * -def test_events(events, scan, helpers, bbot_config): +@pytest.mark.asyncio +async def test_events(events, scan, helpers, bbot_config): assert events.ipv4.type == "IP_ADDRESS" assert events.ipv6.type == "IP_ADDRESS" assert events.netv4.type == "IP_RANGE" diff --git a/bbot/test/test_step_2/test_manager.py b/bbot/test/test_step_2/test_manager.py index eff5190e4d..6b43ce07d8 100644 --- a/bbot/test/test_step_2/test_manager.py +++ b/bbot/test/test_step_2/test_manager.py @@ -1,7 +1,8 @@ from ..bbot_fixtures import * # noqa: F401 -def test_manager(bbot_config, bbot_scanner): +@pytest.mark.asyncio +async def test_manager(bbot_config, bbot_scanner): dns_config = OmegaConf.merge( default_config, OmegaConf.create({"dns_resolution": True, "scope_report_distance": 1}) ) @@ -9,14 +10,25 @@ def test_manager(bbot_config, bbot_scanner): # test _emit_event results = [] output = [] + event_children = [] + + async def results_append(e): + results.append(e) + + async def output_append(e): + output.append(e) + + def event_children_append(e): + event_children.append(e) + success_callback = lambda e: results.append("success") scan1 = bbot_scanner("127.0.0.1", modules=["ipneighbor"], output_modules=["human"], config=dns_config) - scan1.load_modules() + await scan1.load_modules() module = scan1.modules["ipneighbor"] module.scope_distance_modifier = 0 - module.queue_event = lambda e: results.append(e) + module.queue_event = results_append output_module = scan1.modules["human"] - output_module.queue_event = lambda e: output.append(e) + output_module.queue_event = output_append scan1.status = "RUNNING" manager = scan1.manager # manager.distribute_event = lambda e: results.append(e) @@ -36,11 +48,17 @@ class DummyModule3: localhost.module = DummyModule1() # make sure abort_if works as intended - manager._emit_event(localhost, abort_if=lambda e: e.module._type == "output") + await manager._emit_event(localhost, abort_if=lambda e: e.module._type == "output") assert len(results) == 0 manager.events_accepted.clear() + manager.events_distributed.clear() + await manager._emit_event(localhost, abort_if=lambda e: e.module._type != "output") + assert len(results) == 1 + results.clear() + manager.events_accepted.clear() + manager.events_distributed.clear() # make sure success_callback works as intended - manager._emit_event( + await manager._emit_event( localhost, on_success_callback=success_callback, abort_if=lambda e: e.module._type == "plumbus" ) assert localhost in results @@ -55,9 +73,8 @@ class DummyModule3: googledns.module = DummyModule2() googledns.source = "asdf" googledns.make_in_scope() - event_children = [] - manager.emit_event = lambda e, *args, **kwargs: event_children.append(e) - manager._emit_event(googledns) + manager.queue_event = event_children_append + await manager._emit_event(googledns) assert len(event_children) > 0 assert googledns in results assert googledns in output @@ -65,7 +82,7 @@ class DummyModule3: output.clear() event_children.clear() # make sure deduplication catches the same event - manager._emit_event(googledns) + await manager._emit_event(googledns) assert len(output) == 0 assert len(results) == 0 assert len(event_children) == 0 @@ -73,7 +90,7 @@ class DummyModule3: event_children.clear() # make sure _force_output overrides dup detection googledns._force_output = True - manager._emit_event(googledns) + await manager._emit_event(googledns) assert googledns in output assert len(event_children) == 0 googledns._force_output = False @@ -83,7 +100,7 @@ 
class DummyModule3: source_event = manager.scan.make_event("1.2.3.4", "IP_ADDRESS", source=manager.scan.root_event) source_event._resolved.set() googledns.source = source_event - manager._emit_event(googledns) + await manager._emit_event(googledns) assert len(event_children) == 0 assert googledns in output @@ -91,21 +108,22 @@ class DummyModule3: msg = "Ignore this error, it belongs here" exceptions = (Exception(msg), KeyboardInterrupt(msg), BrokenPipeError(msg)) for e in exceptions: - with manager.catch(): + with manager.scan.catch(): raise e -def test_scope_distance(bbot_scanner, bbot_config): +@pytest.mark.asyncio +async def test_scope_distance(bbot_scanner, bbot_config): # event filtering based on scope_distance scan1 = bbot_scanner( "127.0.0.1", "evilcorp.com", modules=["ipneighbor"], output_modules=["json"], config=bbot_config ) scan1.status = "RUNNING" - scan1.load_modules() + await scan1.load_modules() module = scan1.modules["ipneighbor"] - module_queue = module.incoming_event_queue.queue + module_queue = module.incoming_event_queue._queue output_module = scan1.modules["json"] - output_queue = output_module.incoming_event_queue.queue + output_queue = output_module.incoming_event_queue._queue manager = scan1.manager test_event1 = scan1.make_event("127.0.0.1", source=scan1.root_event) @@ -114,7 +132,7 @@ def test_scope_distance(bbot_scanner, bbot_config): assert module.scope_distance_modifier == 1 # test _emit_event() with scope_distance == 0 - manager._emit_event(test_event1) + await manager._emit_event(test_event1) assert test_event1.scope_distance == 0 assert test_event1._internal == False assert test_event1 in output_queue @@ -127,41 +145,41 @@ def test_scope_distance(bbot_scanner, bbot_config): dns_event = scan1.make_event("evilcorp.com", source=scan1.root_event) # non-watched event type - manager._emit_event(dns_event) + await manager._emit_event(dns_event) assert dns_event.scope_distance == 0 assert dns_event in output_queue assert dns_event not in module_queue # test _emit_event() with scope_distance == 1 assert test_event2.scope_distance == 1 - manager._emit_event(test_event2) + await manager._emit_event(test_event2) assert test_event2.scope_distance == 1 assert test_event2._internal == True assert test_event2 not in output_queue assert test_event2 in module_queue - valid, reason = module._event_postcheck(test_event2) + valid, reason = await module._event_postcheck(test_event2) assert valid # test _emit_event() with scope_distance == 2 assert test_event3.scope_distance == 2 - manager._emit_event(test_event3) + await manager._emit_event(test_event3) assert test_event3.scope_distance == 2 assert test_event3._internal == True assert test_event3 not in output_queue assert test_event3 in module_queue - valid, reason = module._event_postcheck(test_event3) + valid, reason = await module._event_postcheck(test_event3) assert not valid assert reason.startswith("its scope_distance (2) exceeds the maximum allowed by the scan") # test _emit_event() with scope_distance == 2 and _force_output == True assert test_event4.scope_distance == 2 - manager._emit_event(test_event4) + await manager._emit_event(test_event4) assert test_event4.scope_distance == 2 assert test_event4._internal == True assert test_event4._force_output == True assert test_event4 in output_queue assert test_event4 in module_queue - valid, reason = module._event_postcheck(test_event4) + valid, reason = await module._event_postcheck(test_event4) assert not valid assert reason.startswith("its scope_distance (2) exceeds the 
maximum allowed by the scan") @@ -170,7 +188,7 @@ def test_scope_distance(bbot_scanner, bbot_config): assert geoevent.scope_distance == 3 assert geoevent.always_emit == True assert geoevent._force_output == False - manager._emit_event(geoevent) + await manager._emit_event(geoevent) assert geoevent._force_output == True assert geoevent in output_queue assert geoevent not in module_queue @@ -183,10 +201,10 @@ def test_scope_distance(bbot_scanner, bbot_config): assert affiliate_event._always_emit == False assert affiliate_event.always_emit == True assert affiliate_event._force_output == False - manager._emit_event(affiliate_event) + await manager._emit_event(affiliate_event) assert affiliate_event._force_output == True assert affiliate_event in output_queue assert affiliate_event in module_queue - valid, reason = module._event_postcheck(affiliate_event) + valid, reason = await module._event_postcheck(affiliate_event) assert not valid assert reason.startswith("its scope_distance (3) exceeds the maximum allowed by the scan") diff --git a/bbot/test/test_step_2/test_python_api.py b/bbot/test/test_step_2/test_python_api.py index 00b26f3a6e..f4ef428af9 100644 --- a/bbot/test/test_step_2/test_python_api.py +++ b/bbot/test/test_step_2/test_python_api.py @@ -1,6 +1,7 @@ from ..bbot_fixtures import * +@pytest.mark.asyncio def test_python_api(bbot_config): from bbot.scanner import Scanner diff --git a/bbot/test/test_step_2/test_scan.py b/bbot/test/test_step_2/test_scan.py index 6e60c2190e..2bde71a382 100644 --- a/bbot/test/test_step_2/test_scan.py +++ b/bbot/test/test_step_2/test_scan.py @@ -1,7 +1,8 @@ from ..bbot_fixtures import * -def test_scan( +@pytest.mark.asyncio +async def test_scan( patch_ansible, patch_commands, events, diff --git a/bbot/test/test_step_2/test_scope.py b/bbot/test/test_step_2/test_scope.py index 2fe92373b2..55838d3458 100644 --- a/bbot/test/test_step_2/test_scope.py +++ b/bbot/test/test_step_2/test_scope.py @@ -36,11 +36,13 @@ def check_events(self, events): return True -def test_scope_blacklist(bbot_config, bbot_scanner, bbot_httpserver): +@pytest.mark.asyncio +async def test_scope_blacklist(bbot_config, bbot_scanner, bbot_httpserver): x = Scope_test_blacklist(bbot_config, bbot_scanner, bbot_httpserver, module_name="httpx") - x.run() + await x.run() -def test_scope_whitelist(bbot_config, bbot_scanner, bbot_httpserver): +@pytest.mark.asyncio +async def test_scope_whitelist(bbot_config, bbot_scanner, bbot_httpserver): x = Scope_test_whitelist(bbot_config, bbot_scanner, bbot_httpserver, module_name="httpx") - x.run() + await x.run() From 47a659aaaaedc5c6396b0e448677d4b304d042ce Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 15 May 2023 16:52:02 -0400 Subject: [PATCH 023/387] working through asyncifying modules --- bbot/core/helpers/depsinstaller/installer.py | 6 +- bbot/modules/azure_tenant.py | 10 +-- bbot/modules/base.py | 2 +- bbot/modules/bevigil.py | 18 +++--- bbot/modules/binaryedge.py | 10 +-- bbot/modules/builtwith.py | 16 ++--- bbot/modules/c99.py | 8 +-- bbot/modules/censys.py | 20 +++--- bbot/modules/crt.py | 6 +- bbot/modules/dnscommonsrv.py | 8 +-- bbot/modules/dnszonetransfer.py | 14 ++--- bbot/modules/fullhunt.py | 10 +-- bbot/modules/generic_ssrf.py | 43 ++++++------- bbot/modules/github.py | 66 +++++++++++--------- bbot/modules/host_header.py | 23 +++---- bbot/modules/httpx.py | 2 +- bbot/modules/ipstack.py | 8 +-- bbot/modules/ntlm.py | 49 +++++++-------- bbot/modules/output/asset_inventory.py | 4 +- bbot/modules/output/http.py | 56 +++++++++-------- 
bbot/modules/report/affiliates.py | 6 +- bbot/modules/shodan_dns.py | 10 +-- bbot/modules/sslcert.py | 2 +- bbot/modules/viewdns.py | 12 ++-- bbot/test/test_step_2/test_modules_basic.py | 13 +++- 25 files changed, 218 insertions(+), 204 deletions(-) diff --git a/bbot/core/helpers/depsinstaller/installer.py b/bbot/core/helpers/depsinstaller/installer.py index 2195237f38..72f6b5575c 100644 --- a/bbot/core/helpers/depsinstaller/installer.py +++ b/bbot/core/helpers/depsinstaller/installer.py @@ -165,9 +165,9 @@ async def pip_install(self, packages, constraints=None): try: process = await self.parent_helper.run(command, check=True) message = f'Successfully installed pip packages "{packages_str}"' - output = process.stdout.splitlines()[-1] - if output: - message = output + output = process.stdout + if output is not None: + message = output.splitlines()[-1] log.info(message) return True except CalledProcessError as err: diff --git a/bbot/modules/azure_tenant.py b/bbot/modules/azure_tenant.py index fafa391a76..b2626810e1 100644 --- a/bbot/modules/azure_tenant.py +++ b/bbot/modules/azure_tenant.py @@ -12,14 +12,14 @@ class azure_tenant(viewdns): base_url = "https://autodiscover-s.outlook.com" in_scope_only = True - def setup(self): + async def setup(self): self.processed = set() self.d_xml_regex = re.compile(r"([^<>/]*)", re.I) return True - def handle_event(self, event): + async def handle_event(self, event): _, query = self.helpers.split_domain(event.data) - domains, _ = self.query(query) + domains, _ = await self.query(query) if domains: self.success(f'Found {len(domains):,} domains under tenant for "{query}"') for domain in domains: @@ -27,7 +27,7 @@ def handle_event(self, event): self.emit_event(domain, "DNS_NAME", source=event, tags=["affiliate"]) # todo: tenants? 
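Aside: the conversions in this commit all follow one mechanical recipe, so it is worth sketching once. Each module entry point gains the async keyword, and every I/O helper call (helpers.request, request_with_fail_count, helpers.curl, helpers.resolve) gains an await. A schematic before/after, with a made-up module name and URL for illustration:

    class mymodule(BaseModule):
        # before: blocking call, previously executed in a worker thread
        def handle_event(self, event):
            r = self.helpers.request(f"https://api.example.com/{event.data}")

        # after: coroutine scheduled on the scan's event loop
        async def handle_event(self, event):
            r = await self.helpers.request(f"https://api.example.com/{event.data}")

The most common slip in a refactor like this is a forgotten await: the call then silently returns an un-awaited coroutine instead of a response.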
- def query(self, domain): + async def query(self, domain): url = f"{self.base_url}/autodiscover/autodiscover.svc" data = f""" @@ -56,7 +56,7 @@ def query(self, domain): self.debug(f"Retrieving tenant domains at {url}") - r = self.request_with_fail_count(url, method="POST", headers=headers, data=data) + r = await self.request_with_fail_count(url, method="POST", headers=headers, data=data) status_code = getattr(r, "status_code", 0) if status_code not in (200, 421): self.warning(f'Error retrieving azure_tenant domains for "{domain}" (status code: {status_code})') diff --git a/bbot/modules/base.py b/bbot/modules/base.py index 2e06ae3381..e359ed7816 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -173,7 +173,7 @@ def require_api_key(self): else: return None, "No API key set" - def ping(self): + async def ping(self): """ Used in conjuction with require_api_key to ensure an API is up and responding diff --git a/bbot/modules/bevigil.py b/bbot/modules/bevigil.py index d81a081a91..a24d6331c1 100644 --- a/bbot/modules/bevigil.py +++ b/bbot/modules/bevigil.py @@ -15,35 +15,35 @@ class bevigil(shodan_dns): base_url = "https://osint.bevigil.com/api" - def setup(self): + async def setup(self): self.api_key = self.config.get("api_key", "") self.headers = {"X-Access-Token": self.api_key} self.urls = self.config.get("urls", False) return super().setup() - def ping(self): + async def ping(self): pass - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - subdomains = self.query(query, request_fn=self.request_subdomains, parse_fn=self.parse_subdomains) + subdomains = await self.query(query, request_fn=self.request_subdomains, parse_fn=self.parse_subdomains) if subdomains: for subdomain in subdomains: self.emit_event(subdomain, "DNS_NAME", source=event) if self.urls: - urls = self.query(query, request_fn=self.request_urls, parse_fn=self.parse_urls) + urls = await self.query(query, request_fn=self.request_urls, parse_fn=self.parse_urls) if urls: for parsed_url in self.helpers.collapse_urls(urls): self.emit_event(parsed_url.geturl(), "URL_UNVERIFIED", source=event) - def request_subdomains(self, query): + async def request_subdomains(self, query): url = f"{self.base_url}/{self.helpers.quote(query)}/subdomains/" - return self.request_with_fail_count(url, headers=self.headers) + return await self.request_with_fail_count(url, headers=self.headers) - def request_urls(self, query): + async def request_urls(self, query): url = f"{self.base_url}/{self.helpers.quote(query)}/urls/" - return self.request_with_fail_count(url, headers=self.headers) + return await self.request_with_fail_count(url, headers=self.headers) def parse_subdomains(self, r, query=None): results = set() diff --git a/bbot/modules/binaryedge.py b/bbot/modules/binaryedge.py index 7bcb266806..497dd03069 100644 --- a/bbot/modules/binaryedge.py +++ b/bbot/modules/binaryedge.py @@ -14,20 +14,20 @@ class binaryedge(shodan_dns): base_url = "https://api.binaryedge.io/v2" - def setup(self): + async def setup(self): self.max_records = self.config.get("max_records", 1000) self.headers = {"X-Key": self.config.get("api_key", "")} return super().setup() - def ping(self): + async def ping(self): url = f"{self.base_url}/user/subscription" - j = self.request_with_fail_count(url, headers=self.headers).json() + j = (await self.request_with_fail_count(url, headers=self.headers)).json() assert j.get("requests_left", 0) > 0 - def request_url(self, query): + async def request_url(self, query): # todo: host 
query (certs + services) url = f"{self.base_url}/query/domains/subdomain/{self.helpers.quote(query)}" - return self.request_with_fail_count(url, headers=self.headers) + return await self.request_with_fail_count(url, headers=self.headers) def parse_results(self, r, query): j = r.json() diff --git a/bbot/modules/builtwith.py b/bbot/modules/builtwith.py index 8a920f6a24..e8139d5dd8 100644 --- a/bbot/modules/builtwith.py +++ b/bbot/modules/builtwith.py @@ -22,33 +22,33 @@ class builtwith(shodan_dns): options_desc = {"api_key": "Builtwith API key", "redirects": "Also look up inbound and outbound redirects"} base_url = "https://api.builtwith.com" - def ping(self): + async def ping(self): # builtwith does not have a ping feature, so we skip it to save API credits return - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) # domains - subdomains = self.query(query, parse_fn=self.parse_domains, request_fn=self.request_domains) + subdomains = await self.query(query, parse_fn=self.parse_domains, request_fn=self.request_domains) if subdomains: for s in subdomains: if s != event: self.emit_event(s, "DNS_NAME", source=event) # redirects if self.config.get("redirects", True): - redirects = self.query(query, parse_fn=self.parse_redirects, request_fn=self.request_redirects) + redirects = await self.query(query, parse_fn=self.parse_redirects, request_fn=self.request_redirects) if redirects: for r in redirects: if r != event: self.emit_event(r, "DNS_NAME", source=event, tags=["affiliate"]) - def request_domains(self, query): + async def request_domains(self, query): url = f"{self.base_url}/v20/api.json?KEY={self.api_key}&LOOKUP={query}&NOMETA=yes&NOATTR=yes&HIDETEXT=yes&HIDEDL=yes" - return self.request_with_fail_count(url) + return await self.request_with_fail_count(url) - def request_redirects(self, query): + async def request_redirects(self, query): url = f"{self.base_url}/redirect1/api.json?KEY={self.api_key}&LOOKUP={query}" - return self.request_with_fail_count(url) + return await self.request_with_fail_count(url) def parse_domains(self, r, query): """ diff --git a/bbot/modules/c99.py b/bbot/modules/c99.py index 7fde17dcd9..5b0179def4 100644 --- a/bbot/modules/c99.py +++ b/bbot/modules/c99.py @@ -11,14 +11,14 @@ class c99(shodan_dns): base_url = "https://api.c99.nl" - def ping(self): + async def ping(self): url = f"{self.base_url}/randomnumber?key={self.api_key}&between=1,100&json" - response = self.request_with_fail_count(url) + response = await self.request_with_fail_count(url) assert response.json()["success"] == True - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/subdomainfinder?key={self.api_key}&domain={self.helpers.quote(query)}&json" - return self.request_with_fail_count(url) + return await self.request_with_fail_count(url) def parse_results(self, r, query): j = r.json() diff --git a/bbot/modules/censys.py b/bbot/modules/censys.py index ab6ca65a0b..ed713472d7 100644 --- a/bbot/modules/censys.py +++ b/bbot/modules/censys.py @@ -21,7 +21,7 @@ class censys(shodan_dns): deps_pip = ["censys~=2.1.9"] - def setup(self): + async def setup(self): self.max_records = self.config.get("max_records", 1000) self.api_id = self.config.get("api_id", "") self.api_secret = self.config.get("api_secret", "") @@ -32,13 +32,13 @@ def setup(self): self.certificates = CensysCertificates(api_id=self.api_id, api_secret=self.api_secret) return super().setup() - def ping(self): + async def ping(self): quota = 
self.certificates.quota() used = int(quota["used"]) allowance = int(quota["allowance"]) assert used < allowance, "No quota remaining" - def query(self, query): + async def query(self, query): emails = set() dns_names = set() ip_addresses = dict() @@ -46,9 +46,10 @@ def query(self, query): # certificates certificate_query = f"parsed.names: {query}" certificate_fields = ["parsed.names", "parsed.issuer_dn", "parsed.subject_dn"] - for result in self.certificates.search( - certificate_query, fields=certificate_fields, max_records=self.max_records - ): + results = await self.scan.run_in_executor( + self.certificates.search, certificate_query, fields=certificate_fields, max_records=self.max_records + ) + for result in results: parsed_names = result.get("parsed.names", []) # helps filter out third-party certs with a lot of garbage names _filter = lambda x: True @@ -64,7 +65,10 @@ def query(self, query): per_page = 100 pages = max(1, int(self.max_records / per_page)) hosts_query = f"services.tls.certificates.leaf_data.names: {query} or services.tls.certificates.leaf_data.subject.email_address: {query}" - for i, page in enumerate(self.hosts.search(hosts_query, per_page=per_page, pages=pages)): + hosts_results = await self.scan.run_in_executor( + self.hosts.search, hosts_query, per_page=per_page, pages=pages + ) + for i, page in enumerate(hosts_results): for result in page: ip = result.get("ip", "") if not ip: @@ -90,7 +94,7 @@ def query(self, query): return emails, dns_names, ip_addresses - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) emails, dns_names, ip_addresses = self.query(query) for email in emails: diff --git a/bbot/modules/crt.py b/bbot/modules/crt.py index ca8aefed1f..a4410354ce 100644 --- a/bbot/modules/crt.py +++ b/bbot/modules/crt.py @@ -10,14 +10,14 @@ class crt(crobat): base_url = "https://crt.sh" reject_wildcards = False - def setup(self): + async def setup(self): self.cert_ids = set() return super().setup() - def request_url(self, query): + async def request_url(self, query): params = {"q": f"%.{query}", "output": "json"} url = self.helpers.add_get_params(self.base_url, params).geturl() - return self.request_with_fail_count(url, timeout=self.http_timeout + 10) + return await self.request_with_fail_count(url, timeout=self.http_timeout + 10) def parse_results(self, r, query): j = r.json() diff --git a/bbot/modules/dnscommonsrv.py b/bbot/modules/dnscommonsrv.py index 8333e8293b..ab8f9029e7 100644 --- a/bbot/modules/dnscommonsrv.py +++ b/bbot/modules/dnscommonsrv.py @@ -96,14 +96,14 @@ class dnscommonsrv(BaseModule): meta = {"description": "Check for common SRV records"} max_event_handlers = 10 - def filter_event(self, event): + async def filter_event(self, event): # skip SRV wildcards - if "SRV" in self.helpers.is_wildcard(event.host): + if "SRV" in await self.helpers.is_wildcard(event.host): return False return True - def handle_event(self, event): + async def handle_event(self, event): queries = [event.data] + [f"{srv}.{event.data}" for srv in common_srvs] - for query, results in self.helpers.resolve_batch(queries, type="srv"): + async for query, results in self.helpers.resolve_batch(queries, type="srv"): if results: self.emit_event(query, "DNS_NAME", tags=["srv-record"], source=event) diff --git a/bbot/modules/dnszonetransfer.py b/bbot/modules/dnszonetransfer.py index 6e56284f92..4a3fb5a58b 100644 --- a/bbot/modules/dnszonetransfer.py +++ b/bbot/modules/dnszonetransfer.py @@ -14,29 +14,29 @@ class dnszonetransfer(BaseModule): 
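Aside: the DNS helpers now come in two async shapes, both visible in dnscommonsrv above and dnszonetransfer below: one-shot lookups are awaited directly, while batch lookups become an async generator. A minimal sketch (the queries list is a placeholder):

    async def handle_event(self, event):
        # single lookup: returns the set of answers
        ips = await self.helpers.resolve(event.data)
        # batch lookup: yields (query, results) pairs as they resolve
        async for query, results in self.helpers.resolve_batch(queries, type="srv"):
            if results:
                self.emit_event(query, "DNS_NAME", source=event)

Note that dnszonetransfer's tag names are also corrected from ns_record/soa_record to the hyphenated ns-record/soa-record, matching the srv-record tag emitted by dnscommonsrv.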
max_event_handlers = 5 suppress_dupes = False - def setup(self): + async def setup(self): self.timeout = self.config.get("timeout", 10) return True - def filter_event(self, event): - if any([x in event.tags for x in ("ns_record", "soa_record")]): + async def filter_event(self, event): + if any([x in event.tags for x in ("ns-record", "soa-record")]): return True return False - def handle_event(self, event): + async def handle_event(self, event): domain = event.data self.debug("Finding nameservers with NS/SOA query") - nameservers = list(self.helpers.resolve(event.data, type=("NS", "SOA"))) + nameservers = list(await self.helpers.resolve(event.data, type=("NS", "SOA"))) nameserver_ips = set() for n in nameservers: - nameserver_ips.update(self.helpers.resolve(n)) + nameserver_ips.update(await self.helpers.resolve(n)) self.debug(f"Found {len(nameservers):} nameservers for domain {domain}") for nameserver in nameserver_ips: if self.scan.stopping: break try: self.debug(f"Attempting zone transfer against {nameserver} for domain {domain}") - xfr_answer = dns.query.xfr(nameserver, domain, timeout=self.timeout, lifetime=self.timeout) + xfr_answer = await dns.asyncquery.xfr(nameserver, domain, timeout=self.timeout, lifetime=self.timeout) zone = dns.zone.from_xfr(xfr_answer) except Exception as e: self.debug(f"Error retrieving zone: {e}") diff --git a/bbot/modules/fullhunt.py b/bbot/modules/fullhunt.py index e0c051c561..4d6e740b09 100644 --- a/bbot/modules/fullhunt.py +++ b/bbot/modules/fullhunt.py @@ -11,20 +11,20 @@ class fullhunt(shodan_dns): base_url = "https://fullhunt.io/api/v1" - def setup(self): + async def setup(self): self.api_key = self.config.get("api_key", "") self.headers = {"x-api-key": self.api_key} return super().setup() - def ping(self): + async def ping(self): url = f"{self.base_url}/auth/status" - j = self.request_with_fail_count(url, headers=self.headers).json() + j = (await self.request_with_fail_count(url, headers=self.headers)).json() remaining = j["user_credits"]["remaining_credits"] assert remaining > 0, "No credits remaining" - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/domain/{self.helpers.quote(query)}/subdomains" - return self.request_with_fail_count(url, headers=self.headers) + return await self.request_with_fail_count(url, headers=self.headers) def parse_results(self, r, query): return r.json().get("hosts", []) diff --git a/bbot/modules/generic_ssrf.py b/bbot/modules/generic_ssrf.py index db0aa2a3c6..91e1721ab1 100644 --- a/bbot/modules/generic_ssrf.py +++ b/bbot/modules/generic_ssrf.py @@ -49,7 +49,7 @@ def set_base_url(self, event): def create_paths(self): return self.paths - def test(self, event): + async def test(self, event): base_url = self.set_base_url(event) for test_path in self.test_paths: @@ -59,7 +59,7 @@ def test(self, event): ) test_url = f"{base_url}{test_path_prepared}" self.parent_module.debug(f"Sending request to URL: {test_url}") - r = self.parent_module.helpers.curl(url=test_url) + r = await self.parent_module.helpers.curl(url=test_url) if r: self.process(event, r, subdomain_tag) @@ -104,7 +104,7 @@ class Generic_SSRF_POST(BaseSubmodule): def set_base_url(self, event): return event.data - def test(self, event): + async def test(self, event): test_url = f"{event.data}" subdomain_tag = self.parent_module.helpers.rand_string(4, digits=False) @@ -121,7 +121,7 @@ def test(self, event): post_data_list = [(subdomain_tag, post_data), (subdomain_tag_lower, post_data_lower)] for tag, pd in post_data_list: - r = 
self.parent_module.helpers.curl(url=test_url, method="POST", post_data=pd) + r = await self.parent_module.helpers.curl(url=test_url, method="POST", post_data=pd) self.process(event, r, tag) @@ -130,7 +130,7 @@ class Generic_XXE(BaseSubmodule): severity = "HIGH" paths = None - def test(self, event): + async def test(self, event): rand_entity = self.parent_module.helpers.rand_string(4, digits=False) subdomain_tag = self.parent_module.helpers.rand_string(4, digits=False) @@ -141,7 +141,7 @@ def test(self, event): ]> &{rand_entity};""" test_url = f"{event.parsed.scheme}://{event.parsed.netloc}/" - r = self.parent_module.helpers.curl( + r = await self.parent_module.helpers.curl( url=test_url, method="POST", raw_body=post_body, headers={"Content-type": "application/xml"} ) if r: @@ -157,7 +157,7 @@ class generic_ssrf(BaseModule): deps_apt = ["curl"] - def setup(self): + async def setup(self): self.submodules = {} self.interactsh_subdomain_tags = {} self.severity = None @@ -166,7 +166,7 @@ def setup(self): if self.scan.config.get("interactsh_disable", False) == False: try: self.interactsh_instance = self.helpers.interactsh() - self.interactsh_domain = self.interactsh_instance.register(callback=self.interactsh_callback) + self.interactsh_domain = await self.interactsh_instance.register(callback=self.interactsh_callback) except InteractshError as e: self.warning(f"Interactsh failure: {e}") return False @@ -184,12 +184,9 @@ def setup(self): return True - def handle_event(self, event): - self.test_submodules(self.submodules, event) - - def test_submodules(self, submodules, event, **kwargs): - for s in submodules.values(): - s.test(event, **kwargs) + async def handle_event(self, event): + for s in self.submodules.values(): + await s.test(event) def interactsh_callback(self, r): full_id = r.get("full-id", None) @@ -217,13 +214,11 @@ def interactsh_callback(self, r): # this is likely caused by something trying to resolve the base domain first and can be ignored self.debug("skipping result because subdomain tag was missing") - def finish(self): - from time import sleep - - sleep(5) - - try: - for r in self.interactsh_instance.poll(): - self.interactsh_callback(r) - except InteractshError as e: - self.debug(f"Error in interact.sh: {e}") + async def finish(self): + if self.scan.config.get("interactsh_disable", False) == False: + await self.helpers.sleep(5) + try: + for r in await self.interactsh_instance.poll(): + self.interactsh_callback(r) + except InteractshError as e: + self.debug(f"Error in interact.sh: {e}") diff --git a/bbot/modules/github.py b/bbot/modules/github.py index c94bcfcdb4..9fddf0393e 100644 --- a/bbot/modules/github.py +++ b/bbot/modules/github.py @@ -11,19 +11,19 @@ class github(shodan_dns): base_url = "https://api.github.com" - def setup(self): - ret = super().setup() + async def setup(self): + ret = await super().setup() self.headers = {"Authorization": f"token {self.api_key}"} return ret - def ping(self): + async def ping(self): url = f"{self.base_url}/zen" - response = self.helpers.request(url) + response = await self.helpers.request(url) assert getattr(response, "status_code", 0) == 200 - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - for repo_url, raw_urls in self.query(query).items(): + for repo_url, raw_urls in (await self.query(query)).items(): repo_event = self.make_event({"url": repo_url}, "CODE_REPOSITORY", source=event) if repo_event is None: continue @@ -35,33 +35,37 @@ def handle_event(self, event): 
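Aside: query() below now drives helpers.api_page_iter() as an async generator, and because iteration can break out early (rate limiting, an empty results page), the generator is closed explicitly. The general pattern in isolation, with paged_results as a stand-in name:

    agen = paged_results()  # any async generator
    try:
        async for page in agen:
            ...  # may break out early
    finally:
        # aclose() is itself a coroutine, so it must be awaited
        await agen.aclose()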
url_event.scope_distance = repo_event.scope_distance self.emit_event(url_event) - def query(self, query): + async def query(self, query): repos = {} url = f"{self.base_url}/search/code?per_page=100&type=Code&q={self.helpers.quote(query)}&page=" + "{page}" - for r in self.helpers.api_page_iter(url, headers=self.headers, json=False): - if r is None: - continue - status_code = getattr(r, "status_code", 0) - if status_code == 429: - "Github is rate-limiting us (HTTP status: 429)" - break - try: - j = r.json() - except Exception as e: - self.warning(f"Failed to decode JSON for {r.url} (HTTP status: {status_code}): {e}") - continue - items = j.get("items", []) - if not items: - break - for item in items: - htlm_url = item.get("html_url", "") - raw_url = self.raw_url(htlm_url) - repo_url = item.get("repository", {}).get("html_url", "") - if raw_url and repo_url: - try: - repos[repo_url].append(raw_url) - except KeyError: - repos[repo_url] = [raw_url] + agen = self.helpers.api_page_iter(url, headers=self.headers, json=False) + try: + async for r in agen: + if r is None: + continue + status_code = getattr(r, "status_code", 0) + if status_code == 429: + # Github is rate-limiting us (HTTP status: 429) + break + try: + j = r.json() + except Exception as e: + self.warning(f"Failed to decode JSON for {r.url} (HTTP status: {status_code}): {e}") + continue + items = j.get("items", []) + if not items: + break + for item in items: + html_url = item.get("html_url", "") + raw_url = self.raw_url(html_url) + repo_url = item.get("repository", {}).get("html_url", "") + if raw_url and repo_url: + try: + repos[repo_url].append(raw_url) + except KeyError: + repos[repo_url] = [raw_url] + finally: + await agen.aclose() return repos @staticmethod diff --git a/bbot/modules/host_header.py b/bbot/modules/host_header.py index d469488dbb..0bb0f88e94 100644 --- a/bbot/modules/host_header.py +++ b/bbot/modules/host_header.py @@ -12,14 +12,14 @@ class host_header(BaseModule): deps_apt = ["curl"] - def setup(self): + async def setup(self): self.scanned_hosts = set() self.subdomain_tags = {} if self.scan.config.get("interactsh_disable", False) == False: try: self.interactsh_instance = self.helpers.interactsh() - self.domain = self.interactsh_instance.register(callback=self.interactsh_callback) + self.domain = await self.interactsh_instance.register(callback=self.interactsh_callback) except InteractshError as e: self.warning(f"Interactsh failure: {e}") return False @@ -54,25 +54,26 @@ def interactsh_callback(self, r): # this is likely caused by something trying to resolve the base domain first and can be ignored self.debug("skipping results because subdomain tag was missing") - def finish(self): + async def finish(self): if self.scan.config.get("interactsh_disable", False) == False: + await self.helpers.sleep(5) try: - for r in self.interactsh_instance.poll(): + for r in await self.interactsh_instance.poll(): self.interactsh_callback(r) except InteractshError as e: self.debug(f"Error in interact.sh: {e}") - def cleanup(self): + async def cleanup(self): if self.scan.config.get("interactsh_disable", False) == False: try: - self.interactsh_instance.deregister() + await self.interactsh_instance.deregister() self.debug( f"successfully deregistered interactsh session with correlation_id {self.interactsh_instance.correlation_id}" ) except InteractshError as e: self.warning(f"Interactsh failure: {e}") - def handle_event(self, event): + async def handle_event(self, event): host = f"{event.parsed.scheme}://{event.parsed.netloc}/" host_hash = 
hash(host) if host_hash in self.scanned_hosts: @@ -100,7 +101,7 @@ def handle_event(self, event): self.debug(f"Performing {technique_description} case") subdomain_tag = self.rand_string(4, digits=False) self.subdomain_tags[subdomain_tag] = (event, technique_description) - output = self.helpers.curl( + output = await self.helpers.curl( url=event.data["url"], headers={"Host": f"{subdomain_tag}.{self.domain}"}, ignore_bbot_global_settings=True, @@ -114,7 +115,7 @@ def handle_event(self, event): self.debug(f"Performing {technique_description} case") subdomain_tag = self.rand_string(4, digits=False) self.subdomain_tags[subdomain_tag] = (event, technique_description) - output = self.helpers.curl( + output = await self.helpers.curl( url=event.data["url"], headers={"Host": f"{subdomain_tag}.{self.domain}"}, path_override=event.data["url"], @@ -126,7 +127,7 @@ def handle_event(self, event): # duplicate host header tolerance technique_description = "duplicate host header tolerance" - output = self.helpers.curl( + output = await self.helpers.curl( url=event.data["url"], # Sending a blank HOST first as a hack to trick curl. This makes it no longer an "internal header", thereby allowing for duplicates # The fact that it's accepting two host headers is rare enough to note on its own, and not too noisy. Having the 3rd header be an interactsh would result in false negatives for the slightly less interesting cases. @@ -167,7 +168,7 @@ def handle_event(self, event): for oh in override_headers_list: override_headers[oh] = f"{subdomain_tag}.{self.domain}" - output = self.helpers.curl( + output = await self.helpers.curl( url=event.data["url"], headers=override_headers, cookies=added_cookies, diff --git a/bbot/modules/httpx.py b/bbot/modules/httpx.py index 16ca7294c2..4b110bea5d 100644 --- a/bbot/modules/httpx.py +++ b/bbot/modules/httpx.py @@ -145,6 +145,6 @@ async def handle_batch(self, *events): # HTTP response self.emit_event(j, "HTTP_RESPONSE", url_event, internal=True) - def cleanup(self): + async def cleanup(self): resume_file = self.helpers.current_dir / "resume.cfg" resume_file.unlink(missing_ok=True) diff --git a/bbot/modules/ipstack.py b/bbot/modules/ipstack.py index 8aef3d1dde..a5636ed62f 100644 --- a/bbot/modules/ipstack.py +++ b/bbot/modules/ipstack.py @@ -19,15 +19,15 @@ class Ipstack(shodan_dns): base_url = "http://api.ipstack.com/" - def ping(self): - r = self.request_with_fail_count(f"{self.base_url}/check?access_key={self.api_key}") + async def ping(self): + r = await self.request_with_fail_count(f"{self.base_url}/check?access_key={self.api_key}") resp_content = getattr(r, "text", "") assert getattr(r, "status_code", 0) == 200, resp_content - def handle_event(self, event): + async def handle_event(self, event): try: url = f"{self.base_url}/{event.data}?access_key={self.api_key}" - result = self.request_with_fail_count(url) + result = await self.request_with_fail_count(url) if result: j = result.json() if not j: diff --git a/bbot/modules/ntlm.py b/bbot/modules/ntlm.py index 684267806c..6ef511560c 100644 --- a/bbot/modules/ntlm.py +++ b/bbot/modules/ntlm.py @@ -1,7 +1,5 @@ -from threading import Lock - from bbot.modules.base import BaseModule -from bbot.core.errors import NTLMError, RequestException +from bbot.core.errors import NTLMError, RequestError ntlm_discovery_endpoints = [ "", @@ -70,14 +68,13 @@ class ntlm(BaseModule): in_scope_only = True - def setup(self): + async def setup(self): self.processed = set() - self.processed_lock = Lock() self.found = set() self.try_all = 
self.config.get("try_all", False) return True - def handle_event(self, event): + async def handle_event(self, event): found_hash = hash(f"{event.host}:{event.port}") if found_hash not in self.found: result_FQDN, request_url = self.handle_url(event) @@ -94,7 +91,7 @@ def handle_event(self, event): ) self.emit_event(result_FQDN, "DNS_NAME", source=event) - def filter_event(self, event): + async def filter_event(self, event): if self.try_all: return True if event.type == "HTTP_RESPONSE": @@ -104,7 +101,7 @@ def filter_event(self, event): return True return False - def handle_url(self, event): + async def handle_url(self, event): if event.type == "URL": urls = { event.data, @@ -117,35 +114,33 @@ def handle_url(self, event): for endpoint in ntlm_discovery_endpoints: urls.add(f"{event.parsed.scheme}://{event.parsed.netloc}/{endpoint}") - futures = {} + tasks = [] for url in urls: - future = self.submit_task(self.check_ntlm, url) - futures[future] = url + url_hash = hash(url) + if url_hash in self.processed: + continue + self.processed.add(url_hash) + task = self.helpers.create_task(self.check_ntlm(url)) + tasks.append(task) - for future in self.helpers.as_completed(futures): - url = futures[future] + for task in self.helpers.as_completed(tasks): try: - result = future.result() + result, url = await task if result: - for future in futures: - future.cancel() + self.helpers.cancel_tasks(tasks) return str(result["FQDN"]), url - except RequestException as e: + except RequestError as e: self.warning(str(e)) + # cancel all the tasks if there's an error + self.helpers.cancel_tasks(tasks) + break return None, None - def check_ntlm(self, test_url): - url_hash = hash(test_url) - - with self.processed_lock: - if url_hash in self.processed: - return - self.processed.add(url_hash) - + async def check_ntlm(self, test_url): # use lower timeout value http_timeout = self.config.get("httpx_timeout", 5) - r = self.helpers.request( + r = await self.helpers.request( test_url, headers=NTLM_test_header, raise_error=True, allow_redirects=False, timeout=http_timeout ) ntlm_resp = r.headers.get("WWW-Authenticate", "") @@ -154,6 +149,6 @@ def check_ntlm(self, test_url): try: ntlm_resp_decoded = self.helpers.ntlm.ntlmdecode(ntlm_resp_b64) if ntlm_resp_decoded: - return ntlm_resp_decoded + return ntlm_resp_decoded, test_url except NTLMError as e: self.verbose(str(e)) diff --git a/bbot/modules/output/asset_inventory.py b/bbot/modules/output/asset_inventory.py index 5ffb3d86ae..d55794b74a 100644 --- a/bbot/modules/output/asset_inventory.py +++ b/bbot/modules/output/asset_inventory.py @@ -44,7 +44,7 @@ async def setup(self): ret = await super().setup() return ret - def filter_event(self, event): + async def filter_event(self, event): if event._internal: return False, "event is internal" if event.type not in self.watched_events: @@ -159,7 +159,7 @@ def emit_contents(self): f"use_previous=True was set but no previous asset inventory was found at {self.output_file}" ) - def finish(self): + async def finish(self): self.emit_contents() def _run_hooks(self): diff --git a/bbot/modules/output/http.py b/bbot/modules/output/http.py index 1e3449df3b..93fa92f3ed 100644 --- a/bbot/modules/output/http.py +++ b/bbot/modules/output/http.py @@ -1,6 +1,4 @@ -import requests -from requests.auth import HTTPBasicAuth -from requests.exceptions import RequestException +from bbot.core.errors import RequestError from bbot.modules.output.base import BaseOutputModule @@ -26,31 +24,39 @@ class HTTP(BaseOutputModule): } async def setup(self): - 
self.session = requests.Session() - if not self.config.get("url", ""): + self.url = self.config.get("url", "") + self.method = self.config.get("method", "POST") + self.timeout = self.config.get("timeout", 10) + self.headers = {} + bearer = self.config.get("bearer", "") + if bearer: + self.headers["Authorization"] = f"Bearer {bearer}" + username = self.config.get("username", "") + password = self.config.get("password", "") + self.auth = None + if username: + self.auth = (username, password) + if not self.url: self.warning("Must set URL") return False - if not self.config.get("method", ""): + if not self.method: self.warning("Must set HTTP method") return False return True - def handle_event(self, event): - r = requests.Request( - url=self.config.get("url"), - method=self.config.get("method", "POST"), - ) - r.headers["User-Agent"] = self.scan.useragent - r.json = dict(event) - username = self.config.get("username", "") - password = self.config.get("password", "") - if username: - r.auth = HTTPBasicAuth(username, password) - bearer = self.config.get("bearer", "") - if bearer: - r.headers["Authorization"] = f"Bearer {bearer}" - try: - timeout = self.config.get("timeout", 10) - self.session.send(r.prepare(), timeout=timeout) - except RequestException as e: - self.warning(f"Error sending {event}: {e}") + async def handle_event(self, event): + while 1: + try: + await self.helpers.request( + url=self.url, + method=self.method, + auth=self.auth, + headers=self.headers, + json=dict(event), + raise_error=True, + ) + break + except RequestError as e: + self.warning(f"Error sending {event}: {e}, retrying...") + self.trace() + await self.helpers.sleep(1) diff --git a/bbot/modules/report/affiliates.py b/bbot/modules/report/affiliates.py index 34a34abb8f..bb6323664d 100644 --- a/bbot/modules/report/affiliates.py +++ b/bbot/modules/report/affiliates.py @@ -9,14 +9,14 @@ class affiliates(BaseReportModule): scope_distance_modifier = None accept_dupes = True - def setup(self): + async def setup(self): self.affiliates = {} return True - def handle_event(self, event): + async def handle_event(self, event): self.add_affiliate(event) - def report(self): + async def report(self): affiliates = sorted(self.affiliates.items(), key=lambda x: x[-1]["weight"], reverse=True) header = ["Affiliate", "Score", "Count"] table = [] diff --git a/bbot/modules/shodan_dns.py b/bbot/modules/shodan_dns.py index ded5e4ee94..9cefdae204 100644 --- a/bbot/modules/shodan_dns.py +++ b/bbot/modules/shodan_dns.py @@ -16,18 +16,18 @@ class shodan_dns(crobat): base_url = "https://api.shodan.io" - def setup(self): + async def setup(self): super().setup() return self.require_api_key() - def ping(self): - r = self.request_with_fail_count(f"{self.base_url}/api-info?key={self.api_key}") + async def ping(self): + r = await self.request_with_fail_count(f"{self.base_url}/api-info?key={self.api_key}") resp_content = getattr(r, "text", "") assert getattr(r, "status_code", 0) == 200, resp_content - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/dns/domain/{self.helpers.quote(query)}?key={self.api_key}" - return self.request_with_fail_count(url) + return await self.request_with_fail_count(url) def parse_results(self, r, query): json = r.json() diff --git a/bbot/modules/sslcert.py b/bbot/modules/sslcert.py index 30d1281450..b49e88a09b 100644 --- a/bbot/modules/sslcert.py +++ b/bbot/modules/sslcert.py @@ -7,7 +7,7 @@ from bbot.modules.base import BaseModule from bbot.core.errors import ValidationError -from 
bbot.core.helpers.threadpool import NamedLock +from bbot.core.helpers.async_helpers import NamedLock class sslcert(BaseModule): diff --git a/bbot/modules/viewdns.py b/bbot/modules/viewdns.py index 19386eb6b2..0714bdc8e5 100644 --- a/bbot/modules/viewdns.py +++ b/bbot/modules/viewdns.py @@ -20,27 +20,27 @@ class viewdns(BaseModule): in_scope_only = True _qsize = 1 - def setup(self): + async def setup(self): self.processed = set() self.date_regex = re.compile(r"\d{4}-\d{2}-\d{2}") return True - def filter_event(self, event): + async def filter_event(self, event): _, domain = self.helpers.split_domain(event.data) if hash(domain) in self.processed: return False self.processed.add(hash(domain)) return True - def handle_event(self, event): + async def handle_event(self, event): _, query = self.helpers.split_domain(event.data) - for domain, _ in self.query(query): + for domain, _ in await self.query(query): self.emit_event(domain, "DNS_NAME", source=event, tags=["affiliate"]) # todo: registrar? - def query(self, query): + async def query(self, query): url = f"{self.base_url}/reversewhois/?q={query}" - r = self.helpers.request(url) + r = await self.helpers.request(url) status_code = getattr(r, "status_code", 0) if status_code not in (200,): self.verbose(f"Error retrieving reverse whois results (status code: {status_code})") diff --git a/bbot/test/test_step_2/test_modules_basic.py b/bbot/test/test_step_2/test_modules_basic.py index 5c5285ad2c..9925eb1c8b 100644 --- a/bbot/test/test_step_2/test_modules_basic.py +++ b/bbot/test/test_step_2/test_modules_basic.py @@ -12,6 +12,7 @@ async def test_modules_basic( with open(fallback_nameservers, "w") as f: f.write("8.8.8.8\n") + httpx_mock.assert_all_responses_were_requested = False for http_method in ("GET", "CONNECT", "HEAD", "POST", "PUT", "TRACE", "DEBUG", "PATCH", "DELETE", "OPTIONS"): httpx_mock.add_response(method=http_method, url=re.compile(r".*"), json={"test": "test"}) @@ -90,13 +91,21 @@ async def test_modules_basic( scan2.helpers.dns.fallback_nameservers_file = fallback_nameservers patch_commands(scan2) patch_ansible(scan2) - scan2.load_modules() + await scan2.load_modules() scan2.status = "RUNNING" # attributes, descriptions, etc. 
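# An aside on the async check added in this hunk: BBOT's is_async_function
# helper presumably boils down to inspect.iscoroutinefunction. A minimal
# standalone sketch of the same idea (stdlib only; the function names here
# are illustrative, not from the codebase):
#
#     import inspect
#
#     async def handle_event(event): ...
#     def setup(): ...
#
#     assert inspect.iscoroutinefunction(handle_event)   # async defs pass
#     assert not inspect.iscoroutinefunction(setup)      # plain defs are flagged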
- for module_name, module in scan2.modules.items(): + for module_name, module in sorted(scan2.modules.items()): # flags assert module._type in ("internal", "output", "scan") + # async stuff + not_async = [] + for func_name in ("setup", "ping", "filter_event", "handle_event", "finish", "report", "cleanup"): + f = getattr(module, func_name) + if not scan2.helpers.is_async_function(f): + log.error(f"{f.__qualname__}() is not async") + not_async.append(f) + assert not any(not_async) # module preloading all_preloaded = module_loader.preloaded() From 8c6e413d95f014e27c8da426929139b39417b8d8 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Wed, 17 May 2023 18:07:47 -0400 Subject: [PATCH 024/387] more module tests, sslcert suffering --- bbot/core/helpers/misc.py | 2 +- bbot/core/helpers/modules.py | 3 +- bbot/modules/base.py | 4 +- bbot/modules/bevigil.py | 2 +- bbot/modules/binaryedge.py | 2 +- bbot/modules/bucket_gcp.py | 1 + bbot/modules/output/asset_inventory.py | 5 +- bbot/modules/output/base.py | 4 + bbot/modules/shodan_dns.py | 4 +- bbot/modules/sslcert.py | 117 +++++++++++-------------- bbot/test/bbot_fixtures.py | 19 ---- bbot/test/conftest.py | 19 ++++ bbot/test/pytest.ini | 1 - bbot/test/test.conf | 5 ++ poetry.lock | 9 +- 15 files changed, 95 insertions(+), 102 deletions(-) delete mode 100644 bbot/test/pytest.ini diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index 4f5bc3d615..ed8c414e37 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -27,8 +27,8 @@ import cloudcheck as _cloudcheck import tldextract as _tldextract from hashlib import sha1 as hashlib_sha1 -from asyncio import as_completed, create_task, sleep # noqa from urllib.parse import urlparse, quote, unquote, urlunparse # noqa F401 +from asyncio import as_completed, create_task, sleep, wait_for # noqa from .url import * # noqa F401 from . 
import regexes diff --git a/bbot/core/helpers/modules.py b/bbot/core/helpers/modules.py index b121aca74f..16b2755e2f 100644 --- a/bbot/core/helpers/modules.py +++ b/bbot/core/helpers/modules.py @@ -1,6 +1,7 @@ import ast import sys import importlib +import traceback from pathlib import Path from omegaconf import OmegaConf from contextlib import suppress @@ -41,8 +42,6 @@ def preload(self, module_dir): self._configs[module_file.stem] = config self._preloaded[module_file.stem] = preloaded except Exception: - import traceback - print(f"[CRIT] Error preloading {module_file}\n\n{traceback.format_exc()}") print(f"[CRIT] Error in {module_file.name}") sys.exit(1) diff --git a/bbot/modules/base.py b/bbot/modules/base.py index e359ed7816..49cad93f91 100644 --- a/bbot/modules/base.py +++ b/bbot/modules/base.py @@ -158,14 +158,14 @@ async def cleanup(self): """ return - def require_api_key(self): + async def require_api_key(self): """ Use in setup() to ensure the module is configured with an API key """ self.api_key = self.config.get("api_key", "") if self.auth_secret: try: - self.ping() + await self.ping() self.hugesuccess(f"API is ready") return True except Exception as e: diff --git a/bbot/modules/bevigil.py b/bbot/modules/bevigil.py index a24d6331c1..3bf821e759 100644 --- a/bbot/modules/bevigil.py +++ b/bbot/modules/bevigil.py @@ -19,7 +19,7 @@ async def setup(self): self.api_key = self.config.get("api_key", "") self.headers = {"X-Access-Token": self.api_key} self.urls = self.config.get("urls", False) - return super().setup() + return await super().setup() async def ping(self): pass diff --git a/bbot/modules/binaryedge.py b/bbot/modules/binaryedge.py index 497dd03069..637585f9fc 100644 --- a/bbot/modules/binaryedge.py +++ b/bbot/modules/binaryedge.py @@ -17,7 +17,7 @@ class binaryedge(shodan_dns): async def setup(self): self.max_records = self.config.get("max_records", 1000) self.headers = {"X-Key": self.config.get("api_key", "")} - return super().setup() + return await super().setup() async def ping(self): url = f"{self.base_url}/user/subscription" diff --git a/bbot/modules/bucket_gcp.py b/bbot/modules/bucket_gcp.py index b7e96d5b1d..d4ac880a9c 100644 --- a/bbot/modules/bucket_gcp.py +++ b/bbot/modules/bucket_gcp.py @@ -50,4 +50,5 @@ async def check_bucket_exists(self, bucket_name, url): response = await self.helpers.request(url) status_code = getattr(response, "status_code", 0) existent_bucket = status_code not in (0, 400, 404) + self.critical(f"{bucket_name}: {url}: {existent_bucket}") return existent_bucket, set(), bucket_name, url diff --git a/bbot/modules/output/asset_inventory.py b/bbot/modules/output/asset_inventory.py index d55794b74a..ce1f44e98b 100644 --- a/bbot/modules/output/asset_inventory.py +++ b/bbot/modules/output/asset_inventory.py @@ -56,7 +56,7 @@ async def filter_event(self, event): return True, "" async def handle_event(self, event): - if self.filter_event(event)[0]: + if (await self.filter_event(event))[0]: hostkey = _make_hostkey(event.host, event.resolved_hosts) if hostkey not in self.assets: self.assets[hostkey] = Asset(event.host) @@ -117,8 +117,7 @@ def increment_stat(stat, value): self.log_table(table, table_header, table_name=f"asset-inventory-{header}") if self._file is not None: - with self._report_lock: - self.info(f"Saved asset-inventory output to {self.output_file}") + self.info(f"Saved asset-inventory output to {self.output_file}") def emit_contents(self): if self.use_previous and not self.emitted_contents: diff --git a/bbot/modules/output/base.py 
b/bbot/modules/output/base.py index 5a01b0307f..67880009f5 100644 --- a/bbot/modules/output/base.py +++ b/bbot/modules/output/base.py @@ -10,10 +10,14 @@ class BaseOutputModule(BaseModule): _stats_exclude = True def _event_precheck(self, event): + # omitted events such as HTTP_RESPONSE etc. if event._omit: return False, "_omit is True" + # forced events like intermediary links in a DNS resolution chain if event._force_output: return True, "_force_output is True" + # internal events like those from speculate, ipneighbor + # or events that are over our report distance if event._internal: return False, "_internal is True" return super()._event_precheck(event) diff --git a/bbot/modules/shodan_dns.py b/bbot/modules/shodan_dns.py index 9cefdae204..5323e74a40 100644 --- a/bbot/modules/shodan_dns.py +++ b/bbot/modules/shodan_dns.py @@ -17,8 +17,8 @@ class shodan_dns(crobat): base_url = "https://api.shodan.io" async def setup(self): - super().setup() - return self.require_api_key() + await super().setup() + return await self.require_api_key() async def ping(self): r = await self.request_with_fail_count(f"{self.base_url}/api-info?key={self.api_key}") diff --git a/bbot/modules/sslcert.py b/bbot/modules/sslcert.py index b49e88a09b..cc437cc0d0 100644 --- a/bbot/modules/sslcert.py +++ b/bbot/modules/sslcert.py @@ -1,8 +1,6 @@ -import select -import socket -import threading -from OpenSSL import SSL -from ssl import PROTOCOL_TLSv1 +import ssl +import asyncio +from OpenSSL import crypto from contextlib import suppress from bbot.modules.base import BaseModule @@ -26,7 +24,7 @@ class sslcert(BaseModule): scope_distance_modifier = 1 _priority = 2 - def setup(self): + async def setup(self): self.timeout = self.config.get("timeout", 5.0) self.skip_non_ssl = self.config.get("skip_non_ssl", True) self.non_ssl_ports = (22, 53, 80) @@ -38,16 +36,15 @@ def setup(self): self.out_of_scope_abort_threshold = 10 self.hosts_visited = set() - self.hosts_visited_lock = threading.Lock() self.ip_lock = NamedLock() return True - def filter_event(self, event): + async def filter_event(self, event): if self.skip_non_ssl and event.port in self.non_ssl_ports: return False, f"Port {event.port} doesn't typically use SSL" return True - def handle_event(self, event): + async def handle_event(self, event): _host = event.host if event.port: port = event.port @@ -58,12 +55,7 @@ def handle_event(self, event): if self.helpers.is_ip(_host): hosts = [_host] else: - hosts = list(self.helpers.resolve(_host)) - - futures = {} - for host in hosts: - future = self.submit_task(self.visit_host, host, port) - futures[future] = host + hosts = list(await self.helpers.resolve(_host)) if event.scope_distance == 0: abort_threshold = self.in_scope_abort_threshold @@ -71,12 +63,17 @@ def handle_event(self, event): else: abort_threshold = self.out_of_scope_abort_threshold log_fn = self.verbose - for future in self.helpers.as_completed(futures): - host = futures[future] - result = future.result() - if not isinstance(result, tuple) or not len(result) == 2: + + tasks = [] + for host in hosts: + task = self.helpers.create_task(self.visit_host(host, port)) + tasks.append(task) + + for task in self.helpers.as_completed(tasks): + result = await task + if not isinstance(result, tuple) or not len(result) == 3: continue - dns_names, emails = result + dns_names, emails, (host, port) = result if len(dns_names) > abort_threshold: netloc = self.helpers.make_netloc(host, port) log_fn( @@ -100,61 +97,51 @@ def on_success_callback(self, event): if source_scope_distance == 0 
and event.scope_distance > 0: event.add_tag("affiliate") - def visit_host(self, host, port): + async def visit_host(self, host, port): host = self.helpers.make_ip_type(host) netloc = self.helpers.make_netloc(host, port) host_hash = hash((host, port)) dns_names = [] emails = set() - with self.ip_lock.get_lock(host_hash): - with self.hosts_visited_lock: - if host_hash in self.hosts_visited: - self.debug(f"Already processed {host} on port {port}, skipping") - return [], [] - else: - self.hosts_visited.add(host_hash) - - socket_type = socket.AF_INET - if self.helpers.is_ip(host): - if host.version == 6: - socket_type = socket.AF_INET6 + async with self.ip_lock.lock(host_hash): + if host_hash in self.hosts_visited: + self.debug(f"Already processed {host} on port {port}, skipping") + return [], [], (host, port) + else: + self.hosts_visited.add(host_hash) + host = str(host) + + # Create an SSL context try: - sock = socket.socket(socket_type, socket.SOCK_STREAM) + ssl_context = ssl.create_default_context() + ssl_context.check_hostname = False + ssl_context.verify_mode = ssl.CERT_NONE except Exception as e: - self.warning(f"Error creating socket for {netloc}: {e}. Do you have IPv6 disabled?") - return [], [] - sock.settimeout(self.timeout) - try: - context = SSL.Context(PROTOCOL_TLSv1) - except AttributeError as e: - # AttributeError: module 'lib' has no attribute 'SSL_CTX_set_ecdh_auto' self.warning(f"Error creating SSL context: {e}") - return [], [] - self.debug(f"Connecting to {host} on port {port}") - try: - sock.connect((host, port)) - except Exception as e: - self.debug(f"Error connecting to {host} on port {port}: {e}") - return [], [] - connection = SSL.Connection(context, sock) - connection.set_tlsext_host_name(self.helpers.smart_encode(host)) - connection.set_connect_state() + return [], [], (host, port) + + # Connect to the host try: - while 1: - try: - connection.do_handshake() - except SSL.WantReadError: - rd, _, _ = select.select([sock], [], [], sock.gettimeout()) - if not rd: - raise SSL.Error("select timed out") - continue - break + transport, _ = await self.scan._loop.create_connection( + lambda: asyncio.Protocol(), host, port, ssl=ssl_context + ) except Exception as e: - self.debug(f"Error with SSL handshake on {host} port {port}: {e}") - return [], [] - cert = connection.get_peer_certificate() - sock.close() + log_fn = self.warning + if isinstance(e, OSError): + log_fn = self.debug + log_fn(f"Error connecting to {netloc}: {e}") + return [], [], (host, port) + finally: + with suppress(Exception): + transport.close() + + # Get the SSL object + ssl_object = transport.get_extra_info("ssl_object") + + # Get the certificate + der = ssl_object.getpeercert(binary_form=True) + cert = crypto.load_certificate(crypto.FILETYPE_ASN1, der) issuer = cert.get_issuer() if issuer.emailAddress and self.helpers.regexes.email_regex.match(issuer.emailAddress): emails.add(issuer.emailAddress) @@ -166,7 +153,7 @@ def visit_host(self, host, port): with suppress(KeyError): dns_names.remove(common_name) dns_names = [common_name] + list(dns_names) - return dns_names, list(emails) + return dns_names, list(emails), (host, port) @staticmethod def get_cert_sans(cert): diff --git a/bbot/test/bbot_fixtures.py b/bbot/test/bbot_fixtures.py index 5b8d2ffe0e..2b0553475a 100644 --- a/bbot/test/bbot_fixtures.py +++ b/bbot/test/bbot_fixtures.py @@ -7,7 +7,6 @@ import tldextract from pathlib import Path from omegaconf import OmegaConf -from pytest_httpserver import HTTPServer import pytest_httpserver from werkzeug.wrappers 
import Request @@ -337,21 +336,3 @@ def install_all_python_deps(): for module in module_loader.preloaded().values(): deps_pip.update(set(module.get("deps", {}).get("pip", []))) subprocess.run([sys.executable, "-m", "pip", "install"] + list(deps_pip)) - - -@pytest.fixture -def bbot_httpserver(): - server = HTTPServer(host="127.0.0.1", port=8888) - server.start() - - yield server - - server.clear() - if server.is_running(): - server.stop() - - # this is to check if the client has made any request where no - # `assert_request` was called on it from the test - - server.check_assertions() - server.clear() diff --git a/bbot/test/conftest.py b/bbot/test/conftest.py index 85a3f82504..be448d9feb 100644 --- a/bbot/test/conftest.py +++ b/bbot/test/conftest.py @@ -1,6 +1,7 @@ import shutil import pytest import logging +from pytest_httpserver import HTTPServer @pytest.hookimpl(tryfirst=True, hookwrapper=True) @@ -16,3 +17,21 @@ def pytest_sessionfinish(session, exitstatus): shutil.rmtree("/tmp/.bbot_test", ignore_errors=True) yield + + +@pytest.fixture +def bbot_httpserver(): + server = HTTPServer(host="127.0.0.1", port=8888) + server.start() + + yield server + + server.clear() + if server.is_running(): + server.stop() + + # this is to check if the client has made any request where no + # `assert_request` was called on it from the test + + server.check_assertions() + server.clear() diff --git a/bbot/test/pytest.ini b/bbot/test/pytest.ini deleted file mode 100644 index 3396baacfc..0000000000 --- a/bbot/test/pytest.ini +++ /dev/null @@ -1 +0,0 @@ -log_level=DEBUG \ No newline at end of file diff --git a/bbot/test/test.conf b/bbot/test/test.conf index 80daae5a53..86dcb526b9 100644 --- a/bbot/test/test.conf +++ b/bbot/test/test.conf @@ -41,3 +41,8 @@ excavate: false aggregate: false omit_event_types: [] debug: true +dns_wildcard_ignore: + - blacklanternsecurity.com + - google + - google.com + - example.com \ No newline at end of file diff --git a/poetry.lock b/poetry.lock index 146a03dd54..1588260caf 100644 --- a/poetry.lock +++ b/poetry.lock @@ -1155,18 +1155,17 @@ files = [ [[package]] name = "pytest" -version = "7.2.2" +version = "7.3.1" description = "pytest: simple powerful testing with Python" category = "dev" optional = false python-versions = ">=3.7" files = [ - {file = "pytest-7.2.2-py3-none-any.whl", hash = "sha256:130328f552dcfac0b1cec75c12e3f005619dc5f874f0a06e8ff7263f0ee6225e"}, - {file = "pytest-7.2.2.tar.gz", hash = "sha256:c99ab0c73aceb050f68929bc93af19ab6db0558791c6a0715723abe9d0ade9d4"}, + {file = "pytest-7.3.1-py3-none-any.whl", hash = "sha256:3799fa815351fea3a5e96ac7e503a96fa51cc9942c3753cda7651b93c1cfa362"}, + {file = "pytest-7.3.1.tar.gz", hash = "sha256:434afafd78b1d78ed0addf160ad2b77a30d35d4bdf8af234fe621919d9ed15e3"}, ] [package.dependencies] -attrs = ">=19.2.0" colorama = {version = "*", markers = "sys_platform == \"win32\""} exceptiongroup = {version = ">=1.0.0rc8", markers = "python_version < \"3.11\""} iniconfig = "*" @@ -1175,7 +1174,7 @@ pluggy = ">=0.12,<2.0" tomli = {version = ">=1.0.0", markers = "python_version < \"3.11\""} [package.extras] -testing = ["argcomplete", "hypothesis (>=3.56)", "mock", "nose", "pygments (>=2.7.2)", "requests", "xmlschema"] +testing = ["argcomplete", "attrs (>=19.2.0)", "hypothesis (>=3.56)", "mock", "nose", "pygments (>=2.7.2)", "requests", "xmlschema"] [[package]] name = "pytest-asyncio" From 55199e28d7cbf5f3f30511fd93c27e104650c480 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Wed, 17 May 2023 18:14:30 -0400 Subject: [PATCH 025/387] 
restored timeout --- bbot/modules/sslcert.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/bbot/modules/sslcert.py b/bbot/modules/sslcert.py index cc437cc0d0..947bbe6aa5 100644 --- a/bbot/modules/sslcert.py +++ b/bbot/modules/sslcert.py @@ -123,9 +123,12 @@ async def visit_host(self, host, port): # Connect to the host try: - transport, _ = await self.scan._loop.create_connection( + transport, _ = await asyncio.wait_for(self.scan._loop.create_connection( lambda: asyncio.Protocol(), host, port, ssl=ssl_context - ) + ), timeout=self.timeout) + except asyncio.TimeoutError: + self.debug(f"Timed out after {self.timeout} seconds while connecting to {netloc}") + return [], [], (host, port) except Exception as e: log_fn = self.warning if isinstance(e, OSError): From 912697f4b9bd3a7e097c97ddd3bf692b247505ac Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Wed, 17 May 2023 18:14:40 -0400 Subject: [PATCH 026/387] blacked --- bbot/modules/sslcert.py | 7 ++++--- 1 file changed, 4 insertions(+), 3 deletions(-) diff --git a/bbot/modules/sslcert.py b/bbot/modules/sslcert.py index 947bbe6aa5..8792cecfa9 100644 --- a/bbot/modules/sslcert.py +++ b/bbot/modules/sslcert.py @@ -123,9 +123,10 @@ async def visit_host(self, host, port): # Connect to the host try: - transport, _ = await asyncio.wait_for(self.scan._loop.create_connection( - lambda: asyncio.Protocol(), host, port, ssl=ssl_context - ), timeout=self.timeout) + transport, _ = await asyncio.wait_for( + self.scan._loop.create_connection(lambda: asyncio.Protocol(), host, port, ssl=ssl_context), + timeout=self.timeout, + ) except asyncio.TimeoutError: self.debug(f"Timed out after {self.timeout} seconds while connecting to {netloc}") return [], [], (host, port) From e3ba806ececd07baf5de4b4ceeb96025c4b59093 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Thu, 18 May 2023 23:18:45 -0400 Subject: [PATCH 027/387] steadily writing module tests --- bbot/core/helpers/diff.py | 4 +- bbot/core/helpers/web.py | 3 + bbot/modules/builtwith.py | 23 ++++-- bbot/modules/censys.py | 158 +++++++++++++----------------------- bbot/modules/crt.py | 2 +- bbot/modules/dnsdumpster.py | 6 +- bbot/test/conftest.py | 5 ++ bbot/test/test.conf | 1 + 8 files changed, 88 insertions(+), 114 deletions(-) diff --git a/bbot/core/helpers/diff.py b/bbot/core/helpers/diff.py index 2f191e0db6..7203071df2 100644 --- a/bbot/core/helpers/diff.py +++ b/bbot/core/helpers/diff.py @@ -47,7 +47,9 @@ async def _baseline(self): if baseline_1 is None or baseline_2 is None: log.debug("HTTP error while establishing baseline, aborting") - raise HttpCompareError("Can't get baseline from source URL") + raise HttpCompareError( + f"Can't get baseline from source URL: {url_1}:{baseline_1} / {url_2}:{baseline_2}" + ) if baseline_1.status_code != baseline_2.status_code: log.debug("Status code not stable during baseline, aborting") raise HttpCompareError("Can't get baseline from source URL") diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index 6ed9fe8427..d47b6289f2 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -175,6 +175,9 @@ async def api_page_iter(self, url, page_size=100, json=True, **requests_kwargs): offset = 0 while 1: new_url = url.format(page=page, page_size=page_size, offset=offset) + data = requests_kwargs.get("data", None) + if data is not None: + requests_kwargs["data"] = requests_kwargs["data"].format(page=page, page_size=page_size, offset=offset) result = await self.request(new_url, **requests_kwargs) try: if json: diff 
--git a/bbot/modules/builtwith.py b/bbot/modules/builtwith.py index e8139d5dd8..6fabcd2833 100644 --- a/bbot/modules/builtwith.py +++ b/bbot/modules/builtwith.py @@ -52,7 +52,7 @@ async def request_redirects(self, query): def parse_domains(self, r, query): """ - This method yields subdomains. + This method returns a set of subdomains. Each subdomain is an "FQDN" that was reported in the "Detailed Technology Profile" page on builtwith.com Parameters @@ -60,20 +60,25 @@ def parse_domains(self, r, query): r (requests Response): The raw requests response from the API query (string): The query used against the API """ + results_set = set() + self.critical(r.content) json = r.json() if json: - for result in json.get("Results", []): - for chunk in result.get("Result", {}).get("Paths", []): - domain = chunk.get("Domain", "") - subdomain = chunk.get("SubDomain", "") - if domain: - if subdomain: - domain = f"{subdomain}.{domain}" - yield domain + results = json.get("Results", []) + if results: + for result in results: + for chunk in result.get("Result", {}).get("Paths", []): + domain = chunk.get("Domain", "") + subdomain = chunk.get("SubDomain", "") + if domain: + if subdomain: + domain = f"{subdomain}.{domain}" + results_set.add(domain) else: error = json.get("Errors", [{}])[0].get("Message", "Unknown Error") if error: self.verbose(f"No results for {query}: {error}") + return results_set def parse_redirects(self, r, query): """ diff --git a/bbot/modules/censys.py b/bbot/modules/censys.py index ed713472d7..283b902e37 100644 --- a/bbot/modules/censys.py +++ b/bbot/modules/censys.py @@ -1,122 +1,80 @@ -from contextlib import suppress - -from censys.common import exceptions -from censys.search import CensysHosts -from censys.search import CensysCertificates - from bbot.modules.shodan_dns import shodan_dns class censys(shodan_dns): + """ + thanks to https://github.com/owasp-amass/amass/blob/master/resources/scripts/cert/censys.ads + """ + watched_events = ["DNS_NAME"] produced_events = ["DNS_NAME", "EMAIL_ADDRESS", "IP_ADDRESS", "OPEN_PORT", "PROTOCOL"] flags = ["subdomain-enum", "email-enum", "passive", "safe"] meta = {"description": "Query the Censys API", "auth_required": True} - options = {"api_id": "", "api_secret": "", "max_records": 1000} - options_desc = { - "api_id": "Censys.io API ID", - "api_secret": "Censys.io API Secret", - "max_records": "Limit results to help prevent exceeding API quota", - } + options = {"api_id": "", "api_secret": ""} + options_desc = {"api_id": "Censys.io API ID", "api_secret": "Censys.io API Secret"} - deps_pip = ["censys~=2.1.9"] + base_url = "https://search.censys.io/api/v1" async def setup(self): - self.max_records = self.config.get("max_records", 1000) self.api_id = self.config.get("api_id", "") self.api_secret = self.config.get("api_secret", "") - self._cert_name_threshold = 20 - with suppress(Exception): - self.hosts = CensysHosts(api_id=self.api_id, api_secret=self.api_secret) - with suppress(Exception): - self.certificates = CensysCertificates(api_id=self.api_id, api_secret=self.api_secret) - return super().setup() + self.auth = (self.api_id, self.api_secret) + return await super().setup() async def ping(self): - quota = self.certificates.quota() - used = int(quota["used"]) - allowance = int(quota["allowance"]) + url = f"{self.base_url}/account" + resp = await self.helpers.request(url, auth=self.auth) + d = resp.json() + assert isinstance(d, dict), f"Invalid response from {url}: {resp}" + quota = d.get("quota", {}) + used = int(quota.get("used", 0)) + 
allowance = int(quota.get("allowance", 0)) assert used < allowance, "No quota remaining" async def query(self, query): - emails = set() - dns_names = set() - ip_addresses = dict() - try: - # certificates - certificate_query = f"parsed.names: {query}" - certificate_fields = ["parsed.names", "parsed.issuer_dn", "parsed.subject_dn"] - results = await self.scan.run_in_executor( - self.certificates.search, certificate_query, fields=certificate_fields, max_records=self.max_records + results = set() + page = 1 + while 1: + resp = await self.helpers.request( + f"{self.base_url}/search/certificates", + method="POST", + json={ + "query": f"parsed.names: {query}", + "page": page, + "fields": ["parsed.names"], + }, + auth=self.auth, ) - for result in results: - parsed_names = result.get("parsed.names", []) - # helps filter out third-party certs with a lot of garbage names - _filter = lambda x: True - domain = self.helpers.tldextract(query).domain - if len(parsed_names) > self._cert_name_threshold: - _filter = lambda x: domain in str(x.lower()) - parsed_names = list(filter(_filter, parsed_names)) - dns_names.update(set([n.lstrip(".*").rstrip(".").lower() for n in parsed_names])) - emails.update(set(self.helpers.extract_emails(result.get("parsed.issuer_dn", "")))) - emails.update(set(self.helpers.extract_emails(result.get("parsed.subject_dn", "")))) - - # hosts - per_page = 100 - pages = max(1, int(self.max_records / per_page)) - hosts_query = f"services.tls.certificates.leaf_data.names: {query} or services.tls.certificates.leaf_data.subject.email_address: {query}" - hosts_results = await self.scan.run_in_executor( - self.hosts.search, hosts_query, per_page=per_page, pages=pages - ) - for i, page in enumerate(hosts_results): - for result in page: - ip = result.get("ip", "") - if not ip: - continue - ip_addresses[ip] = [] - services = result.get("services", []) - for service in services: - port = service.get("port") - service_name = service.get("service_name", "") - transport_protocol = service.get("transport_protocol", "") - if not port or not transport_protocol: - continue - ip_addresses[ip].append((port, service_name, transport_protocol)) - if self.scan.stopping: - break - - except exceptions.CensysRateLimitExceededException: - self.warning("Exceeded Censys account limits") - except exceptions.CensysException as e: - self.warning(f"Error with API: {e}") - except Exception as e: - self.warning(f"Unknown error: {e}") - - return emails, dns_names, ip_addresses - - async def handle_event(self, event): - query = self.make_query(event) - emails, dns_names, ip_addresses = self.query(query) - for email in emails: - self.emit_event(email, "EMAIL_ADDRESS", source=event) - for dns_name in dns_names: - self.emit_event(dns_name, "DNS_NAME", source=event) - for ip, services in ip_addresses.items(): - ip_event = self.make_event(ip, "IP_ADDRESS", source=event) - if not ip_event: - continue - self.emit_event(ip_event) - for port, service_name, transport_protocol in services: - port_data = self.helpers.make_netloc(ip, port) - port_type = f"OPEN_{transport_protocol.upper()}_PORT" - port_event = self.make_event(port_data, port_type, source=ip_event) - if not port_event: - continue - self.emit_event(port_event) - if service_name: - service_name = str(service_name).upper() - protocol_data = {"host": port_data, "protocol": service_name} - self.emit_event(protocol_data, "PROTOCOL", source=port_event) + page += 1 + + if resp is None: + break + + d = resp.json() + if d is None: + break + elif not isinstance(d, dict): + break + 
+ error = d.get("error", "") + if error: + self.warning(error) + + if resp.status_code < 200 or resp.status_code >= 400: + break + + elif d.get("status") is None or d["status"] != "ok" or len(d.get("results", [])) == 0: + break + + for r in d["results"]: + for v in r["parsed.names"]: + results.add(v.strip(".*").lower()) + + metadata = d.get("metadata", {}) + if metadata.get("page", 0) >= metadata.get("pages", 0): + break + + return results @property def auth_secret(self): diff --git a/bbot/modules/crt.py b/bbot/modules/crt.py index a4410354ce..62d4a37fd6 100644 --- a/bbot/modules/crt.py +++ b/bbot/modules/crt.py @@ -12,7 +12,7 @@ class crt(crobat): async def setup(self): self.cert_ids = set() - return super().setup() + return await super().setup() async def request_url(self, query): params = {"q": f"%.{query}", "output": "json"} diff --git a/bbot/modules/dnsdumpster.py b/bbot/modules/dnsdumpster.py index 2d7f69a4b7..cff5b0692f 100644 --- a/bbot/modules/dnsdumpster.py +++ b/bbot/modules/dnsdumpster.py @@ -14,10 +14,10 @@ class dnsdumpster(crobat): base_url = "https://dnsdumpster.com" - def query(self, domain): + async def query(self, domain): ret = [] # first, get the CSRF tokens - res1 = self.request_with_fail_count(self.base_url) + res1 = await self.request_with_fail_count(self.base_url) status_code = getattr(res1, "status_code", 0) if status_code in [429]: self.verbose(f'Too many requests "{status_code}"') @@ -56,7 +56,7 @@ def query(self, domain): # Otherwise, do the needful subdomains = set() - res2 = self.request_with_fail_count( + res2 = await self.request_with_fail_count( f"{self.base_url}/", method="POST", cookies={"csrftoken": csrftoken}, diff --git a/bbot/test/conftest.py b/bbot/test/conftest.py index be448d9feb..0aca0ff1bd 100644 --- a/bbot/test/conftest.py +++ b/bbot/test/conftest.py @@ -19,6 +19,11 @@ def pytest_sessionfinish(session, exitstatus): yield +@pytest.fixture +def non_mocked_hosts() -> list: + return ["127.0.0.1"] + + @pytest.fixture def bbot_httpserver(): server = HTTPServer(host="127.0.0.1", port=8888) diff --git a/bbot/test/test.conf b/bbot/test/test.conf index 86dcb526b9..602190edd4 100644 --- a/bbot/test/test.conf +++ b/bbot/test/test.conf @@ -36,6 +36,7 @@ keep_scans: 1 agent_url: ws://127.0.0.1:8765 agent_token: test dns_resolution: false +dns_timeout: 1 speculate: false excavate: false aggregate: false From ea76f5619baecd7c7ac07b5b198dcbf9794a7de6 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 19 May 2023 20:24:06 -0400 Subject: [PATCH 028/387] rolling on module tests --- bbot/core/helpers/dns.py | 7 + bbot/modules/dnszonetransfer.py | 7 +- bbot/modules/emailformat.py | 11 +- bbot/modules/fullhunt.py | 7 +- bbot/test/helpers.py | 13 - bbot/test/modules_test_classes.py | 393 ------------------ bbot/test/test.conf | 2 + .../test/test_step_1/module_tests/__init__.py | 12 + bbot/test/test_step_1/module_tests/base.py | 132 ++++++ .../module_tests/test__module__tests.py | 35 ++ .../module_tests/test_module_affiliates.py | 11 + .../module_tests/test_module_aggregate.py | 11 + .../module_tests/test_module_anubisdb.py | 13 + .../module_tests/test_module_asn.py | 239 +++++++++++ .../test_module_asset_inventory.py | 17 + .../module_tests/test_module_azure_tenant.py | 46 ++ .../module_tests/test_module_badsecrets.py | 110 +++++ .../module_tests/test_module_bevigil.py | 24 ++ .../module_tests/test_module_binaryedge.py | 31 ++ .../module_tests/test_module_bucket_aws.py | 93 +++++ .../module_tests/test_module_bucket_azure.py | 13 + 
.../test_module_bucket_digitalocean.py | 10 + .../test_module_bucket_firebase.py | 13 + .../module_tests/test_module_bucket_gcp.py | 27 ++ .../module_tests/test_module_builtwith.py | 110 +++++ .../module_tests/test_module_bypass403.py | 50 +++ .../module_tests/test_module_c99.py | 25 ++ .../module_tests/test_module_censys.py | 41 ++ .../module_tests/test_module_certspotter.py | 14 + .../module_tests/test_module_crobat.py | 12 + .../module_tests/test_module_crt.py | 15 + .../module_tests/test_module_csv.py | 8 + .../module_tests/test_module_dnscommonsrv.py | 19 + .../module_tests/test_module_dnsdumpster.py | 18 + .../test_module_dnszonetransfer.py | 56 +++ .../module_tests/test_module_emailformat.py | 12 + .../module_tests/test_module_excavate.py | 141 +++++++ .../module_tests/test_module_ffuf.py | 45 ++ .../test_module_ffuf_shortnames.py | 208 +++++++++ .../module_tests/test_module_fingerprintx.py | 14 + .../module_tests/test_module_fullhunt.py | 48 +++ .../module_tests/test_module_generic_ssrf.py | 0 .../module_tests/test_module_github.py | 0 .../module_tests/test_module_gowitness.py | 0 .../module_tests/test_module_hackertarget.py | 0 .../module_tests/test_module_host_header.py | 0 .../module_tests/test_module_http.py | 0 .../module_tests/test_module_httpx.py | 0 .../module_tests/test_module_human.py | 0 .../module_tests/test_module_hunt.py | 0 .../module_tests/test_module_hunterio.py | 0 .../test_module_iis_shortnames.py | 0 .../module_tests/test_module_ipneighbor.py | 0 .../module_tests/test_module_ipstack.py | 0 .../module_tests/test_module_json.py | 0 .../module_tests/test_module_leakix.py | 0 .../module_tests/test_module_masscan.py | 0 .../module_tests/test_module_massdns.py | 0 .../module_tests/test_module_naabu.py | 0 .../module_tests/test_module_neo4j.py | 0 .../module_tests/test_module_ntlm.py | 0 .../module_tests/test_module_nuclei.py | 0 .../module_tests/test_module_otx.py | 0 .../test_module_paramminer_cookies.py | 0 .../test_module_paramminer_getparams.py | 0 .../test_module_paramminer_headers.py | 0 .../module_tests/test_module_passivetotal.py | 0 .../module_tests/test_module_pgp.py | 0 .../module_tests/test_module_python.py | 0 .../module_tests/test_module_rapiddns.py | 0 .../module_tests/test_module_riddler.py | 0 .../module_tests/test_module_robots.py | 0 .../module_tests/test_module_secretsdb.py | 0 .../test_module_securitytrails.py | 0 .../module_tests/test_module_services.py | 0 .../module_tests/test_module_shodan_dns.py | 0 .../module_tests/test_module_skymem.py | 0 .../module_tests/test_module_smuggler.py | 0 .../module_tests/test_module_social.py | 0 .../module_tests/test_module_speculate.py | 0 .../module_tests/test_module_sslcert.py | 8 + .../test_module_subdomain_hijack.py | 0 .../module_tests/test_module_sublist3r.py | 0 .../module_tests/test_module_telerik.py | 0 .../module_tests/test_module_threatminer.py | 0 .../test_module_url_manipulation.py | 0 .../module_tests/test_module_urlscan.py | 0 .../module_tests/test_module_vhost.py | 0 .../module_tests/test_module_viewdns.py | 0 .../module_tests/test_module_virustotal.py | 0 .../module_tests/test_module_wafw00f.py | 0 .../module_tests/test_module_wappalyzer.py | 0 .../module_tests/test_module_wayback.py | 0 .../module_tests/test_module_web_report.py | 0 .../module_tests/test_module_websocket.py | 0 .../module_tests/test_module_zoomeye.py | 0 96 files changed, 1703 insertions(+), 418 deletions(-) create mode 100644 bbot/test/test_step_1/module_tests/__init__.py create mode 100644 
bbot/test/test_step_1/module_tests/base.py create mode 100644 bbot/test/test_step_1/module_tests/test__module__tests.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_affiliates.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_aggregate.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_anubisdb.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_asn.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_asset_inventory.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_azure_tenant.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_badsecrets.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bevigil.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_binaryedge.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bucket_aws.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bucket_azure.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bucket_digitalocean.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bucket_firebase.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bucket_gcp.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_builtwith.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_bypass403.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_c99.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_censys.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_certspotter.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_crobat.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_crt.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_csv.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_dnsdumpster.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_emailformat.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_excavate.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_ffuf.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_ffuf_shortnames.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_fingerprintx.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_fullhunt.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_github.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_gowitness.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_hackertarget.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_host_header.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_http.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_httpx.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_human.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_hunt.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_hunterio.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_ipneighbor.py create mode 100644 
bbot/test/test_step_1/module_tests/test_module_ipstack.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_json.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_leakix.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_masscan.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_massdns.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_naabu.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_neo4j.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_ntlm.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_nuclei.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_otx.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_passivetotal.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_pgp.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_python.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_rapiddns.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_riddler.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_robots.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_secretsdb.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_securitytrails.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_services.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_shodan_dns.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_skymem.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_smuggler.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_social.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_speculate.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_sslcert.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_sublist3r.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_telerik.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_threatminer.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_url_manipulation.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_urlscan.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_vhost.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_viewdns.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_virustotal.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_wafw00f.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_wappalyzer.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_wayback.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_web_report.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_websocket.py create mode 100644 bbot/test/test_step_1/module_tests/test_module_zoomeye.py diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 4f4b651199..3c10bcc48d 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -431,6 +431,13 @@ async def 
is_wildcard(self, query, ips=None, rdtype=None): Note that is_wildcard can be True, False, or None (indicating that wildcard detection was inconclusive) """ result = {} + + # skip check if the query's parent domain is excluded in the config + for d in self.wildcard_ignore: + if self.parent_helper.host_in_host(query, d): + log.debug(f"Skipping wildcard detection on {query} because it is excluded in the config") + return {} + if rdtype is None: rdtype = "ANY" diff --git a/bbot/modules/dnszonetransfer.py b/bbot/modules/dnszonetransfer.py index 4a3fb5a58b..52a9b9634d 100644 --- a/bbot/modules/dnszonetransfer.py +++ b/bbot/modules/dnszonetransfer.py @@ -1,5 +1,6 @@ import dns.zone import dns.query +from functools import partial from bbot.modules.base import BaseModule @@ -36,10 +37,12 @@ async def handle_event(self, event): break try: self.debug(f"Attempting zone transfer against {nameserver} for domain {domain}") - xfr_answer = await dns.asyncquery.xfr(nameserver, domain, timeout=self.timeout, lifetime=self.timeout) + xfr_fn = partial(dns.query.xfr, timeout=self.timeout, lifetime=self.timeout) + xfr_answer = await self.scan.run_in_executor(xfr_fn, nameserver, domain) zone = dns.zone.from_xfr(xfr_answer) except Exception as e: - self.debug(f"Error retrieving zone: {e}") + self.verbose(f"Error retrieving zone: {e}") + self.trace() continue self.hugesuccess(f"Successful zone transfer against {nameserver} for domain {domain}!") finding_description = f"Successful DNS zone transfer against {nameserver} for {domain}" diff --git a/bbot/modules/emailformat.py b/bbot/modules/emailformat.py index fa47f23cf5..f28e19f9d9 100644 --- a/bbot/modules/emailformat.py +++ b/bbot/modules/emailformat.py @@ -10,16 +10,13 @@ class emailformat(viewdns): base_url = "https://www.email-format.com" - def extract_emails(self, content): - yield from self.helpers.regexes.email_regex.findall(content) - - def handle_event(self, event): + async def handle_event(self, event): _, query = self.helpers.split_domain(event.data) url = f"{self.base_url}/d/{self.helpers.quote(query)}/" - r = self.request_with_fail_count(url) + r = await self.request_with_fail_count(url) + self.hugesuccess(r.content) if not r: return - for email in self.extract_emails(r.text): - email = email.lower() + for email in self.helpers.extract_emails(r.text): if email.endswith(query): self.emit_event(email, "EMAIL_ADDRESS", source=event) diff --git a/bbot/modules/fullhunt.py b/bbot/modules/fullhunt.py index 4d6e740b09..8bc5d23265 100644 --- a/bbot/modules/fullhunt.py +++ b/bbot/modules/fullhunt.py @@ -14,17 +14,18 @@ class fullhunt(shodan_dns): async def setup(self): self.api_key = self.config.get("api_key", "") self.headers = {"x-api-key": self.api_key} - return super().setup() + return await super().setup() async def ping(self): url = f"{self.base_url}/auth/status" - j = await self.request_with_fail_count(url, headers=self.headers).json() + j = (await self.request_with_fail_count(url, headers=self.headers)).json() remaining = j["user_credits"]["remaining_credits"] assert remaining > 0, "No credits remaining" async def request_url(self, query): url = f"{self.base_url}/domain/{self.helpers.quote(query)}/subdomains" - return await self.request_with_fail_count(url, headers=self.headers) + response = await self.request_with_fail_count(url, headers=self.headers) + return response def parse_results(self, r, query): return r.json().get("hosts", []) diff --git a/bbot/test/helpers.py b/bbot/test/helpers.py index 0cfafafc99..a4aa453c9a 100644 --- a/bbot/test/helpers.py 
+++ b/bbot/test/helpers.py @@ -91,16 +91,3 @@ def set_expect_requests(self, expect_args={}, respond_args={}): def _after_scan_prep(self): self.mock_args() - - -def tempwordlist(content): - tmp_path = "/tmp/.bbot_test/" - from bbot.core.helpers.misc import rand_string, mkdir - - mkdir(tmp_path) - filename = f"{tmp_path}{rand_string(8)}" - with open(filename, "w", errors="ignore") as f: - for c in content: - line = f"{c}\n" - f.write(line) - return filename diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py index 30088c65cf..a4a7665ebf 100644 --- a/bbot/test/modules_test_classes.py +++ b/bbot/test/modules_test_classes.py @@ -73,151 +73,6 @@ def check_events(self, events): assert technology, "No TECHNOLOGY emitted" -class Excavate(HttpxMockHelper): - additional_modules = ["httpx"] - targets = ["http://127.0.0.1:8888/", "test.notreal", "http://127.0.0.1:8888/subdir/links.html"] - - config_overrides = {"web_spider_distance": 1, "web_spider_depth": 1} - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 404 - - def mock_args(self): - response_data = """ - ftp://ftp.test.notreal - \\nhttps://www1.test.notreal - \\x3dhttps://www2.test.notreal - %0ahttps://www3.test.notreal - \\u000ahttps://www4.test.notreal - \nwww5.test.notreal - \\x3dwww6.test.notreal - %0awww7.test.notreal - \\u000awww8.test.notreal - - """ - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": response_data} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - # verify relatives path a-tag parsing is working correctly - - expect_args = {"method": "GET", "uri": "/subdir/links.html"} - respond_args = {"response_data": ""} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/relative.html"} - respond_args = {"response_data": ""} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - event_data = [e.data for e in events] - assert "https://www1.test.notreal/" in event_data - assert "https://www2.test.notreal/" in event_data - assert "https://www3.test.notreal/" in event_data - assert "https://www4.test.notreal/" in event_data - assert "www1.test.notreal" in event_data - assert "www2.test.notreal" in event_data - assert "www3.test.notreal" in event_data - assert "www4.test.notreal" in event_data - assert "www5.test.notreal" in event_data - assert "www6.test.notreal" in event_data - assert "www7.test.notreal" in event_data - assert "www8.test.notreal" in event_data - assert "http://www9.test.notreal/" in event_data - - assert "nhttps://www1.test.notreal/" not in event_data - assert "x3dhttps://www2.test.notreal/" not in event_data - assert "a2https://www3.test.notreal/" not in event_data - assert "uac20https://www4.test.notreal/" not in event_data - assert "nwww5.test.notreal" not in event_data - assert "x3dwww6.test.notreal" not in event_data - assert "a2www7.test.notreal" not in event_data - assert "uac20www8.test.notreal" not in event_data - - assert any( - e.type == "FINDING" and e.data.get("description", "") == "Non-HTTP URI: ftp://ftp.test.notreal" - for e in events - ) - assert any( - e.type == "PROTOCOL" - and e.data.get("protocol", "") == "FTP" - and e.data.get("host", "") == "ftp.test.notreal" - for e in events - ) - - assert any( - e.type == "URL_UNVERIFIED" - and e.data == "http://127.0.0.1:8888/relative.html" - and "spider-danger" not in e.tags - for e in events - ) - - assert any( 
- e.type == "URL_UNVERIFIED" - and e.data == "http://127.0.0.1:8888/2/depth2.html" - and "spider-danger" in e.tags - for e in events - ) - - assert any( - e.type == "URL_UNVERIFIED" - and e.data == "http://127.0.0.1:8888/distance2.html" - and "spider-danger" in e.tags - for e in events - ) - - -class Excavate_relativelinks(HttpxMockHelper): - additional_modules = ["httpx"] - targets = ["http://127.0.0.1:8888/", "test.notreal", "http://127.0.0.1:8888/subdir/"] - config_overrides = {"web_spider_distance": 1, "web_spider_depth": 1} - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 404 - - def mock_args(self): - # root relative - expect_args = {"method": "GET", "uri": "/rootrelative.html"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - # page relative - expect_args = {"method": "GET", "uri": "/subdir/pagerelative.html"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/subdir/"} - respond_args = { - "response_data": "root relativepage relative" - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - root_relative_detection = False - page_relative_detection = False - root_page_confusion_1 = False - root_page_confusion_2 = False - - for e in events: - if e.type == "URL_UNVERIFIED": - # these cases represent the desired behavior for parsing relative links - if e.data == "http://127.0.0.1:8888/rootrelative.html": - root_relative_detection = True - if e.data == "http://127.0.0.1:8888/subdir/pagerelative.html": - page_relative_detection = True - - # these cases indicates that excavate parsed the relative links incorrectly - if e.data == "http://127.0.0.1:8888/pagerelative.html": - root_page_confusion_1 = True - if e.data == "http://127.0.0.1:8888/subdir/rootrelative.html": - root_page_confusion_2 = True - - assert root_relative_detection, "Failed to properly excavate root-relative URL" - assert page_relative_detection, "Failed to properly excavate page-relative URL" - assert not root_page_confusion_1, "Incorrectly detected page-relative URL" - assert not root_page_confusion_2, "Incorrectly detected root-relative URL" - - class Subdomain_Hijack(HttpxMockHelper): additional_modules = ["httpx", "excavate"] @@ -1162,52 +1017,6 @@ def check_events(self, events): assert any(e.type == "WAF" and "LiteSpeed" in e.data["WAF"] for e in events) -class Ffuf(HttpxMockHelper): - test_wordlist = ["11111111", "admin", "junkword1", "zzzjunkword2"] - config_overrides = { - "modules": { - "ffuf": { - "wordlist": tempwordlist(test_wordlist), - } - } - } - - additional_modules = ["httpx"] - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/admin"} - respond_args = {"response_data": "alive admin page"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "URL_UNVERIFIED" and "admin" in e.data for e in events) - assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events) - - -class Ffuf_extensions(HttpxMockHelper): - test_wordlist = ["11111111", "console", "junkword1", "zzzjunkword2"] - config_overrides = {"modules": {"ffuf": {"wordlist": 
tempwordlist(test_wordlist), "extensions": "php"}}} - - additional_modules = ["httpx"] - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/console.php"} - respond_args = {"response_data": "alive admin page"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "URL_UNVERIFIED" and "console" in e.data for e in events) - assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events) - - class Vhost(HttpxMockHelper): targets = ["http://localhost:8888", "secret.localhost"] @@ -1274,208 +1083,6 @@ def check_events(self, events): assert wordcloud_detection -class Ffuf_shortnames(HttpxMockHelper): - test_wordlist = ["11111111", "administrator", "portal", "console", "junkword1", "zzzjunkword2", "directory"] - config_overrides = { - "modules": { - "ffuf_shortnames": { - "find_common_prefixes": True, - "find_common_prefixes": True, - "wordlist": tempwordlist(test_wordlist), - } - } - } - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 404 - - seed_events = [] - parent_event = self.scan.make_event( - "http://127.0.0.1:8888/", "URL", self.scan.root_event, module="httpx", tags=["status-200", "distance-0"] - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ADMINI~1.ASP", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ADM_PO~1.ASP", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ABCZZZ~1.ASP", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ABCXXX~1.ASP", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ABCYYY~1.ASP", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ABCCON~1.ASP", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/DIRECT~1", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-directory"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/ADM_DI~1", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-directory"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/XYZDIR~1", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-directory"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/XYZAAA~1", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-directory"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/XYZBBB~1", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-directory"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/XYZCCC~1", - "URL_HINT", - parent_event, - module="iis_shortnames", - 
tags=["shortname-directory"], - ) - ) - seed_events.append( - self.scan.make_event( - "http://127.0.0.1:8888/SHORT~1.PL", - "URL_HINT", - parent_event, - module="iis_shortnames", - tags=["shortname-file"], - ) - ) - self.scan.target._events["http://127.0.0.1:8888"] = seed_events - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/administrator.aspx"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/adm_portal.aspx"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/abcconsole.aspx"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/directory/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/adm_directory/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/xyzdirectory/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/short.pl"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - basic_detection = False - directory_detection = False - prefix_detection = False - delimeter_detection = False - directory_delimeter_detection = False - prefix_delimeter_detection = False - short_extensions_detection = False - - for e in events: - if e.type == "URL_UNVERIFIED": - if e.data == "http://127.0.0.1:8888/administrator.aspx": - basic_detection = True - if e.data == "http://127.0.0.1:8888/directory/": - directory_detection = True - if e.data == "http://127.0.0.1:8888/adm_portal.aspx": - prefix_detection = True - if e.data == "http://127.0.0.1:8888/abcconsole.aspx": - delimeter_detection = True - if e.data == "http://127.0.0.1:8888/abcconsole.aspx": - directory_delimeter_detection = True - if e.data == "http://127.0.0.1:8888/xyzdirectory/": - prefix_delimeter_detection = True - if e.data == "http://127.0.0.1:8888/short.pl": - short_extensions_detection = True - - assert basic_detection - assert directory_detection - assert prefix_detection - assert delimeter_detection - assert directory_delimeter_detection - assert prefix_delimeter_detection - assert short_extensions_detection - - class Iis_shortnames(HttpxMockHelper): additional_modules = ["httpx"] diff --git a/bbot/test/test.conf b/bbot/test/test.conf index 602190edd4..9444e1d14c 100644 --- a/bbot/test/test.conf +++ b/bbot/test/test.conf @@ -44,6 +44,8 @@ omit_event_types: [] debug: true dns_wildcard_ignore: - blacklanternsecurity.com + - fakedomain + - notreal - google - google.com - example.com \ No newline at end of file diff --git a/bbot/test/test_step_1/module_tests/__init__.py b/bbot/test/test_step_1/module_tests/__init__.py new file mode 100644 index 0000000000..0b098d46a2 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/__init__.py @@ -0,0 +1,12 @@ +from pathlib import Path + +from bbot.modules import module_loader + +parent_dir = Path(__file__).parent + +module_test_files = list(parent_dir.glob("test_module_*.py")) 
+module_test_files = [m.name.split("test_module_")[-1].split(".")[0] for m in module_test_files] + +for module_name in module_loader.preloaded(): + module_name = module_name.lower() + assert module_name in module_test_files, f'No test file found for module "{module_name}"' diff --git a/bbot/test/test_step_1/module_tests/base.py b/bbot/test/test_step_1/module_tests/base.py new file mode 100644 index 0000000000..2f5f935591 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/base.py @@ -0,0 +1,132 @@ +import pytest +import pytest_asyncio +import logging +from abc import abstractmethod +from omegaconf import OmegaConf + +from bbot.scanner import Scanner +from bbot.modules import module_loader +from bbot.core.helpers.misc import rand_string +from ...bbot_fixtures import test_config + +log = logging.getLogger("bbot.test.modules") + + +def tempwordlist(content): + tmp_path = "/tmp/.bbot_test/" + from bbot.core.helpers.misc import rand_string, mkdir + + mkdir(tmp_path) + filename = f"{tmp_path}{rand_string(8)}" + with open(filename, "w", errors="ignore") as f: + for c in content: + line = f"{c}\n" + f.write(line) + return filename + + +class TestClass: + @pytest_asyncio.fixture + async def my_fixture(self, bbot_httpserver): + yield bbot_httpserver + + @pytest.mark.asyncio + async def test_asdf(self, my_fixture): + log.critical(my_fixture) + + +class ModuleTestBase: + targets = ["blacklanternsecurity.com"] + scan_name = None + blacklist = None + whitelist = None + module_name = None + config_overrides = {} + modules_overrides = [] + + class ModuleTest: + def __init__(self, module_test_base, httpx_mock, httpserver, monkeypatch): + self.name = module_test_base.name + self.config = OmegaConf.merge(test_config, OmegaConf.create(module_test_base.config_overrides)) + + self.httpx_mock = httpx_mock + self.httpserver = httpserver + self.monkeypatch = monkeypatch + + # handle output, internal module types + preloaded = module_loader.preloaded() + output_modules = None + modules = list(module_test_base.modules) + output_modules = [] + for module in list(modules): + module_type = preloaded[module]["type"] + if module_type in ("internal", "output"): + modules.remove(module) + if module_type == "output": + output_modules.append(module) + elif module_type == "internal": + self.config = OmegaConf.merge(self.config, {module: True}) + if not output_modules: + output_modules = None + + self.scan = Scanner( + *module_test_base.targets, + modules=modules, + output_modules=output_modules, + name=module_test_base._scan_name, + config=self.config, + whitelist=module_test_base.whitelist, + blacklist=module_test_base.blacklist, + ) + self.events = [] + self.log = logging.getLogger(f"bbot.test.{module_test_base.name}") + + def set_expect_requests(self, expect_args={}, respond_args={}): + if "uri" not in expect_args: + expect_args["uri"] = "/" + self.httpserver.expect_request(**expect_args).respond_with_data(**respond_args) + + @property + def module(self): + return self.scan.modules[self.name] + + @pytest_asyncio.fixture + async def module_test(self, httpx_mock, bbot_httpserver, monkeypatch): + module_test = self.ModuleTest(self, httpx_mock, bbot_httpserver, monkeypatch) + self.setup_before_prep(module_test) + await module_test.scan.prep() + self.setup_after_prep(module_test) + module_test.events = [e async for e in module_test.scan.start()] + yield module_test + + @pytest.mark.asyncio + async def test_module_run(self, module_test): + self.check(module_test, module_test.events) + + @abstractmethod + def check(self, 
module_test, events): + raise NotImplementedError + + @property + def name(self): + if self.module_name is not None: + return self.module_name + return self.__class__.__name__.split("Test")[-1].lower() + + @property + def _scan_name(self): + if self.scan_name: + return self.scan_name + return f"{self.__class__.__name__.lower()}_test_{rand_string()}" + + @property + def modules(self): + if self.modules_overrides: + return self.modules_overrides + return [self.name] + + def setup_before_prep(self, module_test): + pass + + def setup_after_prep(self, module_test): + pass diff --git a/bbot/test/test_step_1/module_tests/test__module__tests.py b/bbot/test/test_step_1/module_tests/test__module__tests.py new file mode 100644 index 0000000000..4fbc60aa8a --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test__module__tests.py @@ -0,0 +1,35 @@ +import logging +import importlib +from pathlib import Path + +from .base import ModuleTestBase +from bbot.modules import module_loader + +log = logging.getLogger("bbot.test.modules") + +parent_dir = Path(__file__).parent + +_module_test_files = list(parent_dir.glob("test_module_*.py")) +_module_test_files.sort(key=lambda p: p.name) +module_test_files = [m.name.split("test_module_")[-1].split(".")[0] for m in _module_test_files] + + +def test__module__tests(): + # make sure each module has a .py file + for module_name in module_loader.preloaded(): + module_name = module_name.lower() + assert module_name in module_test_files, f'No test file found for module "{module_name}"' + + # make sure each test file has a test class + for file in _module_test_files: + module_name = file.stem + import_path = f"bbot.test.test_step_1.module_tests.{module_name}" + module_test_variables = importlib.import_module(import_path, "bbot") + module_pass = False + for var_name in dir(module_test_variables): + if var_name.startswith("Test"): + test_class = getattr(module_test_variables, var_name) + if ModuleTestBase in getattr(test_class, "__mro__", ()): + module_pass = True + break + assert module_pass, f"Couldn't find a test class for {module_name} in {file}" diff --git a/bbot/test/test_step_1/module_tests/test_module_affiliates.py b/bbot/test/test_step_1/module_tests/test_module_affiliates.py new file mode 100644 index 0000000000..18737cb831 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_affiliates.py @@ -0,0 +1,11 @@ +from .base import ModuleTestBase + + +class TestAffiliates(ModuleTestBase): + targets = ["8.8.8.8"] + config_overrides = {"dns_resolution": True} + + def check(self, module_test, events): + filename = next(module_test.scan.home.glob("affiliates-table*.txt")) + with open(filename) as f: + assert "zdns.google" in f.read() diff --git a/bbot/test/test_step_1/module_tests/test_module_aggregate.py b/bbot/test/test_step_1/module_tests/test_module_aggregate.py new file mode 100644 index 0000000000..b3d72c57e9 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_aggregate.py @@ -0,0 +1,11 @@ +from .base import ModuleTestBase + + +class TestAggregate(ModuleTestBase): + config_overrides = {"dns_resolution": True} + + def check(self, module_test, events): + module_test.log.critical(events) + filename = next(module_test.scan.home.glob("scan-stats-table*.txt")) + with open(filename) as f: + assert "| A " in f.read() diff --git a/bbot/test/test_step_1/module_tests/test_module_anubisdb.py b/bbot/test/test_step_1/module_tests/test_module_anubisdb.py new file mode 100644 index 0000000000..d4a7168d89 --- /dev/null +++ 
b/bbot/test/test_step_1/module_tests/test_module_anubisdb.py @@ -0,0 +1,13 @@ +from .base import ModuleTestBase + + +class TestAnubisdb(ModuleTestBase): + def setup_after_prep(self, module_test): + module_test.module.abort_if = lambda e: False + module_test.httpx_mock.add_response( + url=f"https://jldc.me/anubis/subdomains/blacklanternsecurity.com", + json=["asdf.blacklanternsecurity.com", "zzzz.blacklanternsecurity.com"], + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_asn.py b/bbot/test/test_step_1/module_tests/test_module_asn.py new file mode 100644 index 0000000000..b027dfc04a --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_asn.py @@ -0,0 +1,239 @@ +from .base import ModuleTestBase + + +class TestASNBGPView(ModuleTestBase): + targets = ["8.8.8.8"] + module_name = "asn" + config_overrides = {"scope_report_distance": 2} + + response_get_asn_bgpview = { + "status": "ok", + "status_message": "Query was successful", + "data": { + "ip": "8.8.8.8", + "ptr_record": "dns.google", + "prefixes": [ + { + "prefix": "8.8.8.0/24", + "ip": "8.8.8.0", + "cidr": 24, + "asn": {"asn": 15169, "name": "GOOGLE", "description": "Google LLC", "country_code": "US"}, + "name": "LVLT-GOGL-8-8-8", + "description": "Google LLC", + "country_code": "US", + } + ], + "rir_allocation": { + "rir_name": "ARIN", + "country_code": None, + "ip": "8.0.0.0", + "cidr": 9, + "prefix": "8.0.0.0/9", + "date_allocated": "1992-12-01 00:00:00", + "allocation_status": "allocated", + }, + "iana_assignment": { + "assignment_status": "legacy", + "description": "Administered by ARIN", + "whois_server": "whois.arin.net", + "date_assigned": None, + }, + "maxmind": {"country_code": None, "city": None}, + }, + "@meta": {"time_zone": "UTC", "api_version": 1, "execution_time": "567.18 ms"}, + } + response_get_emails_bgpview = { + "status": "ok", + "status_message": "Query was successful", + "data": { + "asn": 15169, + "name": "GOOGLE", + "description_short": "Google LLC", + "description_full": ["Google LLC"], + "country_code": "US", + "website": "https://about.google/intl/en/", + "email_contacts": ["network-abuse@google.com", "arin-contact@google.com"], + "abuse_contacts": ["network-abuse@google.com"], + "looking_glass": None, + "traffic_estimation": None, + "traffic_ratio": "Mostly Outbound", + "owner_address": ["1600 Amphitheatre Parkway", "Mountain View", "CA", "94043", "US"], + "rir_allocation": { + "rir_name": "ARIN", + "country_code": "US", + "date_allocated": "2000-03-30 00:00:00", + "allocation_status": "assigned", + }, + "iana_assignment": { + "assignment_status": None, + "description": None, + "whois_server": None, + "date_assigned": None, + }, + "date_updated": "2023-02-07 06:39:11", + }, + "@meta": {"time_zone": "UTC", "api_version": 1, "execution_time": "56.55 ms"}, + } + + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.bgpview.io/ip/8.8.8.8", json=self.response_get_asn_bgpview + ) + module_test.httpx_mock.add_response( + url="https://api.bgpview.io/asn/15169", json=self.response_get_emails_bgpview + ) + module_test.module.sources = ["bgpview"] + + def check(self, module_test, events): + assert any(e.type == "ASN" for e in events) + assert any(e.type == "EMAIL_ADDRESS" for e in events) + + +class TestASNRipe(ModuleTestBase): + targets = ["8.8.8.8"] + module_name = "asn" + config_overrides = 
{"scope_report_distance": 2} + + response_get_asn_ripe = { + "messages": [], + "see_also": [], + "version": "1.1", + "data_call_name": "network-info", + "data_call_status": "supported", + "cached": False, + "data": {"asns": ["15169"], "prefix": "8.8.8.0/24"}, + "query_id": "20230217212133-f278ff23-d940-4634-8115-a64dee06997b", + "process_time": 5, + "server_id": "app139", + "build_version": "live.2023.2.1.142", + "status": "ok", + "status_code": 200, + "time": "2023-02-17T21:21:33.428469", + } + response_get_asn_metadata_ripe = { + "messages": [], + "see_also": [], + "version": "4.1", + "data_call_name": "whois", + "data_call_status": "supported - connecting to ursa", + "cached": False, + "data": { + "records": [ + [ + {"key": "ASNumber", "value": "15169", "details_link": None}, + {"key": "ASName", "value": "GOOGLE", "details_link": None}, + {"key": "ASHandle", "value": "15169", "details_link": "https://stat.ripe.net/AS15169"}, + {"key": "RegDate", "value": "2000-03-30", "details_link": None}, + { + "key": "Ref", + "value": "https://rdap.arin.net/registry/autnum/15169", + "details_link": "https://rdap.arin.net/registry/autnum/15169", + }, + {"key": "source", "value": "ARIN", "details_link": None}, + ], + [ + {"key": "OrgAbuseHandle", "value": "ABUSE5250-ARIN", "details_link": None}, + {"key": "OrgAbuseName", "value": "Abuse", "details_link": None}, + {"key": "OrgAbusePhone", "value": "+1-650-253-0000", "details_link": None}, + { + "key": "OrgAbuseEmail", + "value": "network-abuse@google.com", + "details_link": "mailto:network-abuse@google.com", + }, + { + "key": "OrgAbuseRef", + "value": "https://rdap.arin.net/registry/entity/ABUSE5250-ARIN", + "details_link": "https://rdap.arin.net/registry/entity/ABUSE5250-ARIN", + }, + {"key": "source", "value": "ARIN", "details_link": None}, + ], + [ + {"key": "OrgName", "value": "Google LLC", "details_link": None}, + {"key": "OrgId", "value": "GOGL", "details_link": None}, + {"key": "Address", "value": "1600 Amphitheatre Parkway", "details_link": None}, + {"key": "City", "value": "Mountain View", "details_link": None}, + {"key": "StateProv", "value": "CA", "details_link": None}, + {"key": "PostalCode", "value": "94043", "details_link": None}, + {"key": "Country", "value": "US", "details_link": None}, + {"key": "RegDate", "value": "2000-03-30", "details_link": None}, + { + "key": "Comment", + "value": "Please note that the recommended way to file abuse complaints are located in the following links.", + "details_link": None, + }, + { + "key": "Comment", + "value": "To report abuse and illegal activity: https://www.google.com/contact/", + "details_link": None, + }, + { + "key": "Comment", + "value": "For legal requests: http://support.google.com/legal", + "details_link": None, + }, + {"key": "Comment", "value": "Regards,", "details_link": None}, + {"key": "Comment", "value": "The Google Team", "details_link": None}, + { + "key": "Ref", + "value": "https://rdap.arin.net/registry/entity/GOGL", + "details_link": "https://rdap.arin.net/registry/entity/GOGL", + }, + {"key": "source", "value": "ARIN", "details_link": None}, + ], + [ + {"key": "OrgTechHandle", "value": "ZG39-ARIN", "details_link": None}, + {"key": "OrgTechName", "value": "Google LLC", "details_link": None}, + {"key": "OrgTechPhone", "value": "+1-650-253-0000", "details_link": None}, + { + "key": "OrgTechEmail", + "value": "arin-contact@google.com", + "details_link": "mailto:arin-contact@google.com", + }, + { + "key": "OrgTechRef", + "value": "https://rdap.arin.net/registry/entity/ZG39-ARIN", + 
"details_link": "https://rdap.arin.net/registry/entity/ZG39-ARIN", + }, + {"key": "source", "value": "ARIN", "details_link": None}, + ], + [ + {"key": "RTechHandle", "value": "ZG39-ARIN", "details_link": None}, + {"key": "RTechName", "value": "Google LLC", "details_link": None}, + {"key": "RTechPhone", "value": "+1-650-253-0000", "details_link": None}, + {"key": "RTechEmail", "value": "arin-contact@google.com", "details_link": None}, + { + "key": "RTechRef", + "value": "https://rdap.arin.net/registry/entity/ZG39-ARIN", + "details_link": None, + }, + {"key": "source", "value": "ARIN", "details_link": None}, + ], + ], + "irr_records": [], + "authorities": ["arin"], + "resource": "15169", + "query_time": "2023-02-17T21:25:00", + }, + "query_id": "20230217212529-75f57efd-59f4-473f-8bdd-803062e94290", + "process_time": 268, + "server_id": "app143", + "build_version": "live.2023.2.1.142", + "status": "ok", + "status_code": 200, + "time": "2023-02-17T21:25:29.417812", + } + + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://stat.ripe.net/data/network-info/data.json?resource=8.8.8.8", + json=self.response_get_asn_ripe, + ) + module_test.httpx_mock.add_response( + url="https://stat.ripe.net/data/whois/data.json?resource=15169", + json=self.response_get_asn_metadata_ripe, + ) + module_test.module.sources = ["ripe"] + + def check(self, module_test, events): + assert any(e.type == "ASN" for e in events) + assert any(e.type == "EMAIL_ADDRESS" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_asset_inventory.py b/bbot/test/test_step_1/module_tests/test_module_asset_inventory.py new file mode 100644 index 0000000000..b128fd6275 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_asset_inventory.py @@ -0,0 +1,17 @@ +from .base import ModuleTestBase + + +class TestAsset_Inventory(ModuleTestBase): + targets = ["8.8.8.8"] + config_overrides = {"dns_resolution": True} + + def check(self, module_test, events): + filename = next(module_test.scan.home.glob("asset-inventory.csv")) + with open(filename) as f: + assert "8.8.8.8,,8.8.8.8" in f.read() + filename = next(module_test.scan.home.glob("asset-inventory-ip-addresses-table*.txt")) + with open(filename) as f: + assert "8.8.0.0/16" in f.read() + filename = next(module_test.scan.home.glob("asset-inventory-domains-table*.txt")) + with open(filename) as f: + assert "dns.google" in f.read() diff --git a/bbot/test/test_step_1/module_tests/test_module_azure_tenant.py b/bbot/test/test_step_1/module_tests/test_module_azure_tenant.py new file mode 100644 index 0000000000..9e37b02069 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_azure_tenant.py @@ -0,0 +1,46 @@ +from .base import ModuleTestBase + + +class TestAzure_Tenant(ModuleTestBase): + tenant_response = """ + + + + http://schemas.microsoft.com/exchange/2010/Autodiscover/Autodiscover/GetFederationInformationResponse + + 15 + 20 + 6411 + 14 + Exchange2015 + + + + + + NoError + + outlook.com + + blacklanternsecurity.onmicrosoft.com + + + + https://login.microsoftonline.com/extSTS.srf + urn:federation:MicrosoftOnline + + + + + +""" + + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + method="POST", + url="https://autodiscover-s.outlook.com/autodiscover/autodiscover.svc", + text=self.tenant_response, + ) + + def check(self, module_test, events): + assert any(e.data == "blacklanternsecurity.onmicrosoft.com" and "affiliate" in e.tags for e in events) diff --git 
a/bbot/test/test_step_1/module_tests/test_module_badsecrets.py b/bbot/test/test_step_1/module_tests/test_module_badsecrets.py
new file mode 100644
index 0000000000..daa39f946a
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_badsecrets.py
@@ -0,0 +1,110 @@
+from .base import ModuleTestBase
+
+
+class TestBadSecrets(ModuleTestBase):
+    targets = [
+        "http://127.0.0.1:8888/",
+        "http://127.0.0.1:8888/test.aspx",
+        "http://127.0.0.1:8888/cookie.aspx",
+        "http://127.0.0.1:8888/cookie2.aspx",
+    ]
+
+    # NOTE: the HTML in these canned responses was stripped when the patch was
+    # flattened to text; the forms below are rebuilt from the viewstate values
+    # that check() asserts on
+    sample_viewstate = """<form method="post" action="./form.aspx" id="form1">
+<div class="aspNetHidden">
+<input type="hidden" name="__VIEWSTATE" id="__VIEWSTATE" value="rJdyYspajyiWEjvZ/SMXsU/1Q6Dp1XZ/19fZCABpGqWu+s7F1F/JT1s9mP9ED44fMkninhDc8eIq7IzSllZeJ9JVUME41i8ozheGunVSaESf4nBu" />
+</div>
+<div class="aspNetHidden">
+<input type="hidden" name="__VIEWSTATEGENERATOR" id="__VIEWSTATEGENERATOR" value="EDD8C9AE" />
+</div>
+</form>
+"""
+
+    sample_viewstate_notvuln = """<form method="post" action="./form.aspx" id="form1">
+<div class="aspNetHidden">
+<input type="hidden" name="__VIEWSTATE" id="__VIEWSTATE" value="AAAAYspajyiWEjvZ/SMXsU/1Q6Dp1XZ/19fZCABpGqWu+s7F1F/JT1s9mP9ED44fMkninhDc8eIq7IzSllZeJ9JVUME41i8ozheGunVSaESfAAAA" />
+</div>
+<div class="aspNetHidden">
+<input type="hidden" name="__VIEWSTATEGENERATOR" id="__VIEWSTATEGENERATOR" value="EDD8C9AE" />
+</div>
+</form>
+"""
+
+    modules_overrides = ["badsecrets", "httpx"]
+
+    def setup_after_prep(self, module_test):
+        expect_args = {"uri": "/test.aspx"}
+        respond_args = {"response_data": self.sample_viewstate}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        respond_args = {"response_data": self.sample_viewstate_notvuln}
+        module_test.set_expect_requests(respond_args=respond_args)
+
+        expect_args = {"uri": "/cookie.aspx"}
+        respond_args = {
+            "response_data": "<html><body><p>JWT Cookie Test</p></body></html>",
+            "headers": {
+                "set-cookie": "vulnjwt=eyJhbGciOiJIUzI1NiJ9.eyJJc3N1ZXIiOiJJc3N1ZXIiLCJVc2VybmFtZSI6IkJhZFNlY3JldHMiLCJleHAiOjE1OTMxMzM0ODMsImlhdCI6MTQ2NjkwMzA4M30.ovqRikAo_0kKJ0GVrAwQlezymxrLGjcEiW_s3UJMMCo; secure"
+            },
+        }
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"uri": "/cookie2.aspx"}
+        respond_args = {
+            "response_data": "<html><body><p>Express Cookie Test</p></body></html>",
+            "headers": {
+                "set-cookie": "connect.sid=s%3A8FnPwdeM9kdGTZlWvdaVtQ0S1BCOhY5G.qys7H2oGSLLdRsEq7sqh7btOohHsaRKqyjV4LiVnBvc; Path=/; Expires=Wed, 05 Apr 2023 04:47:29 GMT; HttpOnly"
+            },
+        }
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+    def check(self, module_test, events):
+        SecretFound = False
+        IdentifyOnly = False
+        CookieBasedDetection = False
+        CookieBasedDetection_2 = False
+
+        for e in events:
+            if (
+                e.type == "VULNERABILITY"
+                and e.data["description"]
+                == "Known Secret Found. Secret Type: [ASP.NET MachineKey] Secret: [validationKey: 0F97BAE23F6F36801ABDB5F145124E00A6F795A97093D778EE5CD24F35B78B6FC4C0D0D4420657689C4F321F8596B59E83F02E296E970C4DEAD2DFE226294979 validationAlgo: SHA1 encryptionKey: 8CCFBC5B7589DD37DC3B4A885376D7480A69645DAEEC74F418B4877BEC008156 encryptionAlgo: AES] Product Type: [ASP.NET Viewstate] Product: [rJdyYspajyiWEjvZ/SMXsU/1Q6Dp1XZ/19fZCABpGqWu+s7F1F/JT1s9mP9ED44fMkninhDc8eIq7IzSllZeJ9JVUME41i8ozheGunVSaESf4nBu] Detecting Module: [ASPNET_Viewstate]"
+            ):
+                SecretFound = True
+
+            if (
+                e.type == "FINDING"
+                and e.data["description"]
+                == "Cryptographic Product identified. Product Type: [ASP.NET Viewstate] Product: [AAAAYspajyiWEjvZ/SMXsU/1Q6Dp1XZ/19fZCABpGqWu+s7F1F/JT1s9mP9ED44fMkninhDc8eIq7IzSllZeJ9JVUME41i8ozheGunVSaESfAAAA] Detecting Module: [ASPNET_Viewstate]"
+            ):
+                IdentifyOnly = True
+
+            if (
+                e.type == "VULNERABILITY"
+                and e.data["description"]
+                == "Known Secret Found. Secret Type: [HMAC/RSA Key] Secret: [1234] Product Type: [JSON Web Token (JWT)] Product: [eyJhbGciOiJIUzI1NiJ9.eyJJc3N1ZXIiOiJJc3N1ZXIiLCJVc2VybmFtZSI6IkJhZFNlY3JldHMiLCJleHAiOjE1OTMxMzM0ODMsImlhdCI6MTQ2NjkwMzA4M30.ovqRikAo_0kKJ0GVrAwQlezymxrLGjcEiW_s3UJMMCo] Detecting Module: [Generic_JWT]"
+            ):
+                CookieBasedDetection = True
+
+            if (
+                e.type == "VULNERABILITY"
+                and e.data["description"]
+                == "Known Secret Found. 
Secret Type: [Express.js SESSION_SECRET] Secret: [keyboard cat] Product Type: [Express.js Signed Cookie] Product: [s%3A8FnPwdeM9kdGTZlWvdaVtQ0S1BCOhY5G.qys7H2oGSLLdRsEq7sqh7btOohHsaRKqyjV4LiVnBvc] Detecting Module: [ExpressSignedCookies]" + ): + CookieBasedDetection_2 = True + + assert SecretFound, "No secret found" + assert IdentifyOnly, "No crypto product identified" + assert CookieBasedDetection, "No JWT cookie detected" + assert CookieBasedDetection_2, "No Express.js cookie detected" diff --git a/bbot/test/test_step_1/module_tests/test_module_bevigil.py b/bbot/test/test_step_1/module_tests/test_module_bevigil.py new file mode 100644 index 0000000000..bceeecc4a9 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_bevigil.py @@ -0,0 +1,24 @@ +from .base import ModuleTestBase + + +class TestBeVigil(ModuleTestBase): + config_overrides = {"modules": {"bevigil": {"api_key": "asdf", "urls": True}}} + + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + url=f"https://osint.bevigil.com/api/blacklanternsecurity.com/subdomains/", + json={ + "domain": "blacklanternsecurity.com", + "subdomains": [ + "asdf.blacklanternsecurity.com", + ], + }, + ) + module_test.httpx_mock.add_response( + url=f"https://osint.bevigil.com/api/blacklanternsecurity.com/urls/", + json={"domain": "blacklanternsecurity.com", "urls": ["https://asdf.blacklanternsecurity.com"]}, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" + assert any(e.data == "https://asdf.blacklanternsecurity.com/" for e in events), "Failed to detect url" diff --git a/bbot/test/test_step_1/module_tests/test_module_binaryedge.py b/bbot/test/test_step_1/module_tests/test_module_binaryedge.py new file mode 100644 index 0000000000..4845413da0 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_binaryedge.py @@ -0,0 +1,31 @@ +from .base import ModuleTestBase + + +class TestBinaryEdge(ModuleTestBase): + config_overrides = {"modules": {"binaryedge": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url=f"https://api.binaryedge.io/v2/query/domains/subdomain/blacklanternsecurity.com", + json={ + "query": "blacklanternsecurity.com", + "page": 1, + "pagesize": 100, + "total": 1, + "events": [ + "asdf.blacklanternsecurity.com", + ], + }, + ) + module_test.httpx_mock.add_response( + url=f"https://api.binaryedge.io/v2/user/subscription", + json={ + "subscription": {"name": "Free"}, + "end_date": "2023-06-17", + "requests_left": 249, + "requests_plan": 250, + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_bucket_aws.py b/bbot/test/test_step_1/module_tests/test_module_bucket_aws.py new file mode 100644 index 0000000000..5be98dd86e --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_bucket_aws.py @@ -0,0 +1,93 @@ +import re + +from .base import ModuleTestBase +from bbot.core.helpers.misc import rand_string + +__all__ = ["random_bucket_name_1", "random_bucket_name_2", "random_bucket_name_3", "Bucket_AWS_Base"] + +# first one is a normal bucket +random_bucket_name_1 = rand_string(15, digits=False) +# second one is open/vulnerable +random_bucket_name_2 = rand_string(15, digits=False) +# third one is a mutation +random_bucket_name_3 = f"{random_bucket_name_2}-dev" + + +class 
Bucket_AWS_Base(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    provider = "aws"
+
+    random_bucket_1 = f"{random_bucket_name_1}.s3.amazonaws.com"
+    random_bucket_2 = f"{random_bucket_name_2}.s3-ap-southeast-2.amazonaws.com"
+    random_bucket_3 = f"{random_bucket_name_3}.s3.amazonaws.com"
+
+    # NOTE: the XML tags in this canned listing were stripped when the patch was
+    # flattened to text; the element names below follow the standard S3
+    # ListBucketResult schema around the surviving values
+    open_bucket_body = """<ListBucketResult xmlns="http://s3.amazonaws.com/doc/2006-03-01/"><Name>vpn-static</Name><Prefix></Prefix><MaxKeys>1000</MaxKeys><IsTruncated>false</IsTruncated><Contents><Key>style.css</Key><LastModified>2017-03-18T06:41:59.000Z</LastModified><ETag>"bf9e72bdab09b785f05ff0395023cc35"</ETag><Size>429</Size><StorageClass>STANDARD</StorageClass></Contents></ListBucketResult>"""
+
+    @property
+    def config_overrides(self):
+        return {"modules": {f"bucket_{self.provider}": {"permutations": True}}}
+
+    @property
+    def modules_overrides(self):
+        return ["excavate", "speculate", "httpx", f"bucket_{self.provider}"]
+
+    def url_setup(self):
+        self.url_1 = f"https://{self.random_bucket_1}"
+        self.url_2 = f"https://{self.random_bucket_2}"
+        self.url_3 = f"https://{self.random_bucket_3}"
+
+    def bucket_setup(self):
+        self.url_setup()
+        # reconstructed: the original markup was stripped; the page only needs to
+        # contain the two bucket URLs so that excavate picks them up
+        self.website_body = f"""
+        <a href="{self.url_1}"/>
+        <a href="{self.url_2}"/>
+        """
+
+    def setup_after_prep(self, module_test):
+        self.bucket_setup()
+        # patch mutations
+        module_test.scan.helpers.word_cloud.mutations = lambda b, cloud=False: [
+            (b, "dev"),
+        ]
+        module_test.set_expect_requests(
+            expect_args={"method": "GET", "uri": "/"}, respond_args={"response_data": self.website_body}
+        )
+        if module_test.module.supports_open_check:
+            module_test.httpx_mock.add_response(
+                url=self.url_2,
+                text=self.open_bucket_body,
+            )
+        module_test.httpx_mock.add_response(
+            url=self.url_3,
+            text="",
+        )
+        module_test.httpx_mock.add_response(url=re.compile(".*"), text="", status_code=404)
+
+    def check(self, module_test, events):
+        # make sure buckets were excavated
+        assert any(
+            e.type == "STORAGE_BUCKET" and str(e.module) == f"{self.provider}_cloud" for e in events
+        ), f'bucket not found for provider "{self.provider}"'
+        # make sure open buckets were found
+        if module_test.module.supports_open_check:
+            assert any(
+                e.type == "FINDING" and str(e.module) == f"bucket_{self.provider}" for e in events
+            ), f'open bucket not found for provider "{self.provider}"'
+            for e in events:
+                if e.type == "FINDING" and str(e.module) == f"bucket_{self.provider}":
+                    url = e.data.get("url", "")
+                    assert self.random_bucket_2 in url
+                    assert self.random_bucket_1 not in url
+                    assert self.random_bucket_3 not in url
+        # make sure bucket mutations were found
+        assert any(
+            e.type == "STORAGE_BUCKET"
+            and str(e.module) == f"bucket_{self.provider}"
+            and random_bucket_name_3 in e.data["url"]
+            for e in events
+        ), f'bucket (dev mutation) not found for provider "{self.provider}"'
+
+
+class TestBucket_AWS(Bucket_AWS_Base):
+    pass
diff --git a/bbot/test/test_step_1/module_tests/test_module_bucket_azure.py b/bbot/test/test_step_1/module_tests/test_module_bucket_azure.py
new file mode 100644
index 0000000000..3081462ba8
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_bucket_azure.py
@@ -0,0 +1,13 @@
+from .test_module_bucket_aws import *
+
+
+class TestBucket_Azure(Bucket_AWS_Base):
+    provider = "azure"
+    random_bucket_1 = f"{random_bucket_name_1}.blob.core.windows.net"
+    random_bucket_2 = f"{random_bucket_name_2}.blob.core.windows.net"
+    random_bucket_3 = f"{random_bucket_name_3}.blob.core.windows.net"
+
+    def url_setup(self):
+        self.url_1 = f"https://{self.random_bucket_1}"
+        self.url_2 = f"https://{self.random_bucket_2}"
+        self.url_3 = f"https://{self.random_bucket_3}/{random_bucket_name_3}?restype=container"
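Since Bucket_AWS_Base parameterizes the provider name into the scan config, the module list, and the event assertions, covering another storage provider mostly comes down to overriding the bucket hostname templates, as TestBucket_Azure does above. A sketch for a hypothetical provider (the provider name and bucket-hosting domain are invented):

    from .test_module_bucket_aws import *


    class TestBucket_Example(Bucket_AWS_Base):
        # "example" is a placeholder provider; a matching bucket_example BBOT
        # module would have to exist for this to run
        provider = "example"
        random_bucket_1 = f"{random_bucket_name_1}.buckets.example.com"
        random_bucket_2 = f"{random_bucket_name_2}.buckets.example.com"
        random_bucket_3 = f"{random_bucket_name_3}.buckets.example.com"
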
diff --git a/bbot/test/test_step_1/module_tests/test_module_bucket_digitalocean.py b/bbot/test/test_step_1/module_tests/test_module_bucket_digitalocean.py
new file mode 100644
index 0000000000..18d98b6413
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_bucket_digitalocean.py
@@ -0,0 +1,10 @@
+from .test_module_bucket_aws import *
+
+
+class TestBucket_DigitalOcean(Bucket_AWS_Base):
+    provider = "digitalocean"
+    random_bucket_1 = f"{random_bucket_name_1}.fra1.digitaloceanspaces.com"
+    random_bucket_2 = f"{random_bucket_name_2}.fra1.digitaloceanspaces.com"
+    random_bucket_3 = f"{random_bucket_name_3}.fra1.digitaloceanspaces.com"
+
+    # NOTE: rebuilt around the surviving values after the original XML tags were
+    # stripped; element names follow the S3-compatible ListBucketResult schema
+    open_bucket_body = """<ListBucketResult xmlns="http://s3.amazonaws.com/doc/2006-03-01/"><Name>cloud01</Name><Prefix></Prefix><MaxKeys>1000</MaxKeys><IsTruncated>false</IsTruncated><Contents><Key>test.doc</Key><LastModified>2020-10-14T15:23:37.545Z</LastModified><ETag>"4d25c8699f7347acc9f41e57148c62c0"</ETag><Size>13362425</Size><StorageClass>STANDARD</StorageClass><Owner><ID>1957883</ID><DisplayName>1957883</DisplayName></Owner><Type>Normal</Type></Contents></ListBucketResult>"""
diff --git a/bbot/test/test_step_1/module_tests/test_module_bucket_firebase.py b/bbot/test/test_step_1/module_tests/test_module_bucket_firebase.py
new file mode 100644
index 0000000000..f78f6cbc58
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_bucket_firebase.py
@@ -0,0 +1,13 @@
+from .test_module_bucket_aws import *
+
+
+class TestBucket_Firebase(Bucket_AWS_Base):
+    provider = "firebase"
+    random_bucket_1 = f"{random_bucket_name_1}.firebaseio.com"
+    random_bucket_2 = f"{random_bucket_name_2}.firebaseio.com"
+    random_bucket_3 = f"{random_bucket_name_3}.firebaseio.com"
+
+    def url_setup(self):
+        self.url_1 = f"https://{self.random_bucket_1}"
+        self.url_2 = f"https://{self.random_bucket_2}/.json"
+        self.url_3 = f"https://{self.random_bucket_3}/.json"
diff --git a/bbot/test/test_step_1/module_tests/test_module_bucket_gcp.py b/bbot/test/test_step_1/module_tests/test_module_bucket_gcp.py
new file mode 100644
index 0000000000..49e35b52e2
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_bucket_gcp.py
@@ -0,0 +1,27 @@
+from .test_module_bucket_aws import *
+
+
+class TestBucket_GCP(Bucket_AWS_Base):
+    provider = "gcp"
+    random_bucket_1 = f"{random_bucket_name_1}.storage.googleapis.com"
+    random_bucket_2 = f"{random_bucket_name_2}.storage.googleapis.com"
+    random_bucket_3 = f"{random_bucket_name_3}.storage.googleapis.com"
+    open_bucket_body = """{
+    "kind": "storage#testIamPermissionsResponse",
+    "permissions": [
+        "storage.objects.create",
+        "storage.objects.list"
+    ]
+}"""
+
+    def bucket_setup(self):
+        self.url_setup()
+        # reconstructed: the original markup was stripped; the page only needs to
+        # reference the two bucket hosts so that excavate discovers them
+        self.website_body = f"""
+        <a href="https://{self.random_bucket_1}"/>
+        <a href="https://{self.random_bucket_2}"/>
+        """
+
+    def url_setup(self):
+        self.url_1 = f"{random_bucket_name_1}.storage.googleapis.com"
+        self.url_2 = f"https://www.googleapis.com/storage/v1/b/{random_bucket_name_2}/iam/testPermissions?permissions=storage.buckets.setIamPolicy&permissions=storage.objects.list&permissions=storage.objects.get&permissions=storage.objects.create"
+        self.url_3 = f"https://www.googleapis.com/storage/v1/b/{random_bucket_name_3}"
diff --git a/bbot/test/test_step_1/module_tests/test_module_builtwith.py b/bbot/test/test_step_1/module_tests/test_module_builtwith.py
new file mode 100644
index 0000000000..5ff69993fd
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_builtwith.py
@@ -0,0 +1,110 @@
+from .base import ModuleTestBase
+
+
+class TestBuiltWith(ModuleTestBase):
+    config_overrides = {"modules": {"builtwith": {"api_key": "asdf"}}}
+
+    def setup_after_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url=f"https://api.builtwith.com/v20/api.json?KEY=asdf&LOOKUP=blacklanternsecurity.com&NOMETA=yes&NOATTR=yes&HIDETEXT=yes&HIDEDL=yes",
+            json={
+                "Results": [
+                    {
+                        "Result": {
+                            "IsDB": "True",
+                            "Spend": 734,
+                            "Paths": [
+                                {
+                                    "Technologies": [
+                                        {
+                                            "Name": "nginx",
+                                            "Tag": "Web Server",
+                                            "FirstDetected": 1533510000000,
+                                            "LastDetected": 1559516400000,
+                                            "IsPremium": 
"no", + }, + { + "Parent": "nginx", + "Name": "Nginx 1.14", + "Tag": "Web Server", + "FirstDetected": 1555542000000, + "LastDetected": 1559516400000, + "IsPremium": "no", + }, + { + "Name": "Domain Not Resolving", + "Tag": "hosting", + "FirstDetected": 1613894400000, + "LastDetected": 1633244400000, + "IsPremium": "no", + }, + ], + "FirstIndexed": 1533510000000, + "LastIndexed": 1633244400000, + "Domain": "blacklanternsecurity.com", + "Url": "", + "SubDomain": "asdf", + } + ], + }, + "Meta": { + "Majestic": 0, + "Umbrella": 0, + "Vertical": "", + "Social": None, + "CompanyName": None, + "Telephones": None, + "Emails": [], + "City": None, + "State": None, + "Postcode": None, + "Country": "US", + "Names": None, + "ARank": 6249242, + "QRank": -1, + }, + "Attributes": { + "Employees": 0, + "MJRank": 0, + "MJTLDRank": 0, + "RefSN": 0, + "RefIP": 0, + "Followers": 0, + "Sitemap": 0, + "GTMTags": 0, + "QubitTags": 0, + "TealiumTags": 0, + "AdobeTags": 0, + "CDimensions": 0, + "CGoals": 0, + "CMetrics": 0, + "ProductCount": 0, + }, + "FirstIndexed": 1389481200000, + "LastIndexed": 1684220400000, + "Lookup": "blacklanternsecurity.com", + "SalesRevenue": 0, + } + ], + "Errors": [], + "Trust": None, + }, + ) + module_test.httpx_mock.add_response( + url=f"https://api.builtwith.com/redirect1/api.json?KEY=asdf&LOOKUP=blacklanternsecurity.com", + json={ + "Lookup": "blacklanternsecurity.com", + "Inbound": [ + { + "Domain": "blacklanternsecurity.github.io", + "FirstDetected": 1564354800000, + "LastDetected": 1683783431121, + } + ], + "Outbound": None, + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" + assert any(e.data == "blacklanternsecurity.github.io" for e in events), "Failed to detect redirect" diff --git a/bbot/test/test_step_1/module_tests/test_module_bypass403.py b/bbot/test/test_step_1/module_tests/test_module_bypass403.py new file mode 100644 index 0000000000..7446352319 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_bypass403.py @@ -0,0 +1,50 @@ +import re +from .base import ModuleTestBase + + +class TestBypass403(ModuleTestBase): + targets = ["http://127.0.0.1:8888/test"] + modules_overrides = ["bypass403", "httpx"] + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/test..;/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + module_test.httpserver.no_handler_status_code = 403 + + def check(self, module_test, events): + findings = [e for e in events if e.type == "FINDING"] + assert len(findings) == 1 + finding = findings[0] + assert "http://127.0.0.1:8888/test..;/" in finding.data["description"] + + +class TestBypass403_aspnetcookieless(ModuleTestBase): + targets = ["http://127.0.0.1:8888/admin.aspx"] + modules_overrides = ["bypass403", "httpx"] + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": re.compile(r"\/\([sS]\(\w+\)\)\/.+\.aspx")} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + module_test.httpserver.no_handler_status_code = 403 + + def check(self, module_test, events): + findings = [e for e in events if e.type == "FINDING"] + assert len(findings) == 2 + assert all("(S(X))/admin.aspx" in e.data["description"] for e in findings) + + +class TestBypass403_waf(ModuleTestBase): + targets = ["http://127.0.0.1:8888/test"] + 
modules_overrides = ["bypass403", "httpx"] + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/test..;/"} + respond_args = {"response_data": "The requested URL was rejected"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + module_test.httpserver.no_handler_status_code = 403 + + def check(self, module_test, events): + findings = [e for e in events if e.type == "FINDING"] + assert not any(findings) diff --git a/bbot/test/test_step_1/module_tests/test_module_c99.py b/bbot/test/test_step_1/module_tests/test_module_c99.py new file mode 100644 index 0000000000..98c5e87652 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_c99.py @@ -0,0 +1,25 @@ +from .base import ModuleTestBase + + +class TestC99(ModuleTestBase): + config_overrides = {"modules": {"c99": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.c99.nl/randomnumber?key=asdf&between=1,100&json", + json={"success": True, "output": 65}, + ) + module_test.httpx_mock.add_response( + url="https://api.c99.nl/subdomainfinder?key=asdf&domain=blacklanternsecurity.com&json", + json={ + "success": True, + "subdomains": [ + {"subdomain": "asdf.blacklanternsecurity.com", "ip": "1.2.3.4", "cloudflare": True}, + ], + "cached": True, + "cache_time": "2023-05-19 03:13:05", + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_censys.py b/bbot/test/test_step_1/module_tests/test_module_censys.py new file mode 100644 index 0000000000..e2792e6131 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_censys.py @@ -0,0 +1,41 @@ +from .base import ModuleTestBase + + +class TestCensys(ModuleTestBase): + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://search.censys.io/api/v1/account", + json={ + "email": "info@blacklanternsecurity.com", + "login": "nope", + "first_login": "1917-08-03 20:03:55", + "last_login": "1918-05-19 01:15:22", + "quota": {"used": 26, "allowance": 250, "resets_at": "1919-06-03 16:30:32"}, + }, + ) + module_test.httpx_mock.add_response( + url="https://search.censys.io/api/v1/search/certificates", + match_content=b'{"query": "parsed.names: blacklanternsecurity.com", "page": 1, "fields": ["parsed.names"]}', + json={ + "status": "ok", + "metadata": { + "query": "parsed.names: blacklanternsecurity.com", + "count": 1, + "backend_time": 4465, + "page": 1, + "pages": 4, + }, + "results": [ + { + "parsed.names": [ + "asdf.blacklanternsecurity.com", + "zzzz.blacklanternsecurity.com", + ] + }, + ], + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" + assert any(e.data == "zzzz.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_certspotter.py b/bbot/test/test_step_1/module_tests/test_module_certspotter.py new file mode 100644 index 0000000000..fb6bb002c6 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_certspotter.py @@ -0,0 +1,14 @@ +from .base import ModuleTestBase + + +class TestCertspotter(ModuleTestBase): + def setup_after_prep(self, module_test): + module_test.module.abort_if = lambda e: False + for t in self.targets: + module_test.httpx_mock.add_response( + 
url="https://api.certspotter.com/v1/issuances?domain=blacklanternsecurity.com&include_subdomains=true&expand=dns_names", + json=[{"dns_names": ["*.asdf.blacklanternsecurity.com"]}], + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_crobat.py b/bbot/test/test_step_1/module_tests/test_module_crobat.py new file mode 100644 index 0000000000..c797541c27 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_crobat.py @@ -0,0 +1,12 @@ +from .base import ModuleTestBase + + +class TestCrobat(ModuleTestBase): + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://sonar.omnisint.io/subdomains/blacklanternsecurity.com", + json=["asdf.blacklanternsecurity.com"], + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_crt.py b/bbot/test/test_step_1/module_tests/test_module_crt.py new file mode 100644 index 0000000000..f7a13e98de --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_crt.py @@ -0,0 +1,15 @@ +from .base import ModuleTestBase + + +class TestCRT(ModuleTestBase): + def setup_after_prep(self, module_test): + module_test.module.abort_if = lambda e: False + for t in self.targets: + module_test.httpx_mock.add_response( + url="https://crt.sh?q=%25.blacklanternsecurity.com&output=json", + json=[{"id": 1, "name_value": "asdf.blacklanternsecurity.com\nzzzz.blacklanternsecurity.com"}], + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" + assert any(e.data == "zzzz.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_csv.py b/bbot/test/test_step_1/module_tests/test_module_csv.py new file mode 100644 index 0000000000..fc180d481b --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_csv.py @@ -0,0 +1,8 @@ +from .base import ModuleTestBase + + +class TestCSV(ModuleTestBase): + def check(self, module_test, events): + csv_file = module_test.scan.home / "output.csv" + with open(csv_file) as f: + assert "DNS_NAME,blacklanternsecurity.com,,TARGET" in f.read() diff --git a/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py b/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py new file mode 100644 index 0000000000..4b2617a6bb --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py @@ -0,0 +1,19 @@ +from .base import ModuleTestBase + + +class TestDNSCommonSRV(ModuleTestBase): + def setup_after_prep(self, module_test): + old_resolve_fn = module_test.scan.helpers.dns.resolve + + async def resolve(query, **kwargs): + if query == "_ldap._tcp.gc._msdcs.blacklanternsecurity.com" and kwargs.get("type", "").upper() == "SRV": + return {"asdf.blacklanternsecurity.com"} + return await old_resolve_fn(query, **kwargs) + + module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "resolve", resolve) + + def check(self, module_test, events): + assert any( + e.data == "_ldap._tcp.gc._msdcs.blacklanternsecurity.com" for e in events + ), "Failed to detect subdomain" + assert not any(e.data == "_ldap._tcp.dc._msdcs.blacklanternsecurity.com" for e in events), "False positive" diff --git 
a/bbot/test/test_step_1/module_tests/test_module_dnsdumpster.py b/bbot/test/test_step_1/module_tests/test_module_dnsdumpster.py
new file mode 100644
index 0000000000..b7b1067cf4
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_dnsdumpster.py
@@ -0,0 +1,18 @@
+from .base import ModuleTestBase
+
+
+class TestDNSDumpster(ModuleTestBase):
+    def setup_after_prep(self, module_test):
+        # NOTE: the original mocks embedded full copies of the DNSdumpster landing
+        # and results pages; their markup did not survive flattening, so the bodies
+        # below are trimmed to the pieces the module actually consumes
+        module_test.httpx_mock.add_response(
+            url=f"https://dnsdumpster.com",
+            headers={"Set-Cookie": "csrftoken=asdf"},
+            content=b'<input type="hidden" name="csrfmiddlewaretoken" value="asdf">',
+        )
+        module_test.httpx_mock.add_response(
+            url=f"https://dnsdumpster.com/",
+            method="POST",
+            content=b"Showing results for blacklanternsecurity.com "
+            b"ns01.domaincontrol.com 97.74.100.1 ns02.domaincontrol.com 173.201.68.1 "
+            b"asdf.blacklanternsecurity.com.mail.protection.outlook.com 104.47.55.138 "
+            b"asdf.blacklanternsecurity.com 143.244.156.80 64.227.8.231 192.34.56.157 "
+            b"192.241.216.208 167.71.95.71 157.245.247.197",
+        )
+
+    def check(self, module_test, events):
+        assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain"
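The GET mock above carries a csrftoken cookie because dnsdumpster.com is a Django application: the module has to pick up the CSRF token before it can submit the search form. Roughly, the handshake being simulated looks like this (a sketch using httpx directly; the form field and header names are assumptions, and the real module goes through BBOT's web helpers):

    import httpx

    def query_dnsdumpster(domain: str) -> str:
        # fetch the landing page for a CSRF token, then replay it in the POST
        with httpx.Client() as client:
            resp = client.get("https://dnsdumpster.com")
            csrftoken = resp.cookies.get("csrftoken", "")
            resp = client.post(
                "https://dnsdumpster.com/",
                headers={"Referer": "https://dnsdumpster.com"},
                cookies={"csrftoken": csrftoken},
                data={"csrfmiddlewaretoken": csrftoken, "targetip": domain},
            )
            return resp.text
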
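The zone-transfer test that follows monkeypatches dns.zone.from_xfr instead of talking to a real nameserver. For reference, this is approximately the dnspython call chain being stubbed out (a sketch; the module itself adds NS/A resolution and error handling around it):

    import dns.query
    import dns.zone

    def axfr_hostnames(nameserver_ip: str, domain: str) -> list:
        # request a full zone transfer (AXFR) from the authoritative nameserver;
        # raises if the server refuses or times out
        zone = dns.zone.from_xfr(dns.query.xfr(nameserver_ip, domain))
        # node names are relative to the origin ("@" is the origin itself)
        return [f"{name}.{domain}".lstrip("@.") for name in zone.nodes.keys()]
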
\n \n \n \n \n\n\n\n\n\n\n \n \n \n \n\n\n\n \n \n \n\n \n\n\n\n\n\n\n\n\n\n\n\n\n \n\n', + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py b/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py new file mode 100644 index 0000000000..f746ee717d --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py @@ -0,0 +1,56 @@ +import dns.zone +import dns.query +import dns.message +from types import SimpleNamespace + +from .base import ModuleTestBase + + +class TestDNSZoneTransfer(ModuleTestBase): + targets = ["blacklanternsecurity.fakedomain"] + config_overrides = {"dns_resolution": True} + + def setup_after_prep(self, module_test): + old_resolve_fn = module_test.scan.helpers.dns._resolve_hostname + + class MockRecord: + def __init__(self, record, rdtype): + self.rdtype = SimpleNamespace() + self.rdtype.name = rdtype + self.record = record + + def __str__(self): + return self.record + + def to_text(self): + return str(self) + + async def _resolve_hostname(query, **kwargs): + if query == "blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() == "NS": + return [MockRecord("ns01.blacklanternsecurity.fakedomain", "NS")], [] + if query == "ns01.blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() in "A": + return [MockRecord("127.0.0.1", "A")], [] + return await old_resolve_fn(query, **kwargs) + + def from_xfr(*args, **kwargs): + zone_text = """ +@ 600 IN SOA ns.blacklanternsecurity.fakedomain. admin.blacklanternsecurity.fakedomain. ( + 1 ; Serial + 3600 ; Refresh + 900 ; Retry + 604800 ; Expire + 86400 ) ; Minimum TTL +@ 600 IN NS ns.blacklanternsecurity.fakedomain. +@ 600 IN A 127.0.0.1 +asdf 600 IN A 127.0.0.1 +zzzz 600 IN AAAA dead::beef +""" + zone = dns.zone.from_text(zone_text, origin="blacklanternsecurity.fakedomain.") + return zone + + module_test.monkeypatch.setattr("dns.zone.from_xfr", from_xfr) + module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "_resolve_hostname", _resolve_hostname) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.fakedomain" for e in events), "Zone transfer failed" + assert any(e.data == "zzzz.blacklanternsecurity.fakedomain" for e in events), "Zone transfer failed" diff --git a/bbot/test/test_step_1/module_tests/test_module_emailformat.py b/bbot/test/test_step_1/module_tests/test_module_emailformat.py new file mode 100644 index 0000000000..ff1c0d3b36 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_emailformat.py @@ -0,0 +1,12 @@ +from .base import ModuleTestBase + + +class TestEmailFormat(ModuleTestBase): + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://www.email-format.com/d/blacklanternsecurity.com/", + text="
diff --git a/bbot/test/test_step_1/module_tests/test_module_emailformat.py b/bbot/test/test_step_1/module_tests/test_module_emailformat.py
new file mode 100644
index 0000000000..ff1c0d3b36
--- /dev/null
+++ b/bbot/test/test_step_1/module_tests/test_module_emailformat.py
@@ -0,0 +1,12 @@
+from .base import ModuleTestBase
+
+
+class TestEmailFormat(ModuleTestBase):
+    def setup_before_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url="https://www.email-format.com/d/blacklanternsecurity.com/",
+            text="info@blacklanternsecurity.com",
+        )
+
+    def check(self, module_test, events):
+        assert any(e.data == "info@blacklanternsecurity.com" for e in events), "Failed to detect email"
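The module under test here boils down to scraping addresses out of a rendered page, which is why the mock only needs to contain the address itself. A simplified sketch of that extraction (the regex is deliberately loose; BBOT's real email pattern lives in its helpers):

    import re

    EMAIL_RE = re.compile(r"[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Za-z]{2,}")

    def extract_emails(page_text):
        # dedupe and sort for stable output
        return sorted(set(EMAIL_RE.findall(page_text)))

    print(extract_emails("contact info@blacklanternsecurity.com for details"))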
info@blacklanternsecurity.com", + ) + + def check(self, module_test, events): + assert any(e.data == "info@blacklanternsecurity.com" for e in events), "Failed to detect email" diff --git a/bbot/test/test_step_1/module_tests/test_module_excavate.py b/bbot/test/test_step_1/module_tests/test_module_excavate.py new file mode 100644 index 0000000000..250506f5e1 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_excavate.py @@ -0,0 +1,141 @@ +from .base import ModuleTestBase + + +class TestExcavate(ModuleTestBase): + targets = ["http://127.0.0.1:8888/", "test.notreal", "http://127.0.0.1:8888/subdir/links.html"] + modules_overrides = ["excavate", "httpx"] + config_overrides = {"web_spider_distance": 1, "web_spider_depth": 1} + + def setup_before_prep(self, module_test): + response_data = """ + ftp://ftp.test.notreal + \\nhttps://www1.test.notreal + \\x3dhttps://www2.test.notreal + %0ahttps://www3.test.notreal + \\u000ahttps://www4.test.notreal + \nwww5.test.notreal + \\x3dwww6.test.notreal + %0awww7.test.notreal + \\u000awww8.test.notreal + + """ + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": response_data} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + # verify relatives path a-tag parsing is working correctly + + expect_args = {"method": "GET", "uri": "/subdir/links.html"} + respond_args = {"response_data": ""} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/relative.html"} + respond_args = {"response_data": ""} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + module_test.httpserver.no_handler_status_code = 404 + + def check(self, module_test, events): + event_data = [e.data for e in events] + assert "https://www1.test.notreal/" in event_data + assert "https://www2.test.notreal/" in event_data + assert "https://www3.test.notreal/" in event_data + assert "https://www4.test.notreal/" in event_data + assert "www1.test.notreal" in event_data + assert "www2.test.notreal" in event_data + assert "www3.test.notreal" in event_data + assert "www4.test.notreal" in event_data + assert "www5.test.notreal" in event_data + assert "www6.test.notreal" in event_data + assert "www7.test.notreal" in event_data + assert "www8.test.notreal" in event_data + assert "http://www9.test.notreal/" in event_data + + assert "nhttps://www1.test.notreal/" not in event_data + assert "x3dhttps://www2.test.notreal/" not in event_data + assert "a2https://www3.test.notreal/" not in event_data + assert "uac20https://www4.test.notreal/" not in event_data + assert "nwww5.test.notreal" not in event_data + assert "x3dwww6.test.notreal" not in event_data + assert "a2www7.test.notreal" not in event_data + assert "uac20www8.test.notreal" not in event_data + + assert any( + e.type == "FINDING" and e.data.get("description", "") == "Non-HTTP URI: ftp://ftp.test.notreal" + for e in events + ) + assert any( + e.type == "PROTOCOL" + and e.data.get("protocol", "") == "FTP" + and e.data.get("host", "") == "ftp.test.notreal" + for e in events + ) + + assert any( + e.type == "URL_UNVERIFIED" + and e.data == "http://127.0.0.1:8888/relative.html" + and "spider-danger" not in e.tags + for e in events + ) + + assert any( + e.type == "URL_UNVERIFIED" + and e.data == "http://127.0.0.1:8888/2/depth2.html" + and "spider-danger" in e.tags + for e in events + ) + + assert any( + e.type == "URL_UNVERIFIED" + and e.data == 
"http://127.0.0.1:8888/distance2.html" + and "spider-danger" in e.tags + for e in events + ) + + +class TestExcavate2(TestExcavate): + targets = ["http://127.0.0.1:8888/", "test.notreal", "http://127.0.0.1:8888/subdir/"] + + def setup_before_prep(self, module_test): + # root relative + expect_args = {"method": "GET", "uri": "/rootrelative.html"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + # page relative + expect_args = {"method": "GET", "uri": "/subdir/pagerelative.html"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/subdir/"} + respond_args = { + "response_data": "root relativepage relative" + } + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + module_test.httpserver.no_handler_status_code = 404 + + def check(self, module_test, events): + root_relative_detection = False + page_relative_detection = False + root_page_confusion_1 = False + root_page_confusion_2 = False + + for e in events: + if e.type == "URL_UNVERIFIED": + # these cases represent the desired behavior for parsing relative links + if e.data == "http://127.0.0.1:8888/rootrelative.html": + root_relative_detection = True + if e.data == "http://127.0.0.1:8888/subdir/pagerelative.html": + page_relative_detection = True + + # these cases indicates that excavate parsed the relative links incorrectly + if e.data == "http://127.0.0.1:8888/pagerelative.html": + root_page_confusion_1 = True + if e.data == "http://127.0.0.1:8888/subdir/rootrelative.html": + root_page_confusion_2 = True + + assert root_relative_detection, "Failed to properly excavate root-relative URL" + assert page_relative_detection, "Failed to properly excavate page-relative URL" + assert not root_page_confusion_1, "Incorrectly detected page-relative URL" + assert not root_page_confusion_2, "Incorrectly detected root-relative URL" diff --git a/bbot/test/test_step_1/module_tests/test_module_ffuf.py b/bbot/test/test_step_1/module_tests/test_module_ffuf.py new file mode 100644 index 0000000000..9da9805567 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_ffuf.py @@ -0,0 +1,45 @@ +from .base import ModuleTestBase, tempwordlist + + +class TestFFUF(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + test_wordlist = ["11111111", "admin", "junkword1", "zzzjunkword2"] + config_overrides = { + "modules": { + "ffuf": { + "wordlist": tempwordlist(test_wordlist), + } + } + } + modules_overrides = ["ffuf", "httpx"] + + def setup_before_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/admin"} + respond_args = {"response_data": "alive admin page"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any(e.type == "URL_UNVERIFIED" and "admin" in e.data for e in events) + assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events) + + +class TestFFUF2(TestFFUF): + test_wordlist = ["11111111", "console", "junkword1", "zzzjunkword2"] + config_overrides = {"modules": {"ffuf": {"wordlist": tempwordlist(test_wordlist), "extensions": "php"}}} + + def setup_before_prep(self, module_test): + expect_args = {"method": 
"GET", "uri": "/console.php"} + respond_args = {"response_data": "alive admin page"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any(e.type == "URL_UNVERIFIED" and "console" in e.data for e in events) + assert not any(e.type == "URL_UNVERIFIED" and "11111111" in e.data for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_ffuf_shortnames.py b/bbot/test/test_step_1/module_tests/test_module_ffuf_shortnames.py new file mode 100644 index 0000000000..09312dcee3 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_ffuf_shortnames.py @@ -0,0 +1,208 @@ +from .base import ModuleTestBase, tempwordlist + + +class TestFFUFShortnames(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + test_wordlist = ["11111111", "administrator", "portal", "console", "junkword1", "zzzjunkword2", "directory"] + config_overrides = { + "modules": { + "ffuf_shortnames": { + "find_common_prefixes": True, + "find_common_prefixes": True, + "wordlist": tempwordlist(test_wordlist), + } + } + } + modules_overrides = ["ffuf_shortnames", "httpx"] + + def setup_after_prep(self, module_test): + module_test.httpserver.no_handler_status_code = 404 + + seed_events = [] + parent_event = module_test.scan.make_event( + "http://127.0.0.1:8888/", + "URL", + module_test.scan.root_event, + module="httpx", + tags=["status-200", "distance-0"], + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ADMINI~1.ASP", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ADM_PO~1.ASP", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ABCZZZ~1.ASP", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ABCXXX~1.ASP", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ABCYYY~1.ASP", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ABCCON~1.ASP", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/DIRECT~1", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-directory"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/ADM_DI~1", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-directory"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/XYZDIR~1", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-directory"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/XYZAAA~1", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-directory"], + ) + ) + seed_events.append( + module_test.scan.make_event( + 
"http://127.0.0.1:8888/XYZBBB~1", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-directory"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/XYZCCC~1", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-directory"], + ) + ) + seed_events.append( + module_test.scan.make_event( + "http://127.0.0.1:8888/SHORT~1.PL", + "URL_HINT", + parent_event, + module="iis_shortnames", + tags=["shortname-file"], + ) + ) + module_test.scan.target._events["http://127.0.0.1:8888"] = seed_events + + expect_args = {"method": "GET", "uri": "/administrator.aspx"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/adm_portal.aspx"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/abcconsole.aspx"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/directory/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/adm_directory/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/xyzdirectory/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/short.pl"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + basic_detection = False + directory_detection = False + prefix_detection = False + delimeter_detection = False + directory_delimeter_detection = False + prefix_delimeter_detection = False + short_extensions_detection = False + + for e in events: + if e.type == "URL_UNVERIFIED": + if e.data == "http://127.0.0.1:8888/administrator.aspx": + basic_detection = True + if e.data == "http://127.0.0.1:8888/directory/": + directory_detection = True + if e.data == "http://127.0.0.1:8888/adm_portal.aspx": + prefix_detection = True + if e.data == "http://127.0.0.1:8888/abcconsole.aspx": + delimeter_detection = True + if e.data == "http://127.0.0.1:8888/abcconsole.aspx": + directory_delimeter_detection = True + if e.data == "http://127.0.0.1:8888/xyzdirectory/": + prefix_delimeter_detection = True + if e.data == "http://127.0.0.1:8888/short.pl": + short_extensions_detection = True + + assert basic_detection + assert directory_detection + assert prefix_detection + assert delimeter_detection + assert directory_delimeter_detection + assert prefix_delimeter_detection + assert short_extensions_detection diff --git a/bbot/test/test_step_1/module_tests/test_module_fingerprintx.py b/bbot/test/test_step_1/module_tests/test_module_fingerprintx.py new file mode 100644 index 0000000000..7e0cc3a169 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_fingerprintx.py @@ -0,0 +1,14 @@ +from .base import ModuleTestBase + + +class TestFingerprintx(ModuleTestBase): + targets = ["127.0.0.1:8888"] + + def check(self, module_test, events): + assert any( + event.type == "PROTOCOL" + and 
event.host == module_test.scan.helpers.make_ip_type("127.0.0.1") + and event.port == 8888 + and event.data["protocol"] == "HTTP" + for event in events + ), "HTTP protocol not detected" diff --git a/bbot/test/test_step_1/module_tests/test_module_fullhunt.py b/bbot/test/test_step_1/module_tests/test_module_fullhunt.py new file mode 100644 index 0000000000..bada14732a --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_fullhunt.py @@ -0,0 +1,48 @@ +from .base import ModuleTestBase + + +class TestFullhunt(ModuleTestBase): + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://fullhunt.io/api/v1/auth/status", + json={ + "message": "", + "status": 200, + "user": { + "company": "nightwatch", + "email": "jonsnow@nightwatch.notreal", + "first_name": "Jon", + "last_name": "Snow", + "plan": "free", + }, + "user_credits": { + "credits_usage": 0, + "max_results_per_request": 3000, + "remaining_credits": 100, + "total_credits_per_month": 100, + }, + }, + ) + module_test.httpx_mock.add_response( + url="https://fullhunt.io/api/v1/domain/blacklanternsecurity.com/subdomains", + json={ + "domain": "blacklanternsecurity.com", + "hosts": [ + "asdf.blacklanternsecurity.com", + ], + "message": "", + "metadata": { + "all_results_count": 11, + "available_results_for_user": 11, + "domain": "blacklanternsecurity.com", + "last_scanned": 1647083421, + "max_results_for_user": 3000, + "timestamp": 1684541940, + "user_plan": "free", + }, + "status": 200, + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py b/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_github.py b/bbot/test/test_step_1/module_tests/test_module_github.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_gowitness.py b/bbot/test/test_step_1/module_tests/test_module_gowitness.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_hackertarget.py b/bbot/test/test_step_1/module_tests/test_module_hackertarget.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_host_header.py b/bbot/test/test_step_1/module_tests/test_module_host_header.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_http.py b/bbot/test/test_step_1/module_tests/test_module_http.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_httpx.py b/bbot/test/test_step_1/module_tests/test_module_httpx.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_human.py b/bbot/test/test_step_1/module_tests/test_module_human.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_hunt.py b/bbot/test/test_step_1/module_tests/test_module_hunt.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_hunterio.py b/bbot/test/test_step_1/module_tests/test_module_hunterio.py new file mode 100644 index 0000000000..e69de29bb2 diff --git 
a/bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py b/bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py b/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_ipstack.py b/bbot/test/test_step_1/module_tests/test_module_ipstack.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_json.py b/bbot/test/test_step_1/module_tests/test_module_json.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_leakix.py b/bbot/test/test_step_1/module_tests/test_module_leakix.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_masscan.py b/bbot/test/test_step_1/module_tests/test_module_masscan.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_massdns.py b/bbot/test/test_step_1/module_tests/test_module_massdns.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_naabu.py b/bbot/test/test_step_1/module_tests/test_module_naabu.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_neo4j.py b/bbot/test/test_step_1/module_tests/test_module_neo4j.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_ntlm.py b/bbot/test/test_step_1/module_tests/test_module_ntlm.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_nuclei.py b/bbot/test/test_step_1/module_tests/test_module_nuclei.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_otx.py b/bbot/test/test_step_1/module_tests/test_module_otx.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py b/bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py b/bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py b/bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_passivetotal.py b/bbot/test/test_step_1/module_tests/test_module_passivetotal.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_pgp.py b/bbot/test/test_step_1/module_tests/test_module_pgp.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_python.py b/bbot/test/test_step_1/module_tests/test_module_python.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_rapiddns.py b/bbot/test/test_step_1/module_tests/test_module_rapiddns.py new file mode 100644 index 0000000000..e69de29bb2 diff --git 
a/bbot/test/test_step_1/module_tests/test_module_riddler.py b/bbot/test/test_step_1/module_tests/test_module_riddler.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_robots.py b/bbot/test/test_step_1/module_tests/test_module_robots.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_secretsdb.py b/bbot/test/test_step_1/module_tests/test_module_secretsdb.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_securitytrails.py b/bbot/test/test_step_1/module_tests/test_module_securitytrails.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_services.py b/bbot/test/test_step_1/module_tests/test_module_services.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_shodan_dns.py b/bbot/test/test_step_1/module_tests/test_module_shodan_dns.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_skymem.py b/bbot/test/test_step_1/module_tests/test_module_skymem.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_smuggler.py b/bbot/test/test_step_1/module_tests/test_module_smuggler.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_social.py b/bbot/test/test_step_1/module_tests/test_module_social.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_speculate.py b/bbot/test/test_step_1/module_tests/test_module_speculate.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_sslcert.py b/bbot/test/test_step_1/module_tests/test_module_sslcert.py new file mode 100644 index 0000000000..d443dfb618 --- /dev/null +++ b/bbot/test/test_step_1/module_tests/test_module_sslcert.py @@ -0,0 +1,8 @@ +from .base import ModuleTestBase + + +class TestSSLCert(ModuleTestBase): + targets = ["8.8.8.8:443"] + + def check(self, module_test, events): + assert any(e.data == "dns.google" and str(e.module) == "sslcert" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py b/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_sublist3r.py b/bbot/test/test_step_1/module_tests/test_module_sublist3r.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_telerik.py b/bbot/test/test_step_1/module_tests/test_module_telerik.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_threatminer.py b/bbot/test/test_step_1/module_tests/test_module_threatminer.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_url_manipulation.py b/bbot/test/test_step_1/module_tests/test_module_url_manipulation.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_urlscan.py b/bbot/test/test_step_1/module_tests/test_module_urlscan.py new file mode 100644 index 0000000000..e69de29bb2 diff --git 
a/bbot/test/test_step_1/module_tests/test_module_vhost.py b/bbot/test/test_step_1/module_tests/test_module_vhost.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_viewdns.py b/bbot/test/test_step_1/module_tests/test_module_viewdns.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_virustotal.py b/bbot/test/test_step_1/module_tests/test_module_virustotal.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_wafw00f.py b/bbot/test/test_step_1/module_tests/test_module_wafw00f.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_wappalyzer.py b/bbot/test/test_step_1/module_tests/test_module_wappalyzer.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_wayback.py b/bbot/test/test_step_1/module_tests/test_module_wayback.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_web_report.py b/bbot/test/test_step_1/module_tests/test_module_web_report.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_websocket.py b/bbot/test/test_step_1/module_tests/test_module_websocket.py new file mode 100644 index 0000000000..e69de29bb2 diff --git a/bbot/test/test_step_1/module_tests/test_module_zoomeye.py b/bbot/test/test_step_1/module_tests/test_module_zoomeye.py new file mode 100644 index 0000000000..e69de29bb2 From cb95e10efc2c0f84427f0392bec3988eb77b647b Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Fri, 19 May 2023 20:25:49 -0400 Subject: [PATCH 029/387] removed duplicate tests --- bbot/test/test_step_1/module_tests/__init__.py | 12 ------------ 1 file changed, 12 deletions(-) diff --git a/bbot/test/test_step_1/module_tests/__init__.py b/bbot/test/test_step_1/module_tests/__init__.py index 0b098d46a2..e69de29bb2 100644 --- a/bbot/test/test_step_1/module_tests/__init__.py +++ b/bbot/test/test_step_1/module_tests/__init__.py @@ -1,12 +0,0 @@ -from pathlib import Path - -from bbot.modules import module_loader - -parent_dir = Path(__file__).parent - -module_test_files = list(parent_dir.glob("test_module_*.py")) -module_test_files = [m.name.split("test_module_")[-1].split(".")[0] for m in module_test_files] - -for module_name in module_loader.preloaded(): - module_name = module_name.lower() - assert module_name in module_test_files, f'No test file found for module "{module_name}"' From a2943d858eb68d122b0906618bc95f9ab6f317eb Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sat, 20 May 2023 00:00:42 -0400 Subject: [PATCH 030/387] gowitness and github tests --- bbot/modules/github.py | 4 +- bbot/test/conftest.py | 2 +- bbot/test/modules_test_classes.py | 38 ------- .../module_tests/test_module_github.py | 100 ++++++++++++++++++ .../module_tests/test_module_gowitness.py | 42 ++++++++ 5 files changed, 145 insertions(+), 41 deletions(-) diff --git a/bbot/modules/github.py b/bbot/modules/github.py index 9fddf0393e..f6a933ea50 100644 --- a/bbot/modules/github.py +++ b/bbot/modules/github.py @@ -42,7 +42,7 @@ async def query(self, query): try: async for r in agen: if r is None: - continue + break status_code = getattr(r, "status_code", 0) if status_code == 429: "Github is rate-limiting us (HTTP status: 429)" @@ -51,7 +51,7 @@ async def query(self, query): j = r.json() except Exception as e: 
self.warning(f"Failed to decode JSON for {r.url} (HTTP status: {status_code}): {e}") - continue + break items = j.get("items", []) if not items: break diff --git a/bbot/test/conftest.py b/bbot/test/conftest.py index 0aca0ff1bd..c3cdb78766 100644 --- a/bbot/test/conftest.py +++ b/bbot/test/conftest.py @@ -14,7 +14,7 @@ def pytest_sessionfinish(session, exitstatus): logger.removeHandler(handler) # Wipe out BBOT home dir - shutil.rmtree("/tmp/.bbot_test", ignore_errors=True) + # shutil.rmtree("/tmp/.bbot_test", ignore_errors=True) yield diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py index a4a7665ebf..e6ac6b67fe 100644 --- a/bbot/test/modules_test_classes.py +++ b/bbot/test/modules_test_classes.py @@ -34,44 +34,6 @@ def check_events(self, events): assert open_port, "Failed to visit target OPEN_TCP_PORT" -class Gowitness(HttpxMockHelper): - additional_modules = ["httpx"] - import shutil - from pathlib import Path - - home_dir = Path("/tmp/.bbot_gowitness_test") - shutil.rmtree(home_dir, ignore_errors=True) - config_overrides = {"force_deps": True, "home": str(home_dir)} - - def mock_args(self): - respond_args = { - "response_data": """BBOT is life - - - -""", - "headers": {"Server": "Apache/2.4.41 (Ubuntu)"}, - } - self.set_expect_requests(respond_args=respond_args) - - def check_events(self, events): - screenshots_path = self.home_dir / "scans" / "gowitness_test" / "gowitness" / "screenshots" - screenshots = list(screenshots_path.glob("*.png")) - assert screenshots, f"No .png files found at {screenshots_path}" - url = False - webscreenshot = False - technology = False - for event in events: - if event.type == "URL_UNVERIFIED": - url = True - elif event.type == "WEBSCREENSHOT": - webscreenshot = True - elif event.type == "TECHNOLOGY": - technology = True - assert url, "No URL emitted" - assert webscreenshot, "No WEBSCREENSHOT emitted" - assert technology, "No TECHNOLOGY emitted" - class Subdomain_Hijack(HttpxMockHelper): additional_modules = ["httpx", "excavate"] diff --git a/bbot/test/test_step_1/module_tests/test_module_github.py b/bbot/test/test_step_1/module_tests/test_module_github.py index e69de29bb2..52f8154e9f 100644 --- a/bbot/test/test_step_1/module_tests/test_module_github.py +++ b/bbot/test/test_step_1/module_tests/test_module_github.py @@ -0,0 +1,100 @@ +from .base import ModuleTestBase + + +class TestGithub(ModuleTestBase): + config_overrides = {"omit_event_types": [], "scope_report_distance": 1} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response(url="https://api.github.com/zen") + module_test.httpx_mock.add_response( + url="https://api.github.com/search/code?per_page=100&type=Code&q=blacklanternsecurity.com&page=1", + json={ + "total_count": 214, + "incomplete_results": False, + "items": [ + { + "name": "main.go", + "path": "v2/cmd/cve-annotate/main.go", + "sha": "4aa7c9ec68acb4c603d4b9163bf7ed42de1939fe", + "url": "https://api.github.com/repositories/252813491/contents/v2/cmd/cve-annotate/main.go?ref=06f242e5fce3439b7418877676810cbf57934875", + "git_url": "https://api.github.com/repositories/252813491/git/blobs/4aa7c9ec68acb4c603d4b9163bf7ed42de1939fe", + "html_url": "https://github.com/projectdiscovery/nuclei/blob/06f242e5fce3439b7418877676810cbf57934875/v2/cmd/cve-annotate/main.go", + "repository": { + "id": 252813491, + "node_id": "MDEwOlJlcG9zaXRvcnkyNTI4MTM0OTE=", + "name": "nuclei", + "full_name": "projectdiscovery/nuclei", + "private": False, + "owner": { + "login": "projectdiscovery", + "id": 50994705, 
+ "node_id": "MDEyOk9yZ2FuaXphdGlvbjUwOTk0NzA1", + "avatar_url": "https://avatars.githubusercontent.com/u/50994705?v=4", + "gravatar_id": "", + "url": "https://api.github.com/users/projectdiscovery", + "html_url": "https://github.com/projectdiscovery", + "followers_url": "https://api.github.com/users/projectdiscovery/followers", + "following_url": "https://api.github.com/users/projectdiscovery/following{/other_user}", + "gists_url": "https://api.github.com/users/projectdiscovery/gists{/gist_id}", + "starred_url": "https://api.github.com/users/projectdiscovery/starred{/owner}{/repo}", + "subscriptions_url": "https://api.github.com/users/projectdiscovery/subscriptions", + "organizations_url": "https://api.github.com/users/projectdiscovery/orgs", + "repos_url": "https://api.github.com/users/projectdiscovery/repos", + "events_url": "https://api.github.com/users/projectdiscovery/events{/privacy}", + "received_events_url": "https://api.github.com/users/projectdiscovery/received_events", + "type": "Organization", + "site_admin": False, + }, + "html_url": "https://github.com/projectdiscovery/nuclei", + "description": "Fast and customizable vulnerability scanner based on simple YAML based DSL.", + "fork": False, + "url": "https://api.github.com/repos/projectdiscovery/nuclei", + "forks_url": "https://api.github.com/repos/projectdiscovery/nuclei/forks", + "keys_url": "https://api.github.com/repos/projectdiscovery/nuclei/keys{/key_id}", + "collaborators_url": "https://api.github.com/repos/projectdiscovery/nuclei/collaborators{/collaborator}", + "teams_url": "https://api.github.com/repos/projectdiscovery/nuclei/teams", + "hooks_url": "https://api.github.com/repos/projectdiscovery/nuclei/hooks", + "issue_events_url": "https://api.github.com/repos/projectdiscovery/nuclei/issues/events{/number}", + "events_url": "https://api.github.com/repos/projectdiscovery/nuclei/events", + "assignees_url": "https://api.github.com/repos/projectdiscovery/nuclei/assignees{/user}", + "branches_url": "https://api.github.com/repos/projectdiscovery/nuclei/branches{/branch}", + "tags_url": "https://api.github.com/repos/projectdiscovery/nuclei/tags", + "blobs_url": "https://api.github.com/repos/projectdiscovery/nuclei/git/blobs{/sha}", + "git_tags_url": "https://api.github.com/repos/projectdiscovery/nuclei/git/tags{/sha}", + "git_refs_url": "https://api.github.com/repos/projectdiscovery/nuclei/git/refs{/sha}", + "trees_url": "https://api.github.com/repos/projectdiscovery/nuclei/git/trees{/sha}", + "statuses_url": "https://api.github.com/repos/projectdiscovery/nuclei/statuses/{sha}", + "languages_url": "https://api.github.com/repos/projectdiscovery/nuclei/languages", + "stargazers_url": "https://api.github.com/repos/projectdiscovery/nuclei/stargazers", + "contributors_url": "https://api.github.com/repos/projectdiscovery/nuclei/contributors", + "subscribers_url": "https://api.github.com/repos/projectdiscovery/nuclei/subscribers", + "subscription_url": "https://api.github.com/repos/projectdiscovery/nuclei/subscription", + "commits_url": "https://api.github.com/repos/projectdiscovery/nuclei/commits{/sha}", + "git_commits_url": "https://api.github.com/repos/projectdiscovery/nuclei/git/commits{/sha}", + "comments_url": "https://api.github.com/repos/projectdiscovery/nuclei/comments{/number}", + "issue_comment_url": "https://api.github.com/repos/projectdiscovery/nuclei/issues/comments{/number}", + "contents_url": "https://api.github.com/repos/projectdiscovery/nuclei/contents/{+path}", + "compare_url": 
"https://api.github.com/repos/projectdiscovery/nuclei/compare/{base}...{head}", + "merges_url": "https://api.github.com/repos/projectdiscovery/nuclei/merges", + "archive_url": "https://api.github.com/repos/projectdiscovery/nuclei/{archive_format}{/ref}", + "downloads_url": "https://api.github.com/repos/projectdiscovery/nuclei/downloads", + "issues_url": "https://api.github.com/repos/projectdiscovery/nuclei/issues{/number}", + "pulls_url": "https://api.github.com/repos/projectdiscovery/nuclei/pulls{/number}", + "milestones_url": "https://api.github.com/repos/projectdiscovery/nuclei/milestones{/number}", + "notifications_url": "https://api.github.com/repos/projectdiscovery/nuclei/notifications{?since,all,participating}", + "labels_url": "https://api.github.com/repos/projectdiscovery/nuclei/labels{/name}", + "releases_url": "https://api.github.com/repos/projectdiscovery/nuclei/releases{/id}", + "deployments_url": "https://api.github.com/repos/projectdiscovery/nuclei/deployments", + }, + "score": 1.0, + } + ], + }, + ) + + def check(self, module_test, events): + assert any( + e.data + == "https://raw.githubusercontent.com/projectdiscovery/nuclei/06f242e5fce3439b7418877676810cbf57934875/v2/cmd/cve-annotate/main.go" + for e in events + ), "Failed to detect URL" diff --git a/bbot/test/test_step_1/module_tests/test_module_gowitness.py b/bbot/test/test_step_1/module_tests/test_module_gowitness.py index e69de29bb2..278eb21a3f 100644 --- a/bbot/test/test_step_1/module_tests/test_module_gowitness.py +++ b/bbot/test/test_step_1/module_tests/test_module_gowitness.py @@ -0,0 +1,42 @@ +from .base import ModuleTestBase + + +class TestGowitness(ModuleTestBase): + targets = ["127.0.0.1:8888"] + modules_overrides = ["gowitness", "httpx"] + import shutil + from pathlib import Path + + home_dir = Path("/tmp/.bbot_gowitness_test") + shutil.rmtree(home_dir, ignore_errors=True) + config_overrides = {"force_deps": True, "home": str(home_dir)} + + def setup_after_prep(self, module_test): + respond_args = { + "response_data": """BBOT is life + + + +""", + "headers": {"Server": "Apache/2.4.41 (Ubuntu)"}, + } + module_test.set_expect_requests(respond_args=respond_args) + + + def check(self, module_test, events): + screenshots_path = self.home_dir / "scans" / module_test.scan.name / "gowitness" / "screenshots" + screenshots = list(screenshots_path.glob("*.png")) + assert screenshots, f"No .png files found at {screenshots_path}" + url = False + webscreenshot = False + technology = False + for event in events: + if event.type == "URL_UNVERIFIED": + url = True + elif event.type == "WEBSCREENSHOT": + webscreenshot = True + elif event.type == "TECHNOLOGY": + technology = True + assert url, "No URL emitted" + assert webscreenshot, "No WEBSCREENSHOT emitted" + assert technology, "No TECHNOLOGY emitted" From 906d944198cfec136bd8e90d527c5cea702e64ca Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sat, 20 May 2023 12:13:41 -0400 Subject: [PATCH 031/387] more module tests --- bbot/modules/hackertarget.py | 6 +- bbot/modules/hunterio.py | 30 +- bbot/test/bbot_fixtures.py | 13 + bbot/test/conftest.py | 2 +- bbot/test/modules_test_classes.py | 1377 ----------------- .../module_tests/test_module_generic_ssrf.py | 6 + .../module_tests/test_module_gowitness.py | 1 - .../module_tests/test_module_hackertarget.py | 13 + .../module_tests/test_module_host_header.py | 6 + .../module_tests/test_module_http.py | 24 + .../module_tests/test_module_httpx.py | 29 + .../module_tests/test_module_human.py | 8 + 
.../module_tests/test_module_hunt.py | 17 + .../module_tests/test_module_hunterio.py | 96 ++ .../test_module_iis_shortnames.py | 56 + bbot/test/test_step_1/test_modules_full.py | 234 --- bbot/test/test_step_2/test_scope.py | 46 +- bbot/test/test_step_2/test_web.py | 5 + 18 files changed, 304 insertions(+), 1665 deletions(-) delete mode 100644 bbot/test/modules_test_classes.py delete mode 100644 bbot/test/test_step_1/test_modules_full.py diff --git a/bbot/modules/hackertarget.py b/bbot/modules/hackertarget.py index 38ff695818..8392110340 100644 --- a/bbot/modules/hackertarget.py +++ b/bbot/modules/hackertarget.py @@ -9,8 +9,10 @@ class hackertarget(crobat): base_url = "https://api.hackertarget.com" - def request_url(self, query): - return self.request_with_fail_count(f"{self.base_url}/hostsearch/?q={self.helpers.quote(query)}") + async def request_url(self, query): + url = f"{self.base_url}/hostsearch/?q={self.helpers.quote(query)}" + response = await self.request_with_fail_count(url) + return response def parse_results(self, r, query): for line in r.text.splitlines(): diff --git a/bbot/modules/hunterio.py b/bbot/modules/hunterio.py index 845488844c..8bb9f74744 100644 --- a/bbot/modules/hunterio.py +++ b/bbot/modules/hunterio.py @@ -10,19 +10,17 @@ class hunterio(shodan_dns): options_desc = {"api_key": "Hunter.IO API key"} base_url = "https://api.hunter.io/v2" + limit = 100 - def setup(self): - self.limit = 100 - return super().setup() - - def ping(self): - r = self.helpers.request(f"{self.base_url}/account?api_key={self.api_key}") + async def ping(self): + url = f"{self.base_url}/account?api_key={self.api_key}" + r = await self.helpers.request(url) resp_content = getattr(r, "text", "") assert getattr(r, "status_code", 0) == 200, resp_content - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - for entry in self.query(query): + for entry in await self.query(query): email = entry.get("value", "") sources = entry.get("sources", []) if email: @@ -37,15 +35,19 @@ def handle_event(self, event): if url: self.emit_event(url, "URL_UNVERIFIED", email_event) - def query(self, query): + async def query(self, query): emails = [] url = ( f"{self.base_url}/domain-search?domain={query}&api_key={self.api_key}" + "&limit={page_size}&offset={offset}" ) - for j in self.helpers.api_page_iter(url, page_size=self.limit): - new_emails = j.get("data", {}).get("emails", []) - if not new_emails: - break - emails += new_emails + agen = self.helpers.api_page_iter(url, page_size=self.limit) + try: + async for j in agen: + new_emails = j.get("data", {}).get("emails", []) + if not new_emails: + break + emails += new_emails + finally: + agen.aclose() return emails diff --git a/bbot/test/bbot_fixtures.py b/bbot/test/bbot_fixtures.py index 2b0553475a..f30710b5b0 100644 --- a/bbot/test/bbot_fixtures.py +++ b/bbot/test/bbot_fixtures.py @@ -336,3 +336,16 @@ def install_all_python_deps(): for module in module_loader.preloaded().values(): deps_pip.update(set(module.get("deps", {}).get("pip", []))) subprocess.run([sys.executable, "-m", "pip", "install"] + list(deps_pip)) + + +def tempwordlist(content): + tmp_path = "/tmp/.bbot_test/" + from bbot.core.helpers.misc import rand_string, mkdir + + mkdir(tmp_path) + filename = f"{tmp_path}{rand_string(8)}" + with open(filename, "w", errors="ignore") as f: + for c in content: + line = f"{c}\n" + f.write(line) + return filename diff --git a/bbot/test/conftest.py b/bbot/test/conftest.py index c3cdb78766..0aca0ff1bd 100644 --- 
a/bbot/test/conftest.py +++ b/bbot/test/conftest.py @@ -14,7 +14,7 @@ def pytest_sessionfinish(session, exitstatus): logger.removeHandler(handler) # Wipe out BBOT home dir - # shutil.rmtree("/tmp/.bbot_test", ignore_errors=True) + shutil.rmtree("/tmp/.bbot_test", ignore_errors=True) yield diff --git a/bbot/test/modules_test_classes.py b/bbot/test/modules_test_classes.py deleted file mode 100644 index e6ac6b67fe..0000000000 --- a/bbot/test/modules_test_classes.py +++ /dev/null @@ -1,1377 +0,0 @@ -import re -import json -import logging - -from .helpers import * - -log = logging.getLogger(f"bbot.test") - - -class Httpx(HttpxMockHelper): - targets = ["http://127.0.0.1:8888/url", "127.0.0.1:8888"] - - def mock_args(self): - request_args = dict(uri="/", headers={"test": "header"}) - respond_args = dict(response_data=json.dumps({"open": "port"})) - self.set_expect_requests(request_args, respond_args) - request_args = dict(uri="/url", headers={"test": "header"}) - respond_args = dict(response_data=json.dumps({"url": "url"})) - self.set_expect_requests(request_args, respond_args) - - def check_events(self, events): - url = False - open_port = False - for e in events: - if e.type == "HTTP_RESPONSE": - j = json.loads(e.data["body"]) - if e.data["path"] == "/": - if j.get("open", "") == "port": - open_port = True - elif e.data["path"] == "/url": - if j.get("url", "") == "url": - url = True - assert url, "Failed to visit target URL" - assert open_port, "Failed to visit target OPEN_TCP_PORT" - - - -class Subdomain_Hijack(HttpxMockHelper): - additional_modules = ["httpx", "excavate"] - - def mock_args(self): - fingerprints = self.module.fingerprints - assert fingerprints, "No subdomain hijacking fingerprints available" - fingerprint = next(iter(fingerprints)) - rand_string = self.scan.helpers.rand_string(length=15, digits=False) - self.rand_subdomain = f"{rand_string}.{next(iter(fingerprint.domains))}" - respond_args = {"response_data": f''} - self.set_expect_requests(respond_args=respond_args) - - def check_events(self, events): - assert any( - event.type == "FINDING" - and event.data["description"].startswith("Hijackable Subdomain") - and self.rand_subdomain in event.data["description"] - and event.data["host"] == self.rand_subdomain - for event in events - ), f"No hijackable subdomains in {events}" - - -class Fingerprintx(HttpxMockHelper): - targets = ["127.0.0.1:8888"] - - def mock_args(self): - pass - - def check_events(self, events): - assert any( - event.type == "PROTOCOL" - and event.host == self.scan.helpers.make_ip_type("127.0.0.1") - and event.port == 8888 - and event.data["protocol"] == "HTTP" - for event in events - ), "HTTP protocol not detected" - - -class Otx(RequestMockHelper): - def mock_args(self): - for t in self.targets: - self.httpx_mock.add_response( - url=f"https://otx.alienvault.com/api/v1/indicators/domain/{t}/passive_dns", - json={ - "passive_dns": [ - { - "address": "2606:50c0:8000::153", - "first": "2021-10-28T20:23:08", - "last": "2022-08-24T18:29:49", - "hostname": "asdf.blacklanternsecurity.com", - "record_type": "AAAA", - "indicator_link": "/indicator/hostname/www.blacklanternsecurity.com", - "flag_url": "assets/images/flags/us.png", - "flag_title": "United States", - "asset_type": "hostname", - "asn": "AS54113 fastly", - } - ] - }, - ) - - def check_events(self, events): - assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" - - -class Anubisdb(RequestMockHelper): - def setup(self, scan): - self.module.abort_if = lambda e: 
False - - def mock_args(self): - for t in self.targets: - self.httpx_mock.add_response( - url=f"https://jldc.me/anubis/subdomains/{t}", - json=["asdf.blacklanternsecurity.com", "zzzz.blacklanternsecurity.com"], - ) - - def check_events(self, events): - assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" - - -class SecretsDB(HttpxMockHelper): - additional_modules = ["httpx"] - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "-----BEGIN PGP PRIVATE KEY BLOCK-----"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "FINDING" for e in events) - - -class Badsecrets(HttpxMockHelper): - targets = [ - "http://127.0.0.1:8888/", - "http://127.0.0.1:8888/test.aspx", - "http://127.0.0.1:8888/cookie.aspx", - "http://127.0.0.1:8888/cookie2.aspx", - ] - - sample_viewstate = """ -
-    [form markup with the known-key __VIEWSTATE sample: content lost in extraction]
-    """
-
-    sample_viewstate_notvuln = """
-    [form markup with the non-vulnerable __VIEWSTATE sample: content lost in extraction]
- - -""" - - additional_modules = ["httpx"] - - def mock_args(self): - expect_args = {"uri": "/test.aspx"} - respond_args = {"response_data": self.sample_viewstate} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - respond_args = {"response_data": self.sample_viewstate_notvuln} - self.set_expect_requests(respond_args=respond_args) - - expect_args = {"uri": "/cookie.aspx"} - respond_args = { - "response_data": "

JWT Cookie Test

", - "headers": { - "set-cookie": "vulnjwt=eyJhbGciOiJIUzI1NiJ9.eyJJc3N1ZXIiOiJJc3N1ZXIiLCJVc2VybmFtZSI6IkJhZFNlY3JldHMiLCJleHAiOjE1OTMxMzM0ODMsImlhdCI6MTQ2NjkwMzA4M30.ovqRikAo_0kKJ0GVrAwQlezymxrLGjcEiW_s3UJMMCo; secure" - }, - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"uri": "/cookie2.aspx"} - respond_args = { - "response_data": "

Express Cookie Test

", - "headers": { - "set-cookie": "connect.sid=s%3A8FnPwdeM9kdGTZlWvdaVtQ0S1BCOhY5G.qys7H2oGSLLdRsEq7sqh7btOohHsaRKqyjV4LiVnBvc; Path=/; Expires=Wed, 05 Apr 2023 04:47:29 GMT; HttpOnly" - }, - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - SecretFound = False - IdentifyOnly = False - CookieBasedDetection = False - CookieBasedDetection_2 = False - - for e in events: - if ( - e.type == "VULNERABILITY" - and e.data["description"] - == "Known Secret Found. Secret Type: [ASP.NET MachineKey] Secret: [validationKey: 0F97BAE23F6F36801ABDB5F145124E00A6F795A97093D778EE5CD24F35B78B6FC4C0D0D4420657689C4F321F8596B59E83F02E296E970C4DEAD2DFE226294979 validationAlgo: SHA1 encryptionKey: 8CCFBC5B7589DD37DC3B4A885376D7480A69645DAEEC74F418B4877BEC008156 encryptionAlgo: AES] Product Type: [ASP.NET Viewstate] Product: [rJdyYspajyiWEjvZ/SMXsU/1Q6Dp1XZ/19fZCABpGqWu+s7F1F/JT1s9mP9ED44fMkninhDc8eIq7IzSllZeJ9JVUME41i8ozheGunVSaESf4nBu] Detecting Module: [ASPNET_Viewstate]" - ): - SecretFound = True - - if ( - e.type == "FINDING" - and e.data["description"] - == "Cryptographic Product identified. Product Type: [ASP.NET Viewstate] Product: [AAAAYspajyiWEjvZ/SMXsU/1Q6Dp1XZ/19fZCABpGqWu+s7F1F/JT1s9mP9ED44fMkninhDc8eIq7IzSllZeJ9JVUME41i8ozheGunVSaESfAAAA] Detecting Module: [ASPNET_Viewstate]" - ): - IdentifyOnly = True - - if ( - e.type == "VULNERABILITY" - and e.data["description"] - == "Known Secret Found. Secret Type: [HMAC/RSA Key] Secret: [1234] Product Type: [JSON Web Token (JWT)] Product: [eyJhbGciOiJIUzI1NiJ9.eyJJc3N1ZXIiOiJJc3N1ZXIiLCJVc2VybmFtZSI6IkJhZFNlY3JldHMiLCJleHAiOjE1OTMxMzM0ODMsImlhdCI6MTQ2NjkwMzA4M30.ovqRikAo_0kKJ0GVrAwQlezymxrLGjcEiW_s3UJMMCo] Detecting Module: [Generic_JWT]" - ): - CookieBasedDetection = True - - if ( - e.type == "VULNERABILITY" - and e.data["description"] - == "Known Secret Found. Secret Type: [Express.js SESSION_SECRET] Secret: [keyboard cat] Product Type: [Express.js Signed Cookie] Product: [s%3A8FnPwdeM9kdGTZlWvdaVtQ0S1BCOhY5G.qys7H2oGSLLdRsEq7sqh7btOohHsaRKqyjV4LiVnBvc] Detecting Module: [ExpressSignedCookies]" - ): - CookieBasedDetection_2 = True - - assert SecretFound, "No secret found" - assert IdentifyOnly, "No crypto product identified" - assert CookieBasedDetection, "No JWT cookie detected" - assert CookieBasedDetection_2, "No Express.js cookie detected" - - -class Telerik(HttpxMockHelper): - additional_modules = ["httpx"] - config_overrides = {"modules": {"telerik": {"exploit_RAU_crypto": True}}} - - def mock_args(self): - # Simulate Telerik.Web.UI.WebResource.axd?type=rau detection - expect_args = {"method": "GET", "uri": "/Telerik.Web.UI.WebResource.axd", "query_string": "type=rau"} - respond_args = { - "response_data": '{ "message" : "RadAsyncUpload handler is registered succesfully, however, it may not be accessed directly." 
}' - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - # Simulate Vulnerable Telerik.Web.UI.WebResource.axd - vuln_data = "ATTu5i4R+ViNFYO6kst0jC11wM/1iqH+W/isjhaDjNuCI7eJ/BY5d1E9eqZK27CJCMuon9u8/hgRIM/cTlgLlv4qOYjPBjs81Y3dAZAdtIr3TXiCmZi9M09a1BYMxjvGKfVky3b7PoOppeWS/3rglTwL1e8oyqLGx2NKUH5y8Cd+kLKV2f31J1sV4I5HTDKgDmvziJp3zlDrCb0Fi9ilKH+O1cbVx6SdBop/U30FxLaB/QIbt2N1rQHREJ5Skpgo7dilPxzBaTObdBhCVyB/FiJhenS/0u3h0Mpi6+A40SylICcyyxQha7+Uh7lEJ8Ne+2eTs4WqcaaQbvIhy7oHc+D0soxRKMZRjo7Up+UWHQJJh6KtWSCxUESNSdNcxjPQZE9HqsPlldVlkeC+ehSGce5bR0Ylots6Iz1OoCgMEWwxByeG3VzgxF6XpitL61A1hFcNo9euSTnCfOWh0vrQHON7DN5LpM9xr7SoD0Dnu01hZ9NS1PHhPLyN5WS87u5qdZp/z3Sxwc3wawIdo62RNf4Iz2gAKJZnPfxrE1mRn5kBe7f6O44rcuv6lcdao/DGlwbERKwRI6/n+FxGmc7H5iEKyihIwS2XUoOgsYTx5CWCDM8CuOXTk+H5fPYp9APRPbkD1IS9I/vRmvNPwWsgv8/7DzttqdBsGxiZJfCw1uZ7KSVmbItgXPAcscNxGEMaHXyJzkAl/mlM5/t/YSejwYoSW6jFfQcLdaVx2dpIpl5UmmQjFedzKeiNqpZDCk4yzXFHX24XUODYMJDtIJK2Hz1KTZmFG+LAOJjB9QOI58hFAnytcKay+JWFrzah/IvoNZxJUtlYdxw0YEyKs/ExET7AXgYQN0S+8j2PfaMMpzDSctTqpp5XBFV4Mt718GiqVnQJtWQv2p9Xl8XXOerBthbzzAciVcB8AV2WfZ51W3e4aX4kcyT/sCJhm7NR5WrNG5mX/ns0TTnGnzlPYhJcbu8uMFjMGDpXuhVyroJ7wmZucaIvesg0h5Y9cMEFviqsdy15vjMzFh+v9uO9Vicf6n9Z9JGSpWKE8wer2JU5b53Zw0cTfulAAffLWXnzOnfu&6R/cGaqQeHVAzdJ9wTFOyCsrMSTtqcjLe8AHwiPckPDUwecnJyNlkDYwDQpxGYQ9hs6YxhupK310sbCbtXB4H6Dz5rGNL40nkkyo4j2clmRr08jtFsPQ0RpE5BGsulPT3l0MxyAvPFMs8bMybUyAP+9RB9LoHE3Xo8BqDadX3HQakpPfGtiDMp+wxkWRgaNpCnXeY1QewWTF6z/duLzbu6CT6s+H4HgBHrOLTpemC2PvP2bDm0ySPHLdpapLYxU8nIYjLKIyYJgwv9S9jNckIVpcGVTWVul7CauCKxAB2mMnM9jJi8zfFwKajT5d2d9XfpkiVMrdlmikSB/ehyX1wQ==" - expect_args = { - "method": "POST", - "uri": "/Telerik.Web.UI.WebResource.axd", - "query_string": "type=rau", - "data": vuln_data, - } - respond_args = { - "response_data": '{"fileInfo":{"FileName":"RAU_crypto.bypass","ContentType":"text/html","ContentLength":5,"DateJson":"2019-01-02T03:04:05.067Z","Index":0}, "metaData":"CS8S/Z0J/b2982DRxDin0BBslA7fI0cWMuWlPu4W3FkE4tKaVoIEiAOtVlJ6D+0RQsfu8ox6gvMYxceQ0LtWyTkQBaIUa8LgLQg05DMaQuufHNx0YQ2ACi5neqDBvduj2MGiSGC0hNKzSWsHystZGUfFPLTZuJXYnff+WXurecuRzSI7d4Q1aj0bcTKKvfyQtH+fsTEafWRRZ99X/xgi4ON2OsRZ738uQHw7pQT2e1v7AtN46mxO/BmhEuZQr6m6HEvxK0pJRNkBhFUiQ+poeu8j3JzicOjvPDwFE4Rjqf3RVILt83XZrju2VpRIJqAEtf//znhH8BhT5BWvhnRo+J3ML5qoZLa2joE/QK8Ctf3UPvAFkHIUMdOH2mLNgZ+U87tdVE6fYfzvphZsLxmJRG45H8ZTZuYhJbOfei2LQ4fqHmr7p8KpJNVqoz/ev1dnBclAf5ayb40qJKEVsGXIbWEbIZwg7TTsLFc29aP7DPg=" }' - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - # Simulate DialogHandler detection - expect_args = {"method": "GET", "uri": "Telerik.Web.UI.SpellCheckHandler.axd"} - respond_args = {"status": 500} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - # Simulate DialogHandler detection - expect_args = {"method": "GET", "uri": "/App_Master/Telerik.Web.UI.DialogHandler.aspx"} - respond_args = { - "response_data": '
Cannot deserialize dialog parameters. Please refresh the editor page.
Error Message:Invalid length for a Base-64 char array or string.
' - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - # Fallback - expect_args = {"uri": re.compile(r"^/\w{10}$")} - respond_args = {"status": 200} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - telerik_axd_detection = False - telerik_axd_vulnerable = False - telerik_spellcheck_detection = False - telerik_dialoghandler_detection = False - - for e in events: - if e.type == "FINDING" and "Telerik RAU AXD Handler detected" in e.data["description"]: - telerik_axd_detection = True - continue - - if e.type == "VULNERABILITY" and "Confirmed Vulnerable Telerik (version: 2014.3.1024)": - telerik_axd_vulnerable = True - continue - - if e.type == "FINDING" and "Telerik DialogHandler detected" in e.data["description"]: - telerik_dialoghandler_detection = True - continue - - if e.type == "FINDING" and "Telerik SpellCheckHandler detected" in e.data["description"]: - telerik_spellcheck_detection = True - continue - - assert telerik_axd_detection, "Telerik AXD detection failed" - assert telerik_axd_vulnerable, "Telerik vulnerable AXD detection failed" - assert telerik_spellcheck_detection, "Telerik spellcheck detection failed" - assert telerik_dialoghandler_detection, "Telerik dialoghandler detection failed" - - -class Paramminer_headers(HttpxMockHelper): - headers_body = """ - - the title - -

Hello null!

'; - - - """ - - headers_body_match = """ - - the title - -

Hello AAAAAAAAAAAAAA!

'; - - - """ - additional_modules = ["httpx"] - - config_overrides = {"modules": {"paramminer_headers": {"wordlist": tempwordlist(["junkword1", "tracestate"])}}} - - def setup(self, scan): - from bbot.core.helpers import helper - - self.module.rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" - helper.HttpCompare.gen_cache_buster = lambda *args, **kwargs: {"AAAAAA": "1"} - - def mock_args(self): - expect_args = dict(headers={"tracestate": "AAAAAAAAAAAAAA"}) - respond_args = {"response_data": self.headers_body_match} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - respond_args = {"response_data": self.headers_body} - self.set_expect_requests(respond_args=respond_args) - - def check_events(self, events): - assert any( - e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [tracestate] Reasons: [body]" - for e in events - ) - assert not any( - e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [junkword1] Reasons: [body]" - for e in events - ) - - -class Paramminer_getparams(HttpxMockHelper): - getparam_body = """ - - the title - -

Hello null!

'; - - - """ - - getparam_body_match = """ - - the title - -

Hello AAAAAAAAAAAAAA!

'; - - - """ - additional_modules = ["httpx"] - - config_overrides = {"modules": {"paramminer_getparams": {"wordlist": tempwordlist(["canary", "id"])}}} - - def setup(self, scan): - from bbot.core.helpers import helper - - self.module.rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" - helper.HttpCompare.gen_cache_buster = lambda *args, **kwargs: {"AAAAAA": "1"} - - def mock_args(self): - expect_args = {"query_string": b"id=AAAAAAAAAAAAAA&AAAAAA=1"} - respond_args = {"response_data": self.getparam_body_match} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - respond_args = {"response_data": self.getparam_body} - self.set_expect_requests(respond_args=respond_args) - - def check_events(self, events): - assert any( - e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [id] Reasons: [body]" - for e in events - ) - assert not any( - e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [canary] Reasons: [body]" - for e in events - ) - - -class Paramminer_cookies(HttpxMockHelper): - cookies_body = """ - - the title - -
-    <p>Hello null!</p>';
-    </body>
-    </html>
-    """
-
-    cookies_body_match = """
-    <html>
-    <title>the title</title>
-    <body>
-    <p>Hello AAAAAAAAAAAAAA!</p>';
-    </body>
-    </html>
-    """
-    additional_modules = ["httpx"]
-
-    config_overrides = {"modules": {"paramminer_cookies": {"wordlist": tempwordlist(["junkcookie", "admincookie"])}}}
-
-    def setup(self, scan):
-        from bbot.core.helpers import helper
-
-        self.module.rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA"
-        helper.HttpCompare.gen_cache_buster = lambda *args, **kwargs: {"AAAAAA": "1"}
-
-    def mock_args(self):
-        expect_args = dict(headers={"Cookie": "admincookie=AAAAAAAAAAAAAA"})
-        respond_args = {"response_data": self.cookies_body_match}
-        self.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
-
-        respond_args = {"response_data": self.cookies_body}
-        self.set_expect_requests(respond_args=respond_args)
-
-    def check_events(self, events):
-        assert any(
-            e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [admincookie] Reasons: [body]"
-            for e in events
-        )
-        assert not any(
-            e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [junkcookie] Reasons: [body]"
-            for e in events
-        )
-
-
-class LeakIX(RequestMockHelper):
-    def mock_args(self):
-        self.httpx_mock.add_response(
-            url="https://leakix.net/api/subdomains/blacklanternsecurity.com",
-            json=[
-                {
-                    "subdomain": "www.blacklanternsecurity.com",
-                    "distinct_ips": 2,
-                    "last_seen": "2023-02-20T20:23:13.583Z",
-                },
-                {
-                    "subdomain": "asdf.blacklanternsecurity.com",
-                    "distinct_ips": 1,
-                    "last_seen": "2022-09-17T01:31:52.563Z",
-                },
-            ],
-        )
-
-    def check_events(self, events):
-        www = False
-        asdf = False
-        for e in events:
-            if e.type in ("DNS_NAME", "DNS_NAME_UNRESOLVED") and str(e.module) == "leakix":
-                if e.data == "www.blacklanternsecurity.com":
-                    www = True
-                elif e.data == "asdf.blacklanternsecurity.com":
-                    asdf = True
-        assert www
-        assert asdf
-
-
-class Massdns(RequestMockHelper):
-    subdomain_wordlist = tempwordlist(["www", "asdf"])
-    config_overrides = {"modules": {"massdns": {"wordlist": str(subdomain_wordlist)}}}
-
-    def __init__(self, request):
-        super().__init__(request)
-        self.httpx_mock.add_response(
-            url="https://raw.githubusercontent.com/blacklanternsecurity/public-dns-servers/master/nameservers.txt",
-            text="8.8.8.8\n8.8.4.4\n1.1.1.1",
-        )
-
-    def mock_args(self):
-        pass
-
-    def check_events(self, events):
-        assert any(
-            e.type in ("DNS_NAME", "DNS_NAME_UNRESOLVED") and e.data == "www.blacklanternsecurity.com" for e in events
-        )
-
-
-class Robots(HttpxMockHelper):
-    additional_modules = ["httpx"]
-
-    config_overrides = {"modules": {"robots": {"include_sitemap": True}}}
-
-    def mock_args(self):
-        sample_robots = f"Allow: /allow/\nDisallow: /disallow/\nJunk: test.com\nDisallow: /*/wildcard.txt\nSitemap: {self.targets[0]}sitemap.txt"
-
-        expect_args = {"method": "GET", "uri": "/robots.txt"}
-        respond_args = {"response_data": sample_robots}
-        self.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
-
-    def check_events(self, events):
-        allow_bool = False
-        disallow_bool = False
-        sitemap_bool = False
-        wildcard_bool = False
-
-        for e in events:
-            if e.type == "URL_UNVERIFIED":
-                if str(e.module) != "TARGET":
-                    assert "spider-danger" in e.tags, f"{e} doesn't have spider-danger tag"
-                if e.data == "http://127.0.0.1:8888/allow/":
-                    allow_bool = True
-
-                if e.data == "http://127.0.0.1:8888/disallow/":
-                    disallow_bool = True
-
-                if e.data == "http://127.0.0.1:8888/sitemap.txt":
-                    sitemap_bool = True
-
-                if re.match(r"http://127\.0\.0\.1:8888/\w+/wildcard\.txt", e.data):
-                    wildcard_bool = True
-
-        assert allow_bool
-        assert disallow_bool
-        assert sitemap_bool
-        assert wildcard_bool
-
-
-class Masscan(MockHelper):
-    targets = ["8.8.8.8/32"]
-    config_overrides = {"modules": {"masscan": {"ports": "443", "wait": 1}}}
-    config_overrides_2 = {"modules": {"masscan": {"ports": "443", "wait": 1, "use_cache": True}}}
-    masscan_output = """[
-{ "ip": "8.8.8.8", "timestamp": "1680197558", "ports": [ {"port": 443, "proto": "tcp", "status": "open", "reason": "syn-ack", "ttl": 54} ] }
-]"""
-    masscan_config = """seed = 17230484647655100360
-rate = 600
-shard = 1/1
-
-
-# TARGET SELECTION (IP, PORTS, EXCLUDES)
-ports =
-range = 9.8.7.6"""
-
-    def __init__(self, request):
-        super().__init__(request)
-        config2 = OmegaConf.merge(self.config, OmegaConf.create(self.config_overrides_2))
-        self.add_scan(
-            *self.targets,
-            modules=[self.name] + self.additional_modules,
-            name=f"{self.name}_test",
-            config=config2,
-            whitelist=self.whitelist,
-            blacklist=self.blacklist,
-        )
-        self.masscan_run = False
-
-    async def run_masscan(self, command, *args, **kwargs):
-        if "masscan" in command[:2]:
-            for l in self.masscan_output.splitlines():
-                yield l
-            self.masscan_run = True
-        else:
-            async for l in self.scan.helpers.run_live(command, *args, **kwargs):
-                yield l
-
-    def setup(self, scan):
-        scan.helpers.run_live = self.run_masscan
-        scan.modules["masscan"].masscan_config = self.masscan_config
-
-    async def run(self):
-        for i, scan in enumerate(self.scans):
-            await scan.prep()
-            self.setup(scan)
-            events = [e async for e in scan.start()]
-            self.check_events(events)
-            if i == 0:
-                assert self.masscan_run == True, "masscan didn't run when it was supposed to"
-                self.masscan_run = False
-            else:
-                assert self.masscan_run == False, "masscan ran when it wasn't supposed to"
-
-    def check_events(self, events):
-        assert any(e.type == "IP_ADDRESS" and e.data == "8.8.8.8" for e in events), "No IP_ADDRESS emitted"
-        assert any(e.type == "OPEN_TCP_PORT" and e.data == "8.8.8.8:443" for e in events), "No OPEN_TCP_PORT emitted"
-
-
-class Buckets(HttpxMockHelper):
-    providers = ["aws", "gcp", "azure", "digitalocean", "firebase"]
-    # providers = ["azure"]
-    additional_modules = ["excavate", "speculate", "httpx"] + [f"bucket_{p}" for p in providers]
-    config_overrides = {
-        "modules": {
-            "bucket_aws": {"permutations": True},
-            "bucket_gcp": {"permutations": True},
-            "bucket_azure": {"permutations": True},
-            "bucket_digitalocean": {"permutations": True},
-            "bucket_firebase": {"permutations": True},
-        },
-        "excavate": True,
-        "speculate": True,
-    }
-
-    from bbot.core.helpers.misc import rand_string
-
-    random_bucket_name_1 = rand_string(15, digits=False)
-    random_bucket_name_2 = rand_string(15, digits=False)
-
-    open_aws_bucket = """<?xml version="1.0" encoding="UTF-8"?>
-<ListBucketResult xmlns="http://s3.amazonaws.com/doc/2006-03-01/"><Name>vpn-static</Name><Prefix></Prefix><Marker></Marker><MaxKeys>1000</MaxKeys><IsTruncated>false</IsTruncated><Contents><Key>style.css</Key><LastModified>2017-03-18T06:41:59.000Z</LastModified><ETag>&quot;bf9e72bdab09b785f05ff0395023cc35&quot;</ETag><Size>429</Size><StorageClass>STANDARD</StorageClass></Contents></ListBucketResult>"""
-    open_digitalocean_bucket = """<?xml version="1.0" encoding="UTF-8"?><ListBucketResult xmlns="http://s3.amazonaws.com/doc/2006-03-01/"><Name>cloud01</Name><Prefix></Prefix><MaxKeys>1000</MaxKeys><IsTruncated>false</IsTruncated><Contents><Key>test.doc</Key><LastModified>2020-10-14T15:23:37.545Z</LastModified><ETag>&quot;4d25c8699f7347acc9f41e57148c62c0&quot;</ETag><Size>13362425</Size><StorageClass>STANDARD</StorageClass><Owner><ID>1957883</ID><DisplayName>1957883</DisplayName></Owner><Type>Normal</Type></Contents></ListBucketResult>"""
-    open_gcp_bucket = """{
-    "kind": "storage#testIamPermissionsResponse",
-    "permissions": [
-        "storage.objects.create",
-        "storage.objects.list"
-    ]
-}"""
-
-    def __init__(self, request, **kwargs):
-        self.httpx_mock = request.getfixturevalue("httpx_mock")
-        super().__init__(request, **kwargs)
-
-    def setup(self, scan):
-        scan.helpers.word_cloud.mutations = lambda b, cloud=False: [
-            (b, "dev"),
-        ]
-
-    def mock_args(self):
-        expect_args = {"method": "GET", "uri": "/"}
-        body = f"""
- - - - - - - - - - - """ - self.set_expect_requests(expect_args=expect_args, respond_args={"response_data": body}) - - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}.s3-ap-southeast-2.amazonaws.com", - text=self.open_aws_bucket, - ) - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}.fra1.digitaloceanspaces.com", - text=self.open_digitalocean_bucket, - ) - self.httpx_mock.add_response( - url=f"https://www.googleapis.com/storage/v1/b/{self.random_bucket_name_2}/iam/testPermissions?permissions=storage.buckets.setIamPolicy&permissions=storage.objects.list&permissions=storage.objects.get&permissions=storage.objects.create", - text=self.open_gcp_bucket, - ) - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}.firebaseio.com/.json", - text="", - ) - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}-dev.s3.amazonaws.com", - text="", - ) - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}-dev.fra1.digitaloceanspaces.com", - text="", - ) - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}-dev.blob.core.windows.net/{self.random_bucket_name_2}-dev?restype=container", - text="", - ) - self.httpx_mock.add_response( - url=f"https://www.googleapis.com/storage/v1/b/{self.random_bucket_name_2}-dev", - text="", - ) - self.httpx_mock.add_response( - url=f"https://{self.random_bucket_name_2}-dev.firebaseio.com/.json", - text="", - ) - self.httpx_mock.add_response(url=re.compile(".*"), text="", status_code=404) - - def check_events(self, events): - for provider in self.providers: - # make sure buckets were excavated - assert any( - e.type == "STORAGE_BUCKET" and str(e.module) == f"{provider}_cloud" for e in events - ), f'bucket not found for provider "{provider}"' - # make sure open buckets were found - if not provider == "azure": - assert any( - e.type == "FINDING" and str(e.module) == f"bucket_{provider}" for e in events - ), f'open bucket not found for provider "{provider}"' - for e in events: - if e.type == "FINDING" and str(e.module) == f"bucket_{provider}": - url = e.data.get("url", "") - assert self.random_bucket_name_2 in url - assert not self.random_bucket_name_1 in url - assert not f"{self.random_bucket_name_2}-dev" in url - # make sure bucket mutations were found - assert any( - e.type == "STORAGE_BUCKET" - and str(e.module) == f"bucket_{provider}" - and f"{self.random_bucket_name_2}-dev" in e.data["url"] - for e in events - ), f'bucket (dev mutation) not found for provider "{provider}"' - - -class ASN(HttpxMockHelper): - targets = ["8.8.8.8"] - response_get_asn_ripe = { - "messages": [], - "see_also": [], - "version": "1.1", - "data_call_name": "network-info", - "data_call_status": "supported", - "cached": False, - "data": {"asns": ["15169"], "prefix": "8.8.8.0/24"}, - "query_id": "20230217212133-f278ff23-d940-4634-8115-a64dee06997b", - "process_time": 5, - "server_id": "app139", - "build_version": "live.2023.2.1.142", - "status": "ok", - "status_code": 200, - "time": "2023-02-17T21:21:33.428469", - } - response_get_asn_metadata_ripe = { - "messages": [], - "see_also": [], - "version": "4.1", - "data_call_name": "whois", - "data_call_status": "supported - connecting to ursa", - "cached": False, - "data": { - "records": [ - [ - {"key": "ASNumber", "value": "15169", "details_link": None}, - {"key": "ASName", "value": "GOOGLE", "details_link": None}, - {"key": "ASHandle", "value": "15169", "details_link": "https://stat.ripe.net/AS15169"}, - {"key": 
"RegDate", "value": "2000-03-30", "details_link": None}, - { - "key": "Ref", - "value": "https://rdap.arin.net/registry/autnum/15169", - "details_link": "https://rdap.arin.net/registry/autnum/15169", - }, - {"key": "source", "value": "ARIN", "details_link": None}, - ], - [ - {"key": "OrgAbuseHandle", "value": "ABUSE5250-ARIN", "details_link": None}, - {"key": "OrgAbuseName", "value": "Abuse", "details_link": None}, - {"key": "OrgAbusePhone", "value": "+1-650-253-0000", "details_link": None}, - { - "key": "OrgAbuseEmail", - "value": "network-abuse@google.com", - "details_link": "mailto:network-abuse@google.com", - }, - { - "key": "OrgAbuseRef", - "value": "https://rdap.arin.net/registry/entity/ABUSE5250-ARIN", - "details_link": "https://rdap.arin.net/registry/entity/ABUSE5250-ARIN", - }, - {"key": "source", "value": "ARIN", "details_link": None}, - ], - [ - {"key": "OrgName", "value": "Google LLC", "details_link": None}, - {"key": "OrgId", "value": "GOGL", "details_link": None}, - {"key": "Address", "value": "1600 Amphitheatre Parkway", "details_link": None}, - {"key": "City", "value": "Mountain View", "details_link": None}, - {"key": "StateProv", "value": "CA", "details_link": None}, - {"key": "PostalCode", "value": "94043", "details_link": None}, - {"key": "Country", "value": "US", "details_link": None}, - {"key": "RegDate", "value": "2000-03-30", "details_link": None}, - { - "key": "Comment", - "value": "Please note that the recommended way to file abuse complaints are located in the following links.", - "details_link": None, - }, - { - "key": "Comment", - "value": "To report abuse and illegal activity: https://www.google.com/contact/", - "details_link": None, - }, - { - "key": "Comment", - "value": "For legal requests: http://support.google.com/legal", - "details_link": None, - }, - {"key": "Comment", "value": "Regards,", "details_link": None}, - {"key": "Comment", "value": "The Google Team", "details_link": None}, - { - "key": "Ref", - "value": "https://rdap.arin.net/registry/entity/GOGL", - "details_link": "https://rdap.arin.net/registry/entity/GOGL", - }, - {"key": "source", "value": "ARIN", "details_link": None}, - ], - [ - {"key": "OrgTechHandle", "value": "ZG39-ARIN", "details_link": None}, - {"key": "OrgTechName", "value": "Google LLC", "details_link": None}, - {"key": "OrgTechPhone", "value": "+1-650-253-0000", "details_link": None}, - { - "key": "OrgTechEmail", - "value": "arin-contact@google.com", - "details_link": "mailto:arin-contact@google.com", - }, - { - "key": "OrgTechRef", - "value": "https://rdap.arin.net/registry/entity/ZG39-ARIN", - "details_link": "https://rdap.arin.net/registry/entity/ZG39-ARIN", - }, - {"key": "source", "value": "ARIN", "details_link": None}, - ], - [ - {"key": "RTechHandle", "value": "ZG39-ARIN", "details_link": None}, - {"key": "RTechName", "value": "Google LLC", "details_link": None}, - {"key": "RTechPhone", "value": "+1-650-253-0000", "details_link": None}, - {"key": "RTechEmail", "value": "arin-contact@google.com", "details_link": None}, - { - "key": "RTechRef", - "value": "https://rdap.arin.net/registry/entity/ZG39-ARIN", - "details_link": None, - }, - {"key": "source", "value": "ARIN", "details_link": None}, - ], - ], - "irr_records": [], - "authorities": ["arin"], - "resource": "15169", - "query_time": "2023-02-17T21:25:00", - }, - "query_id": "20230217212529-75f57efd-59f4-473f-8bdd-803062e94290", - "process_time": 268, - "server_id": "app143", - "build_version": "live.2023.2.1.142", - "status": "ok", - "status_code": 200, - "time": 
"2023-02-17T21:25:29.417812", - } - response_get_asn_bgpview = { - "status": "ok", - "status_message": "Query was successful", - "data": { - "ip": "8.8.8.8", - "ptr_record": "dns.google", - "prefixes": [ - { - "prefix": "8.8.8.0/24", - "ip": "8.8.8.0", - "cidr": 24, - "asn": {"asn": 15169, "name": "GOOGLE", "description": "Google LLC", "country_code": "US"}, - "name": "LVLT-GOGL-8-8-8", - "description": "Google LLC", - "country_code": "US", - } - ], - "rir_allocation": { - "rir_name": "ARIN", - "country_code": None, - "ip": "8.0.0.0", - "cidr": 9, - "prefix": "8.0.0.0/9", - "date_allocated": "1992-12-01 00:00:00", - "allocation_status": "allocated", - }, - "iana_assignment": { - "assignment_status": "legacy", - "description": "Administered by ARIN", - "whois_server": "whois.arin.net", - "date_assigned": None, - }, - "maxmind": {"country_code": None, "city": None}, - }, - "@meta": {"time_zone": "UTC", "api_version": 1, "execution_time": "567.18 ms"}, - } - response_get_emails_bgpview = { - "status": "ok", - "status_message": "Query was successful", - "data": { - "asn": 15169, - "name": "GOOGLE", - "description_short": "Google LLC", - "description_full": ["Google LLC"], - "country_code": "US", - "website": "https://about.google/intl/en/", - "email_contacts": ["network-abuse@google.com", "arin-contact@google.com"], - "abuse_contacts": ["network-abuse@google.com"], - "looking_glass": None, - "traffic_estimation": None, - "traffic_ratio": "Mostly Outbound", - "owner_address": ["1600 Amphitheatre Parkway", "Mountain View", "CA", "94043", "US"], - "rir_allocation": { - "rir_name": "ARIN", - "country_code": "US", - "date_allocated": "2000-03-30 00:00:00", - "allocation_status": "assigned", - }, - "iana_assignment": { - "assignment_status": None, - "description": None, - "whois_server": None, - "date_assigned": None, - }, - "date_updated": "2023-02-07 06:39:11", - }, - "@meta": {"time_zone": "UTC", "api_version": 1, "execution_time": "56.55 ms"}, - } - config_overrides = {"scope_report_distance": 2} - - def __init__(self, request, **kwargs): - super().__init__(request, **kwargs) - self.scan2 = self.add_scan( - *self.targets, - modules=[self.name] + self.additional_modules, - name=f"{self.name}_test_2", - config=self.config, - ) - - def mock_args(self): - self.httpx_mock.add_response( - url="https://stat.ripe.net/data/network-info/data.json?resource=8.8.8.8", - text=json.dumps(self.response_get_asn_ripe), - ) - self.httpx_mock.add_response( - url="https://stat.ripe.net/data/whois/data.json?resource=15169", - text=json.dumps(self.response_get_asn_metadata_ripe), - ) - self.httpx_mock.add_response( - url="https://api.bgpview.io/ip/8.8.8.8", text=json.dumps(self.response_get_asn_bgpview) - ) - self.httpx_mock.add_response( - url="https://api.bgpview.io/asn/15169", text=json.dumps(self.response_get_emails_bgpview) - ) - - async def run(self): - await self.scan.prep() - self.module.sources = ["bgpview", "ripe"] - events = [e async for e in self.scan.start() if e.module == self.module] - assert self.check_events(events) - await self.scan2.prep() - self.module2 = self.scan2.modules["asn"] - self.module2.sources = ["ripe", "bgpview"] - events2 = [e async for e in self.scan2.start() if e.module == self.module2] - assert self.check_events(events2) - - def check_events(self, events): - asn = False - email = False - for e in events: - if e.type == "ASN": - asn = True - elif e.type == "EMAIL_ADDRESS": - email = True - return asn and email - - -class Wafw00f(HttpxMockHelper): - additional_modules = ["httpx"] - - 
def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "Proudly powered by litespeed web server"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "WAF" and "LiteSpeed" in e.data["WAF"] for e in events) - - -class Vhost(HttpxMockHelper): - targets = ["http://localhost:8888", "secret.localhost"] - - additional_modules = ["httpx"] - - test_wordlist = ["11111111", "admin", "cloud", "junkword1", "zzzjunkword2"] - config_overrides = { - "modules": { - "vhost": { - "wordlist": tempwordlist(test_wordlist), - } - } - } - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "admin.localhost:8888"}} - respond_args = {"response_data": "Alive vhost admin"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "cloud.localhost:8888"}} - respond_args = {"response_data": "Alive vhost cloud"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "q-cloud.localhost:8888"}} - respond_args = {"response_data": "Alive vhost q-cloud"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "secret.localhost:8888"}} - respond_args = {"response_data": "Alive vhost secret"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "host.docker.internal"}} - respond_args = {"response_data": "Alive vhost host.docker.internal"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - basic_detection = False - mutaton_of_detected = False - basehost_mutation = False - special_vhost_list = False - wordcloud_detection = False - - for e in events: - if e.type == "VHOST": - if e.data["vhost"] == "admin": - basic_detection = True - if e.data["vhost"] == "cloud": - mutaton_of_detected = True - if e.data["vhost"] == "q-cloud": - basehost_mutation = True - if e.data["vhost"] == "host.docker.internal": - special_vhost_list = True - if e.data["vhost"] == "secret": - wordcloud_detection = True - - assert basic_detection - assert mutaton_of_detected - assert basehost_mutation - assert special_vhost_list - assert wordcloud_detection - - -class Iis_shortnames(HttpxMockHelper): - additional_modules = ["httpx"] - - config_overrides = {"modules": {"iis_shortnames": {"detect_only": False}}} - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 404 - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "alive", "status": 200} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/*~1*/a.aspx"} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": re.compile(r"\/B\*~1\*.*$")} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = 
{"method": "GET", "uri": re.compile(r"\/BL\*~1\*.*$")} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": re.compile(r"\/BLS\*~1\*.*$")} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": re.compile(r"\/BLSH\*~1\*.*$")} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": re.compile(r"\/BLSHA\*~1\*.*$")} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": re.compile(r"\/BLSHAX\*~1\*.*$")} - respond_args = {"response_data": "", "status": 400} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - vulnerabilityEmitted = False - url_hintEmitted = False - for e in events: - if e.type == "VULNERABILITY": - vulnerabilityEmitted = True - if e.type == "URL_HINT" and e.data == "http://127.0.0.1:8888/BLSHAX~1": - url_hintEmitted = True - - assert vulnerabilityEmitted - assert url_hintEmitted - - -class Nuclei_manual(HttpxMockHelper): - additional_modules = ["httpx", "excavate"] - - test_html = """ - html> - - Index of /test - - -

Index of /test

- - - - -
NameLast modifiedSize

Parent Directory  -
-
Apache/2.4.38 (Debian) Server at http://127.0.0.1:8888/testmultipleruns.html
- -""" - config_overrides = { - "web_spider_distance": 1, - "web_spider_depth": 1, - "modules": { - "nuclei": { - "version": "2.9.4", - "mode": "manual", - "concurrency": 2, - "ratelimit": 10, - "templates": "/tmp/.bbot_test/tools/nuclei-templates/http/miscellaneous/", - "interactsh_disable": True, - "directory_only": False, - } - }, - } - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": self.test_html} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/testmultipleruns.html"} - respond_args = {"response_data": "Copyright 1984"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - first_run_detect = False - second_run_detect = False - for e in events: - if e.type == "FINDING": - if "Directory listing enabled" in e.data["description"]: - first_run_detect = True - elif "Copyright" in e.data["description"]: - second_run_detect = True - assert first_run_detect - assert second_run_detect - - -class Nuclei_severe(HttpxMockHelper): - additional_modules = ["httpx"] - - config_overrides = { - "modules": { - "nuclei": { - "mode": "severe", - "concurrency": 1, - "templates": "/tmp/.bbot_test/tools/nuclei-templates/vulnerabilities/generic/generic-linux-lfi.yaml", - } - }, - "interactsh_disable": True, - } - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/etc/passwd"} - respond_args = {"response_data": "root:.*:0:0:"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any( - e.type == "VULNERABILITY" and "Generic Linux - Local File Inclusion" in e.data["description"] - for e in events - ) - - -class Nuclei_technology(HttpxMockHelper): - additional_modules = ["httpx"] - - config_overrides = { - "interactsh_disable": True, - "modules": {"nuclei": {"mode": "technology", "concurrency": 2, "tags": "apache"}}, - } - - def __init__(self, request, caplog, **kwargs): - self.caplog = caplog - super().__init__(request, **kwargs) - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = { - "response_data": "", - "headers": {"Server": "Apache/2.4.52 (Ubuntu)"}, - } - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - if "Using Interactsh Server" in self.caplog.text: - return False - assert any(e.type == "FINDING" and "apache" in e.data["description"] for e in events) - - -class Nuclei_budget(HttpxMockHelper): - additional_modules = ["httpx"] - - config_overrides = { - "modules": { - "nuclei": { - "mode": "budget", - "concurrency": 1, - "tags": "spiderfoot", - "templates": "/tmp/.bbot_test/tools/nuclei-templates/exposed-panels/spiderfoot.yaml", - "interactsh_disable": True, - } - } - } - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "SpiderFoot
support@spiderfoot.net
"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "FINDING" and "SpiderFoot" in e.data["description"] for e in events) - - -class Url_manipulation(HttpxMockHelper): - body = """ - - the title - -
-    <p>Hello null!</p>';
-    </body>
-    </html>
-    """
-
-    body_match = """
-    <html>
-    <title>the title</title>
-    <body>
-    <p>Hello AAAAAAAAAAAAAA!</p>';
-    </body>
-    </html>
-    """
-    additional_modules = ["httpx"]
-
-    def mock_args(self):
-        expect_args = {"query_string": f"{self.module.rand_string}=.xml".encode()}
-        respond_args = {"response_data": self.body_match}
-        self.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
-
-        respond_args = {"response_data": self.body}
-        self.set_expect_requests(respond_args=respond_args)
-
-    def check_events(self, events):
-        assert any(
-            e.type == "FINDING"
-            and e.data["description"]
-            == f"Url Manipulation: [body] Sig: [Modified URL: http://127.0.0.1:8888/?{self.module.rand_string}=.xml]"
-            for e in events
-        )
-
-
-class Naabu(HttpxMockHelper):
-    def mock_args(self):
-        expect_args = {"method": "GET", "uri": "/"}
-        respond_args = {"response_data": "alive"}
-        self.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
-
-    def check_events(self, events):
-        assert any(e.type == "OPEN_TCP_PORT" for e in events)
-
-
-class Social(HttpxMockHelper):
-    additional_modules = ["httpx", "excavate"]
-
-    def mock_args(self):
-        expect_args = {"method": "GET", "uri": "/"}
-        respond_args = {"response_data": '<html><a href="https://discord.gg/asdf"/></html>
'} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "SOCIAL" and e.data["platform"] == "discord" for e in events) - - -class Hunt(HttpxMockHelper): - additional_modules = ["httpx"] - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": 'ping'} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any( - e.type == "FINDING" and e.data["description"] == "Found potential INSECURE CRYPTOGRAPHY parameter [cipher]" - for e in events - ) - - -class Bypass403(HttpxMockHelper): - additional_modules = ["httpx"] - - targets = ["http://127.0.0.1:8888/test"] - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 403 - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/test..;/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "FINDING" for e in events) - - -class Bypass403_aspnetcookieless(HttpxMockHelper): - additional_modules = ["httpx"] - - targets = ["http://127.0.0.1:8888/admin.aspx"] - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 403 - - def mock_args(self): - expect_args = {"method": "GET", "uri": re.compile(r"\/\([sS]\(\w+\)\)\/.+\.aspx")} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "FINDING" for e in events) - - -class Bypass403_waf(HttpxMockHelper): - additional_modules = ["httpx"] - - targets = ["http://127.0.0.1:8888/test"] - - def setup(self, scan): - self.bbot_httpserver.no_handler_status_code = 403 - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/test..;/"} - respond_args = {"response_data": "The requested URL was rejected"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert not any(e.type == "FINDING" for e in events) - - -class Speculate_subdirectories(HttpxMockHelper): - additional_modules = ["httpx"] - targets = ["http://127.0.0.1:8888/subdir1/subdir2/"] - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/subdir1/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - expect_args = {"method": "GET", "uri": "/subdir1/subdir2/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - assert any(e.type == "URL_UNVERIFIED" and e.data == "http://127.0.0.1:8888/subdir1/" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py b/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py index e69de29bb2..2d9cb1a7ae 100644 --- a/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py +++ b/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py @@ -0,0 +1,6 @@ +from .base import ModuleTestBase + + +class TestGeneric_SSRF(ModuleTestBase): + # PAUL TODO + pass diff --git a/bbot/test/test_step_1/module_tests/test_module_gowitness.py 
b/bbot/test/test_step_1/module_tests/test_module_gowitness.py index 278eb21a3f..9b3cc08082 100644 --- a/bbot/test/test_step_1/module_tests/test_module_gowitness.py +++ b/bbot/test/test_step_1/module_tests/test_module_gowitness.py @@ -22,7 +22,6 @@ def setup_after_prep(self, module_test): } module_test.set_expect_requests(respond_args=respond_args) - def check(self, module_test, events): screenshots_path = self.home_dir / "scans" / module_test.scan.name / "gowitness" / "screenshots" screenshots = list(screenshots_path.glob("*.png")) diff --git a/bbot/test/test_step_1/module_tests/test_module_hackertarget.py b/bbot/test/test_step_1/module_tests/test_module_hackertarget.py index e69de29bb2..d32faa7bb5 100644 --- a/bbot/test/test_step_1/module_tests/test_module_hackertarget.py +++ b/bbot/test/test_step_1/module_tests/test_module_hackertarget.py @@ -0,0 +1,13 @@ +from .base import ModuleTestBase + + +class TestHackertarget(ModuleTestBase): + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.hackertarget.com/hostsearch/?q=blacklanternsecurity.com", + text="asdf.blacklanternsecurity.com\nzzzz.blacklanternsecurity.com", + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" + assert any(e.data == "zzzz.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_host_header.py b/bbot/test/test_step_1/module_tests/test_module_host_header.py index e69de29bb2..75f24378e7 100644 --- a/bbot/test/test_step_1/module_tests/test_module_host_header.py +++ b/bbot/test/test_step_1/module_tests/test_module_host_header.py @@ -0,0 +1,6 @@ +from .base import ModuleTestBase + + +class TestHost_Header(ModuleTestBase): + # PAUL TODO + pass diff --git a/bbot/test/test_step_1/module_tests/test_module_http.py b/bbot/test/test_step_1/module_tests/test_module_http.py index e69de29bb2..d1dd57daa6 100644 --- a/bbot/test/test_step_1/module_tests/test_module_http.py +++ b/bbot/test/test_step_1/module_tests/test_module_http.py @@ -0,0 +1,24 @@ +from .base import ModuleTestBase + + +class TestHTTP(ModuleTestBase): + downstream_url = "https://blacklanternsecurity.fakedomain:1234/events" + config_overrides = { + "output_modules": { + "http": { + "url": downstream_url, + "method": "PUT", + "bearer": "auth_token", + "username": "bbot_user", + "password": "bbot_password", + } + } + } + + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + method="PUT", headers={"Authorization": "bearer auth_token"}, url=self.downstream_url + ) + + def check(self, module_test, events): + pass diff --git a/bbot/test/test_step_1/module_tests/test_module_httpx.py b/bbot/test/test_step_1/module_tests/test_module_httpx.py index e69de29bb2..a737b2d762 100644 --- a/bbot/test/test_step_1/module_tests/test_module_httpx.py +++ b/bbot/test/test_step_1/module_tests/test_module_httpx.py @@ -0,0 +1,29 @@ +import json +from .base import ModuleTestBase + + +class TestHTTPX(ModuleTestBase): + targets = ["http://127.0.0.1:8888/url", "127.0.0.1:8888"] + + def setup_after_prep(self, module_test): + request_args = dict(uri="/", headers={"test": "header"}) + respond_args = dict(response_data=json.dumps({"open": "port"})) + module_test.set_expect_requests(request_args, respond_args) + request_args = dict(uri="/url", headers={"test": "header"}) + respond_args = dict(response_data=json.dumps({"url": "url"})) + 
module_test.set_expect_requests(request_args, respond_args) + + def check(self, module_test, events): + url = False + open_port = False + for e in events: + if e.type == "HTTP_RESPONSE": + j = json.loads(e.data["body"]) + if e.data["path"] == "/": + if j.get("open", "") == "port": + open_port = True + elif e.data["path"] == "/url": + if j.get("url", "") == "url": + url = True + assert url, "Failed to visit target URL" + assert open_port, "Failed to visit target OPEN_TCP_PORT" diff --git a/bbot/test/test_step_1/module_tests/test_module_human.py b/bbot/test/test_step_1/module_tests/test_module_human.py index e69de29bb2..8bf252a002 100644 --- a/bbot/test/test_step_1/module_tests/test_module_human.py +++ b/bbot/test/test_step_1/module_tests/test_module_human.py @@ -0,0 +1,8 @@ +from .base import ModuleTestBase + + +class TestHuman(ModuleTestBase): + def check(self, module_test, events): + txt_file = module_test.scan.home / "output.txt" + with open(txt_file) as f: + assert f.read().startswith("[SCAN]") diff --git a/bbot/test/test_step_1/module_tests/test_module_hunt.py b/bbot/test/test_step_1/module_tests/test_module_hunt.py index e69de29bb2..d5809fa1e0 100644 --- a/bbot/test/test_step_1/module_tests/test_module_hunt.py +++ b/bbot/test/test_step_1/module_tests/test_module_hunt.py @@ -0,0 +1,17 @@ +from .base import ModuleTestBase + + +class TestHunt(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "hunt"] + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": 'ping'} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any( + e.type == "FINDING" and e.data["description"] == "Found potential INSECURE CRYPTOGRAPHY parameter [cipher]" + for e in events + ) diff --git a/bbot/test/test_step_1/module_tests/test_module_hunterio.py b/bbot/test/test_step_1/module_tests/test_module_hunterio.py index e69de29bb2..ff09ed0d8b 100644 --- a/bbot/test/test_step_1/module_tests/test_module_hunterio.py +++ b/bbot/test/test_step_1/module_tests/test_module_hunterio.py @@ -0,0 +1,96 @@ +from .base import ModuleTestBase + + +class TestHunterio(ModuleTestBase): + config_overrides = {"modules": {"hunterio": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.hunter.io/v2/account?api_key=asdf", + json={ + "data": { + "first_name": "jon", + "last_name": "snow", + "email": "jon@blacklanternsecurity.notreal", + "plan_name": "Starter", + "plan_level": 1, + "reset_date": "1917-05-23", + "team_id": 1234, + "calls": { + "_deprecation_notice": "Sums the searches and the verifications, giving an unprecise look of the available requests", + "used": 999, + "available": 2000, + }, + "requests": { + "searches": {"used": 998, "available": 1000}, + "verifications": {"used": 0, "available": 1000}, + }, + } + }, + ) + module_test.httpx_mock.add_response( + url="https://api.hunter.io/v2/domain-search?domain=blacklanternsecurity.com&api_key=asdf&limit=100&offset=0", + json={ + "data": { + "domain": "blacklanternsecurity.com", + "disposable": False, + "webmail": False, + "accept_all": False, + "pattern": "{first}", + "organization": "Black Lantern Security", + "description": None, + "twitter": None, + "facebook": None, + "linkedin": "https://linkedin.com/company/black-lantern-security", + "instagram": None, + "youtube": None, + "technologies": ["jekyll", "nginx"], + "country": 
"US", + "state": "CA", + "city": "Night City", + "postal_code": "12345", + "street": "123 Any St", + "emails": [ + { + "value": "asdf@blacklanternsecurity.com", + "type": "generic", + "confidence": 77, + "sources": [ + { + "domain": "blacklanternsecurity.com", + "uri": "http://blacklanternsecurity.com", + "extracted_on": "2021-06-09", + "last_seen_on": "2023-03-21", + "still_on_page": True, + } + ], + "first_name": None, + "last_name": None, + "position": None, + "seniority": None, + "department": "support", + "linkedin": None, + "twitter": None, + "phone_number": None, + "verification": {"date": None, "status": None}, + } + ], + "linked_domains": [], + }, + "meta": { + "results": 1, + "limit": 100, + "offset": 0, + "params": { + "domain": "blacklanternsecurity.com", + "company": None, + "type": None, + "seniority": None, + "department": None, + }, + }, + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf@blacklanternsecurity.com" for e in events), "Failed to detect email" diff --git a/bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py b/bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py index e69de29bb2..338d4e3b3c 100644 --- a/bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py +++ b/bbot/test/test_step_1/module_tests/test_module_iis_shortnames.py @@ -0,0 +1,56 @@ +import re + +from .base import ModuleTestBase + + +class TestIIS_Shortnames(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "iis_shortnames"] + config_overrides = {"modules": {"iis_shortnames": {"detect_only": False}}} + + def setup_after_prep(self, module_test): + module_test.httpserver.no_handler_status_code = 404 + + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "alive", "status": 200} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": "/*~1*/a.aspx"} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": re.compile(r"\/B\*~1\*.*$")} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": re.compile(r"\/BL\*~1\*.*$")} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": re.compile(r"\/BLS\*~1\*.*$")} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": re.compile(r"\/BLSH\*~1\*.*$")} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": re.compile(r"\/BLSHA\*~1\*.*$")} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + expect_args = {"method": "GET", "uri": re.compile(r"\/BLSHAX\*~1\*.*$")} + respond_args = {"response_data": "", "status": 400} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + vulnerabilityEmitted = False + url_hintEmitted = False + for e in events: + if e.type == "VULNERABILITY": + 
vulnerabilityEmitted = True + if e.type == "URL_HINT" and e.data == "http://127.0.0.1:8888/BLSHAX~1": + url_hintEmitted = True + + assert vulnerabilityEmitted + assert url_hintEmitted diff --git a/bbot/test/test_step_1/test_modules_full.py b/bbot/test/test_step_1/test_modules_full.py deleted file mode 100644 index 5c6ec38651..0000000000 --- a/bbot/test/test_step_1/test_modules_full.py +++ /dev/null @@ -1,234 +0,0 @@ -import logging - -from ..bbot_fixtures import * # noqa: F401 -from ..modules_test_classes import * - -log = logging.getLogger(f"bbot.test") - - -@pytest.mark.asyncio -async def test_httpx(request): - x = Httpx(request) - await x.run() - - -@pytest.mark.asyncio -async def test_gowitness(request): - x = Gowitness(request) - await x.run() - - -@pytest.mark.asyncio -async def test_excavate(request): - x = Excavate(request) - await x.run() - - -@pytest.mark.asyncio -async def test_excavate_relativelinks(request): - x = Excavate_relativelinks(request, module_name="excavate") - await x.run() - - -@pytest.mark.asyncio -async def test_subdomain_hijack(request): - x = Subdomain_Hijack(request) - await x.run() - - -@pytest.mark.asyncio -async def test_fingerprintx(request): - x = Fingerprintx(request) - await x.run() - - -@pytest.mark.asyncio -async def test_otx(request): - x = Otx(request) - await x.run() - - -@pytest.mark.asyncio -async def test_anubisdb(request): - x = Anubisdb(request) - await x.run() - - -@pytest.mark.asyncio -async def test_secretsdb(request): - x = SecretsDB(request) - await x.run() - - -@pytest.mark.asyncio -async def test_badsecrets(request): - x = Badsecrets(request) - await x.run() - - -@pytest.mark.asyncio -async def test_telerik(request): - x = Telerik(request) - await x.run() - - -@pytest.mark.asyncio -async def test_paramminer_headers(request): - x = Paramminer_headers(request) - await x.run() - - -@pytest.mark.asyncio -async def test_paramminer_getparams(request): - x = Paramminer_getparams(request) - await x.run() - - -@pytest.mark.asyncio -async def test_paramminer_cookies(request): - x = Paramminer_cookies(request) - await x.run() - - -@pytest.mark.asyncio -async def test_leakix(request): - x = LeakIX(request) - await x.run() - - -@pytest.mark.asyncio -async def test_massdns(request): - x = Massdns(request) - await x.run() - - -@pytest.mark.asyncio -async def test_masscan(request): - x = Masscan(request) - await x.run() - - -@pytest.mark.asyncio -async def test_robots(request): - x = Robots(request) - await x.run() - - -@pytest.mark.asyncio -async def test_buckets(request): - x = Buckets(request, module_name="excavate") - await x.run() - - -@pytest.mark.asyncio -async def test_asn(request): - x = ASN(request) - await x.run() - - -@pytest.mark.asyncio -async def test_wafw00f(request): - x = Wafw00f(request) - await x.run() - - -@pytest.mark.asyncio -async def test_ffuf(request): - x = Ffuf(request) - await x.run() - - -@pytest.mark.asyncio -async def test_ffuf_extensions(request): - x = Ffuf_extensions(request, module_name="ffuf") - await x.run() - - -@pytest.mark.asyncio -async def test_vhost(request): - x = Vhost(request) - await x.run() - - -@pytest.mark.asyncio -async def test_ffuf_shortnames(request): - x = Ffuf_shortnames(request) - await x.run() - - -@pytest.mark.asyncio -async def test_iis_shortnames(request): - x = Iis_shortnames(request) - await x.run() - - -@pytest.mark.asyncio -async def test_nuclei_manual(request): - x = Nuclei_manual(request, module_name="nuclei") - await x.run() - - -@pytest.mark.asyncio -async def 
test_bypass403(request): - x = Bypass403(request) - await x.run() - - -@pytest.mark.asyncio -async def test_bypass403_waf(request): - x = Bypass403_waf(request, module_name="bypass403") - await x.run() - - -@pytest.mark.asyncio -async def test_bypass403_aspnetcookieless(request): - x = Bypass403_aspnetcookieless(request, module_name="bypass403") - await x.run() - - -@pytest.mark.asyncio -async def test_nuclei_technology(request, caplog): - x = Nuclei_technology(request, caplog, module_name="nuclei") - await x.run() - - -@pytest.mark.asyncio -async def test_nuclei_severe(request): - x = Nuclei_severe(request, module_name="nuclei") - await x.run() - - -@pytest.mark.asyncio -async def test_nuclei_budget(request): - x = Nuclei_budget(request, module_name="nuclei") - await x.run() - - -@pytest.mark.asyncio -async def test_url_manipulation(request): - x = Url_manipulation(request) - await x.run() - - -@pytest.mark.asyncio -async def test_naabu(request): - x = Naabu(request) - await x.run() - - -@pytest.mark.asyncio -async def test_hunt(request): - x = Hunt(request) - await x.run() - - -@pytest.mark.asyncio -async def test_speculate_subdirectories(request): - x = Speculate_subdirectories(request, module_name="speculate") - await x.run() - - -@pytest.mark.asyncio -async def test_social(request): - x = Social(request) - await x.run() diff --git a/bbot/test/test_step_2/test_scope.py b/bbot/test/test_step_2/test_scope.py index 55838d3458..cc39902ee9 100644 --- a/bbot/test/test_step_2/test_scope.py +++ b/bbot/test/test_step_2/test_scope.py @@ -1,48 +1,22 @@ from ..bbot_fixtures import * # noqa: F401 -from ..modules_test_classes import HttpxMockHelper +from ..test_step_1.module_tests.base import ModuleTestBase -class Scope_test_blacklist(HttpxMockHelper): - additional_modules = ["httpx"] +class Scope_test_blacklist(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx"] blacklist = ["127.0.0.1"] - def mock_args(self): + def setup_after_prep(self, module_test): expect_args = {"method": "GET", "uri": "/"} respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - def check_events(self, events): - for e in events: - if e.type == "URL": - return False - return True + def check(self, module_test, events): + assert not any(e.type == "URL" for e in events) -class Scope_test_whitelist(HttpxMockHelper): - additional_modules = ["httpx"] - +class Scope_test_whitelist(Scope_test_blacklist): + blacklist = [] whitelist = ["255.255.255.255"] - - def mock_args(self): - expect_args = {"method": "GET", "uri": "/"} - respond_args = {"response_data": "alive"} - self.set_expect_requests(expect_args=expect_args, respond_args=respond_args) - - def check_events(self, events): - for e in events: - if e.type == "URL": - return False - return True - - -@pytest.mark.asyncio -async def test_scope_blacklist(bbot_config, bbot_scanner, bbot_httpserver): - x = Scope_test_blacklist(bbot_config, bbot_scanner, bbot_httpserver, module_name="httpx") - await x.run() - - -@pytest.mark.asyncio -async def test_scope_whitelist(bbot_config, bbot_scanner, bbot_httpserver): - x = Scope_test_whitelist(bbot_config, bbot_scanner, bbot_httpserver, module_name="httpx") - await x.run() diff --git a/bbot/test/test_step_2/test_web.py b/bbot/test/test_step_2/test_web.py index 92fcfa1afe..b0c76bf4fc 100644 --- a/bbot/test/test_step_2/test_web.py +++ 
b/bbot/test/test_step_2/test_web.py @@ -104,9 +104,14 @@ async def async_callback(data): log.debug(f"interactsh poll: {data}") interactsh_domain = await interactsh_client.register(callback=async_callback) + url = f"https://{interactsh_domain}/bbot_interactsh_test" + response = await scan1.helpers.request(url) + assert response.status_code == 200 + await asyncio.sleep(10) assert any(interactsh_domain.endswith(f"{s}") for s in server_list) data_list = await interactsh_client.poll() assert isinstance(data_list, list) + assert any("bbot_interactsh_test" in d.get("raw-request", "") for d in data_list) assert await interactsh_client.deregister() is None From b8b15345e03154176fe1b4663d3ca0e83ffd6785 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sun, 21 May 2023 13:27:23 -0400 Subject: [PATCH 032/387] more module tests --- bbot/cli.py | 2 + bbot/core/errors.py | 2 +- bbot/core/helpers/dns.py | 6 + bbot/core/helpers/misc.py | 7 +- bbot/modules/dnszonetransfer.py | 6 +- bbot/modules/ipstack.py | 6 +- bbot/modules/leakix.py | 25 +++- bbot/modules/ntlm.py | 25 ++-- bbot/modules/output/neo4j.py | 14 +- bbot/modules/telerik.py | 6 +- bbot/scanner/scanner.py | 11 +- bbot/test/test_step_1/module_tests/base.py | 26 +++- .../test_module_dnszonetransfer.py | 17 +-- .../module_tests/test_module_fullhunt.py | 4 + .../module_tests/test_module_ipneighbor.py | 20 +++ .../module_tests/test_module_ipstack.py | 70 ++++++++++ .../module_tests/test_module_json.py | 14 ++ .../module_tests/test_module_leakix.py | 26 ++++ .../module_tests/test_module_masscan.py | 49 +++++++ .../module_tests/test_module_massdns.py | 16 +++ .../module_tests/test_module_naabu.py | 11 ++ .../module_tests/test_module_neo4j.py | 16 +++ .../module_tests/test_module_ntlm.py | 23 ++++ .../module_tests/test_module_nuclei.py | 125 ++++++++++++++++++ .../module_tests/test_module_otx.py | 27 ++++ .../test_module_paramminer_cookies.py | 46 +++++++ .../test_module_paramminer_getparams.py | 45 +++++++ .../test_module_paramminer_headers.py | 49 +++++++ 28 files changed, 641 insertions(+), 53 deletions(-) diff --git a/bbot/cli.py b/bbot/cli.py index bc292f7c75..32e2a8c33c 100755 --- a/bbot/cli.py +++ b/bbot/cli.py @@ -327,6 +327,8 @@ def main(): global scan_name try: asyncio.run(_main()) + except asyncio.CancelledError: + pass except KeyboardInterrupt: msg = "Interrupted" if scan_name: diff --git a/bbot/core/errors.py b/bbot/core/errors.py index 24c94d4343..df134f66c2 100644 --- a/bbot/core/errors.py +++ b/bbot/core/errors.py @@ -1,4 +1,4 @@ -from httpx import RequestError # noqa +from httpx import RequestError, ReadTimeout # noqa class BBOTError(Exception): diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 3c10bcc48d..8135151ac2 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -432,6 +432,9 @@ async def is_wildcard(self, query, ips=None, rdtype=None): """ result = {} + if is_ip(query): + return result + # skip check if the query's parent domain is excluded in the config for d in self.wildcard_ignore: if self.parent_helper.host_in_host(query, d): @@ -518,6 +521,9 @@ async def is_wildcard_domain(self, domain, log_info=False): wildcard_domain_results = {} domain = self._clean_dns_record(domain) + if is_ip(domain): + return {} + # skip check if the query's parent domain is excluded in the config for d in self.wildcard_ignore: if self.parent_helper.host_in_host(domain, d): diff --git a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index ed8c414e37..9f2fa15db8 100644 --- a/bbot/core/helpers/misc.py +++ 
b/bbot/core/helpers/misc.py @@ -1066,5 +1066,10 @@ def get_traceback_details(e): async def cancel_tasks(tasks): for task in tasks: task.cancel() - with suppress(asyncio.CancelledError): + try: await task + except asyncio.CancelledError: + pass + except Exception as e: + log.debug(e) + log.trace(traceback.format_exc()) diff --git a/bbot/modules/dnszonetransfer.py b/bbot/modules/dnszonetransfer.py index 52a9b9634d..5d959bcfe9 100644 --- a/bbot/modules/dnszonetransfer.py +++ b/bbot/modules/dnszonetransfer.py @@ -1,6 +1,5 @@ import dns.zone import dns.query -from functools import partial from bbot.modules.base import BaseModule @@ -37,8 +36,9 @@ async def handle_event(self, event): break try: self.debug(f"Attempting zone transfer against {nameserver} for domain {domain}") - xfr_fn = partial(dns.query.xfr, timeout=self.timeout, lifetime=self.timeout) - xfr_answer = await self.scan.run_in_executor(xfr_fn, nameserver, domain) + xfr_answer = await self.scan.run_in_executor( + dns.query.xfr, nameserver, domain, timeout=self.timeout, lifetime=self.timeout + ) zone = dns.zone.from_xfr(xfr_answer) except Exception as e: self.verbose(f"Error retrieving zone: {e}") diff --git a/bbot/modules/ipstack.py b/bbot/modules/ipstack.py index a5636ed62f..a1d01acc7c 100644 --- a/bbot/modules/ipstack.py +++ b/bbot/modules/ipstack.py @@ -19,8 +19,12 @@ class Ipstack(shodan_dns): base_url = "http://api.ipstack.com/" + async def filter_event(self, event): + return True + async def ping(self): - r = await self.request_with_fail_count(f"{self.base_url}/check?access_key={self.api_key}") + url = f"{self.base_url}/check?access_key={self.api_key}" + r = await self.request_with_fail_count(url) resp_content = getattr(r, "text", "") assert getattr(r, "status_code", 0) == 200, resp_content diff --git a/bbot/modules/leakix.py b/bbot/modules/leakix.py index d494683afc..6622242e83 100644 --- a/bbot/modules/leakix.py +++ b/bbot/modules/leakix.py @@ -1,17 +1,38 @@ from .crobat import crobat +from .shodan_dns import shodan_dns -class leakix(crobat): +class leakix(shodan_dns): watched_events = ["DNS_NAME"] produced_events = ["DNS_NAME"] flags = ["subdomain-enum", "passive", "safe"] + options = {"api_key": ""} + # NOTE: API key is not required (but having one will get you more results) + options_desc = {"api_key": "LeakIX API Key"} meta = {"description": "Query leakix.net for subdomains"} base_url = "https://leakix.net" + async def setup(self): + ret = await crobat.setup(self) + self.headers = {"Accept": "application/json"} + self.api_key = self.config.get("api_key", "") + if self.api_key: + self.headers["api-key"] = self.api_key + return await self.require_api_key() + return ret + + async def ping(self): + url = f"{self.base_url}/host/1.2.3.4.5" + r = await self.helpers.request(url, headers=self.headers) + resp_content = getattr(r, "text", "") + assert getattr(r, "status_code", 0) != 401, resp_content + async def request_url(self, query): url = f"{self.base_url}/api/subdomains/{self.helpers.quote(query)}" - return await self.request_with_fail_count(url, headers={"Accept": "application/json"}) + response = await self.request_with_fail_count(url, headers=self.headers) + self.hugewarning(response.json()) + return response def parse_results(self, r, query=None): json = r.json() diff --git a/bbot/modules/ntlm.py b/bbot/modules/ntlm.py index 6ef511560c..a5d2fed372 100644 --- a/bbot/modules/ntlm.py +++ b/bbot/modules/ntlm.py @@ -1,5 +1,5 @@ from bbot.modules.base import BaseModule -from bbot.core.errors import NTLMError, RequestError +from 
bbot.core.errors import NTLMError, RequestError, ReadTimeout ntlm_discovery_endpoints = [ "", @@ -77,19 +77,21 @@ async def setup(self): async def handle_event(self, event): found_hash = hash(f"{event.host}:{event.port}") if found_hash not in self.found: - result_FQDN, request_url = self.handle_url(event) - if result_FQDN and request_url: + result, request_url = await self.handle_url(event) + if result and request_url: self.found.add(found_hash) self.emit_event( { "host": str(event.host), "url": request_url, - "description": f"NTLM AUTH: {result_FQDN}", + "description": f"NTLM AUTH: {result}", }, "FINDING", source=event, ) - self.emit_event(result_FQDN, "DNS_NAME", source=event) + fqdn = result.get("FQDN", "") + if fqdn: + self.emit_event(fqdn, "DNS_NAME", source=event) async def filter_event(self, event): if self.try_all: @@ -127,12 +129,13 @@ async def handle_url(self, event): try: result, url = await task if result: - self.helpers.cancel_tasks(tasks) - return str(result["FQDN"]), url - except RequestError as e: - self.warning(str(e)) + await self.helpers.cancel_tasks(tasks) + return result, url + except (RequestError, ReadTimeout) as e: + if str(e): + self.warning(str(e)) # cancel all the tasks if there's an error - self.helpers.cancel_tasks(tasks) + await self.helpers.cancel_tasks(tasks) break return None, None @@ -152,3 +155,5 @@ async def check_ntlm(self, test_url): return ntlm_resp_decoded, test_url except NTLMError as e: self.verbose(str(e)) + return None, test_url + return None, test_url diff --git a/bbot/modules/output/neo4j.py b/bbot/modules/output/neo4j.py index ea7e3ff720..477bdd373b 100644 --- a/bbot/modules/output/neo4j.py +++ b/bbot/modules/output/neo4j.py @@ -1,5 +1,4 @@ from bbot.db.neo4j import Neo4j - from bbot.modules.output.base import BaseOutputModule @@ -21,19 +20,20 @@ class neo4j(BaseOutputModule): async def setup(self): try: - self.neo4j = Neo4j( + self.neo4j = await self.scan.run_in_executor( + Neo4j, uri=self.config.get("uri", self.options["uri"]), username=self.config.get("username", self.options["username"]), password=self.config.get("password", self.options["password"]), ) - self.neo4j.insert_event(self.scan.root_event) + await self.scan.run_in_executor(self.neo4j.insert_event, self.scan.root_event) except Exception as e: self.warning(f"Error setting up Neo4j: {e}") return False return True - def handle_event(self, event): - self.neo4j.insert_event(event) + async def handle_event(self, event): + await self.scan.run_in_executor(self.neo4j.insert_event, event) - def handle_batch(self, *events): - self.neo4j.insert_events(events) + async def handle_batch(self, *events): + await self.scan.run_in_executor(self.neo4j.insert_events, events) diff --git a/bbot/modules/telerik.py b/bbot/modules/telerik.py index 5166e45b73..1fa5cc6425 100644 --- a/bbot/modules/telerik.py +++ b/bbot/modules/telerik.py @@ -235,11 +235,11 @@ async def handle_event(self, event): if fail_count < 2: continue self.debug(f"Cancelling run against {event.data} due to failed request") - self.helpers.cancel_tasks(tasks) + await self.helpers.cancel_tasks(tasks) break else: if "Cannot deserialize dialog parameters" in result.text: - self.helpers.cancel_tasks(tasks) + await self.helpers.cancel_tasks(tasks) self.debug(f"Detected Telerik UI instance ({dh})") description = f"Telerik DialogHandler detected" self.emit_event( @@ -250,7 +250,7 @@ async def handle_event(self, event): # Once we have a match we need to stop, because the basic handler (Telerik.Web.UI.DialogHandler.aspx) usually works with a 
path wildcard break - self.helpers.cancel_tasks(tasks) + await self.helpers.cancel_tasks(tasks) spellcheckhandler = "Telerik.Web.UI.SpellCheckHandler.axd" result, _ = await self.test_detector(event.data, spellcheckhandler) diff --git a/bbot/scanner/scanner.py b/bbot/scanner/scanner.py index c2459ad1cd..f55a5c0d60 100644 --- a/bbot/scanner/scanner.py +++ b/bbot/scanner/scanner.py @@ -8,6 +8,7 @@ from sys import exc_info from pathlib import Path from datetime import datetime +from functools import partial from omegaconf import OmegaConf from collections import OrderedDict @@ -381,10 +382,7 @@ async def cancel_tasks(self): tasks.append(self.ticker_task) # manager worker loops tasks += self.manager_worker_loop_tasks - for t in tasks: - t.cancel() - with contextlib.suppress(asyncio.CancelledError): - await t + await self.helpers.cancel_tasks(tasks) async def report(self): for mod in self.modules.values(): @@ -675,8 +673,9 @@ async def acatch(self, context="scan", finally_callback=None): except BaseException as e: self._handle_exception(e, context=context) - def run_in_executor(self, *args, **kwargs): - return self._loop.run_in_executor(None, *args, **kwargs) + def run_in_executor(self, callback, *args, **kwargs): + callback = partial(callback, **kwargs) + return self._loop.run_in_executor(None, callback, *args) def _handle_exception(self, e, context="scan", finally_callback=None): if callable(context): diff --git a/bbot/test/test_step_1/module_tests/base.py b/bbot/test/test_step_1/module_tests/base.py index 2f5f935591..41294b2c6c 100644 --- a/bbot/test/test_step_1/module_tests/base.py +++ b/bbot/test/test_step_1/module_tests/base.py @@ -1,8 +1,9 @@ import pytest -import pytest_asyncio import logging +import pytest_asyncio from abc import abstractmethod from omegaconf import OmegaConf +from types import SimpleNamespace from bbot.scanner import Scanner from bbot.modules import module_loader @@ -25,6 +26,19 @@ def tempwordlist(content): return filename +class MockRecord: + def __init__(self, record, rdtype): + self.rdtype = SimpleNamespace() + self.rdtype.name = rdtype + self.record = record + + def __str__(self): + return self.record + + def to_text(self): + return str(self) + + class TestClass: @pytest_asyncio.fixture async def my_fixture(self, bbot_httpserver): @@ -45,13 +59,14 @@ class ModuleTestBase: modules_overrides = [] class ModuleTest: - def __init__(self, module_test_base, httpx_mock, httpserver, monkeypatch): + def __init__(self, module_test_base, httpx_mock, httpserver, monkeypatch, request): self.name = module_test_base.name self.config = OmegaConf.merge(test_config, OmegaConf.create(module_test_base.config_overrides)) self.httpx_mock = httpx_mock self.httpserver = httpserver self.monkeypatch = monkeypatch + self.request_fixture = request # handle output, internal module types preloaded = module_loader.preloaded() @@ -90,9 +105,12 @@ def set_expect_requests(self, expect_args={}, respond_args={}): def module(self): return self.scan.modules[self.name] + def mock_record(self, *args, **kwargs): + return MockRecord(*args, **kwargs) + @pytest_asyncio.fixture - async def module_test(self, httpx_mock, bbot_httpserver, monkeypatch): - module_test = self.ModuleTest(self, httpx_mock, bbot_httpserver, monkeypatch) + async def module_test(self, httpx_mock, bbot_httpserver, monkeypatch, request): + module_test = self.ModuleTest(self, httpx_mock, bbot_httpserver, monkeypatch, request) self.setup_before_prep(module_test) await module_test.scan.prep() self.setup_after_prep(module_test) diff --git 
a/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py b/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py index f746ee717d..40f450a974 100644 --- a/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py +++ b/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py @@ -1,7 +1,6 @@ import dns.zone import dns.query import dns.message -from types import SimpleNamespace from .base import ModuleTestBase @@ -13,23 +12,11 @@ class TestDNSZoneTransfer(ModuleTestBase): def setup_after_prep(self, module_test): old_resolve_fn = module_test.scan.helpers.dns._resolve_hostname - class MockRecord: - def __init__(self, record, rdtype): - self.rdtype = SimpleNamespace() - self.rdtype.name = rdtype - self.record = record - - def __str__(self): - return self.record - - def to_text(self): - return str(self) - async def _resolve_hostname(query, **kwargs): if query == "blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() == "NS": - return [MockRecord("ns01.blacklanternsecurity.fakedomain", "NS")], [] + return [module_test.mock_record("ns01.blacklanternsecurity.fakedomain", "NS")], [] if query == "ns01.blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() in "A": - return [MockRecord("127.0.0.1", "A")], [] + return [module_test.mock_record("127.0.0.1", "A")], [] return await old_resolve_fn(query, **kwargs) def from_xfr(*args, **kwargs): diff --git a/bbot/test/test_step_1/module_tests/test_module_fullhunt.py b/bbot/test/test_step_1/module_tests/test_module_fullhunt.py index bada14732a..1847ad40c7 100644 --- a/bbot/test/test_step_1/module_tests/test_module_fullhunt.py +++ b/bbot/test/test_step_1/module_tests/test_module_fullhunt.py @@ -2,9 +2,12 @@ class TestFullhunt(ModuleTestBase): + config_overrides = {"modules": {"fullhunt": {"api_key": "asdf"}}} + def setup_before_prep(self, module_test): module_test.httpx_mock.add_response( url="https://fullhunt.io/api/v1/auth/status", + match_headers={"x-api-key": "asdf"}, json={ "message": "", "status": 200, @@ -25,6 +28,7 @@ def setup_before_prep(self, module_test): ) module_test.httpx_mock.add_response( url="https://fullhunt.io/api/v1/domain/blacklanternsecurity.com/subdomains", + match_headers={"x-api-key": "asdf"}, json={ "domain": "blacklanternsecurity.com", "hosts": [ diff --git a/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py b/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py index e69de29bb2..6463c2cfaf 100644 --- a/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py +++ b/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py @@ -0,0 +1,20 @@ +from .base import ModuleTestBase + + +class TestIPNeighbor(ModuleTestBase): + targets = ["127.0.0.15", "www.bls.notreal"] + config_overrides = {"scope_report_distance": 1, "dns_resolution": True} + + def setup_after_prep(self, module_test): + old_resolve_fn = module_test.scan.helpers.dns.resolve + + async def resolve(query, **kwargs): + module_test.log.critical(f"{query}: {kwargs}") + if query == "127.0.0.3" and kwargs.get("type", "").upper() == "PTR": + return {"www.bls.notreal"} + return await old_resolve_fn(query, **kwargs) + + module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "resolve", resolve) + + def check(self, module_test, events): + assert any(e.data == "127.0.0.3" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_ipstack.py b/bbot/test/test_step_1/module_tests/test_module_ipstack.py index e69de29bb2..8e45c338c2 100644 --- 
a/bbot/test/test_step_1/module_tests/test_module_ipstack.py +++ b/bbot/test/test_step_1/module_tests/test_module_ipstack.py @@ -0,0 +1,70 @@ +from .base import ModuleTestBase + + +class TestIPStack(ModuleTestBase): + targets = ["8.8.8.8"] + config_overrides = {"modules": {"ipstack": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="http://api.ipstack.com//check?access_key=asdf", + json={ + "ip": "1.2.3.4", + "type": "ipv4", + "continent_code": "NA", + "continent_name": "North America", + "country_code": "US", + "country_name": "United States", + "region_code": "FL", + "region_name": "Florida", + "city": "Cape Canaveral", + "zip": "12345", + "latitude": 47.89263153076172, + "longitude": -97.04190063476562, + "location": { + "geoname_id": 5059429, + "capital": "Washington D.C.", + "languages": [{"code": "en", "name": "English", "native": "English"}], + "country_flag": "https://assets.ipstack.com/flags/us.svg", + "country_flag_emoji": "\ud83c\uddfa\ud83c\uddf8", + "country_flag_emoji_unicode": "U+1F1FA U+1F1F8", + "calling_code": "1", + "is_eu": False, + }, + }, + ) + module_test.httpx_mock.add_response( + url="http://api.ipstack.com//8.8.8.8?access_key=asdf", + json={ + "ip": "8.8.8.8", + "type": "ipv4", + "continent_code": "NA", + "continent_name": "North America", + "country_code": "US", + "country_name": "United States", + "region_code": "OH", + "region_name": "Ohio", + "city": "Glenmont", + "zip": "44628", + "latitude": 40.5369987487793, + "longitude": -82.12859344482422, + "location": { + "geoname_id": None, + "capital": "Washington D.C.", + "languages": [{"code": "en", "name": "English", "native": "English"}], + "country_flag": "https://assets.ipstack.com/flags/us.svg", + "country_flag_emoji": "\ud83c\uddfa\ud83c\uddf8", + "country_flag_emoji_unicode": "U+1F1FA U+1F1F8", + "calling_code": "1", + "is_eu": False, + }, + }, + ) + + def check(self, module_test, events): + assert any( + e.type == "GEOLOCATION" + and e.data + == "Ip: 8.8.8.8, Country: United States, City: Glenmont, Zip_code: 44628, Region: Ohio, Latitude: 40.5369987487793, Longitude: -82.12859344482422" + for e in events + ), "Failed to geolocate IP" diff --git a/bbot/test/test_step_1/module_tests/test_module_json.py b/bbot/test/test_step_1/module_tests/test_module_json.py index e69de29bb2..dd552742a5 100644 --- a/bbot/test/test_step_1/module_tests/test_module_json.py +++ b/bbot/test/test_step_1/module_tests/test_module_json.py @@ -0,0 +1,14 @@ +import json + +from .base import ModuleTestBase +from bbot.core.event.base import event_from_json + + +class TestJSON(ModuleTestBase): + def check(self, module_test, events): + txt_file = module_test.scan.home / "output.json" + lines = list(module_test.scan.helpers.read_file(txt_file)) + assert lines + e = event_from_json(json.loads(lines[0])) + assert e.type == "SCAN" + assert e.data == f"{module_test.scan.name} ({module_test.scan.id})" diff --git a/bbot/test/test_step_1/module_tests/test_module_leakix.py b/bbot/test/test_step_1/module_tests/test_module_leakix.py index e69de29bb2..9266660f45 100644 --- a/bbot/test/test_step_1/module_tests/test_module_leakix.py +++ b/bbot/test/test_step_1/module_tests/test_module_leakix.py @@ -0,0 +1,26 @@ +from .base import ModuleTestBase + + +class TestLeakIX(ModuleTestBase): + config_overrides = {"modules": {"leakix": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://leakix.net/host/1.2.3.4.5", + 
match_headers={"api-key": "asdf"}, + json={"title": "Not Found", "description": "Host not found"}, + ) + module_test.httpx_mock.add_response( + url=f"https://leakix.net/api/subdomains/blacklanternsecurity.com", + match_headers={"api-key": "asdf"}, + json=[ + { + "subdomain": "asdf.blacklanternsecurity.com", + "distinct_ips": 3, + "last_seen": "2023-04-02T09:38:30.02Z", + }, + ], + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_masscan.py b/bbot/test/test_step_1/module_tests/test_module_masscan.py index e69de29bb2..2d4fd44631 100644 --- a/bbot/test/test_step_1/module_tests/test_module_masscan.py +++ b/bbot/test/test_step_1/module_tests/test_module_masscan.py @@ -0,0 +1,49 @@ +from .base import ModuleTestBase + + +class TestMasscan(ModuleTestBase): + targets = ["8.8.8.8/32"] + scan_name = "test_masscan" + config_overrides = {"modules": {"masscan": {"ports": "443", "wait": 1}}} + masscan_config = """seed = 17230484647655100360 +rate = 600 +shard = 1/1 + + +# TARGET SELECTION (IP, PORTS, EXCLUDES) +ports = +range = 9.8.7.6""" + + masscan_output = """[ +{ "ip": "8.8.8.8", "timestamp": "1680197558", "ports": [ {"port": 443, "proto": "tcp", "status": "open", "reason": "syn-ack", "ttl": 54} ] } +]""" + + def setup_after_prep(self, module_test): + self.masscan_run = False + + async def run_masscan(command, *args, **kwargs): + if "masscan" in command[:2]: + for l in self.masscan_output.splitlines(): + yield l + self.masscan_run = True + else: + async for l in self.scan.helpers.run_live(command, *args, **kwargs): + yield l + + module_test.scan.modules["masscan"].masscan_config = self.masscan_config + module_test.monkeypatch.setattr(module_test.scan.helpers, "run_live", run_masscan) + + def check(self, module_test, events): + assert self.masscan_run == True + assert any(e.type == "IP_ADDRESS" and e.data == "8.8.8.8" for e in events), "No IP_ADDRESS emitted" + assert any(e.type == "OPEN_TCP_PORT" and e.data == "8.8.8.8:443" for e in events), "No OPEN_TCP_PORT emitted" + + +class TestMasscan1(TestMasscan): + modules_overrides = ["masscan"] + config_overrides = {"modules": {"masscan": {"ports": "443", "wait": 1, "use_cache": True}}} + + def check(self, module_test, events): + assert self.masscan_run == False + assert any(e.type == "IP_ADDRESS" and e.data == "8.8.8.8" for e in events), "No IP_ADDRESS emitted" + assert any(e.type == "OPEN_TCP_PORT" and e.data == "8.8.8.8:443" for e in events), "No OPEN_TCP_PORT emitted" diff --git a/bbot/test/test_step_1/module_tests/test_module_massdns.py b/bbot/test/test_step_1/module_tests/test_module_massdns.py index e69de29bb2..5d2fcdfb61 100644 --- a/bbot/test/test_step_1/module_tests/test_module_massdns.py +++ b/bbot/test/test_step_1/module_tests/test_module_massdns.py @@ -0,0 +1,16 @@ +from .base import ModuleTestBase, tempwordlist + + +class TestMassdns(ModuleTestBase): + subdomain_wordlist = tempwordlist(["www", "asdf"]) + config_overrides = {"modules": {"massdns": {"wordlist": str(subdomain_wordlist)}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://raw.githubusercontent.com/blacklanternsecurity/public-dns-servers/master/nameservers.txt", + text="8.8.8.8\n8.8.4.4\n1.1.1.1", + ) + + def check(self, module_test, events): + assert any(e.data == "www.blacklanternsecurity.com" for e in events) + assert not any(e.data == "asdf.blacklanternsecurity.com" for e 
in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_naabu.py b/bbot/test/test_step_1/module_tests/test_module_naabu.py index e69de29bb2..2f985d5a22 100644 --- a/bbot/test/test_step_1/module_tests/test_module_naabu.py +++ b/bbot/test/test_step_1/module_tests/test_module_naabu.py @@ -0,0 +1,11 @@ +from .base import ModuleTestBase + + +class TestNaabu(ModuleTestBase): + def setup_before_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "alive"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any(e.type == "OPEN_TCP_PORT" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_neo4j.py b/bbot/test/test_step_1/module_tests/test_module_neo4j.py index e69de29bb2..97cb754e0a 100644 --- a/bbot/test/test_step_1/module_tests/test_module_neo4j.py +++ b/bbot/test/test_step_1/module_tests/test_module_neo4j.py @@ -0,0 +1,16 @@ +from .base import ModuleTestBase + + +class TestNeo4j(ModuleTestBase): + def setup_before_prep(self, module_test): + class MockGraph: + def __init__(self, *args, **kwargs): + self.used = False + + def merge(self, *args, **kwargs): + self.used = True + + module_test.monkeypatch.setattr("py2neo.Graph", MockGraph) + + def check(self, module_test, events): + assert module_test.scan.modules["neo4j"].neo4j.graph.used == True diff --git a/bbot/test/test_step_1/module_tests/test_module_ntlm.py b/bbot/test/test_step_1/module_tests/test_module_ntlm.py index e69de29bb2..814e2578e7 100644 --- a/bbot/test/test_step_1/module_tests/test_module_ntlm.py +++ b/bbot/test/test_step_1/module_tests/test_module_ntlm.py @@ -0,0 +1,23 @@ +from .base import ModuleTestBase + + +class TestNTLM(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "ntlm"] + config_overrides = {"modules": {"ntlm": {"try_all": True}}} + + def setup_after_prep(self, module_test): + request_args = dict(uri="/", headers={"test": "header"}) + module_test.set_expect_requests(request_args, {}) + request_args = dict( + uri="/oab/", headers={"Authorization": "NTLM TlRMTVNTUAABAAAAl4II4gAAAAAAAAAAAAAAAAAAAAAKAGFKAAAADw=="} + ) + respond_args = dict( + headers={ + "WWW-Authenticate": "NTLM TlRMTVNTUAACAAAABgAGADgAAAAVgoni89aZT4Q0mH0AAAAAAAAAAHYAdgA+AAAABgGxHQAAAA9WAE4ATwACAAYAVgBOAE8AAQAKAEUAWABDADAAMQAEABIAdgBuAG8ALgBsAG8AYwBhAGwAAwAeAEUAWABDADAAMQAuAHYAbgBvAC4AbABvAGMAYQBsAAUAEgB2AG4AbwAuAGwAbwBjAGEAbAAHAAgAXxo0p/6L2QEAAAAA" + } + ) + module_test.set_expect_requests(request_args, respond_args) + + def check(self, module_test, events): + assert any(e.type == "FINDING" and "EXC01.vno.local" in e.data["description"] for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_nuclei.py b/bbot/test/test_step_1/module_tests/test_module_nuclei.py index e69de29bb2..b8eca8a3b5 100644 --- a/bbot/test/test_step_1/module_tests/test_module_nuclei.py +++ b/bbot/test/test_step_1/module_tests/test_module_nuclei.py @@ -0,0 +1,125 @@ +from .base import ModuleTestBase + + +class TestNucleiManual(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "excavate", "nuclei"] + config_overrides = { + "web_spider_distance": 1, + "web_spider_depth": 1, + "modules": { + "nuclei": { + "version": "2.9.4", + "mode": "manual", + "concurrency": 2, + "ratelimit": 10, + "templates": "/tmp/.bbot_test/tools/nuclei-templates/http/miscellaneous/", + "interactsh_disable": True, + "directory_only": False, + } + 
+        },
+    }
+
+    test_html = """
+<html>
+<head>
+<title>Index of /test</title>
+</head>
+<body>
+<h1>Index of /test</h1>
+<table>
+<tr><th>Name</th><th>Last modified</th><th>Size</th></tr>
+<tr><th colspan="3"><hr></th></tr>
+<tr><td><a href="/">Parent Directory</a></td><td>&nbsp;</td><td align="right">-</td></tr>
+<tr><th colspan="3"><hr></th></tr>
+</table>
+<address>Apache/2.4.38 (Debian) Server at http://127.0.0.1:8888/testmultipleruns.html</address>
+</body>
+</html>
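+<!-- excavate should follow the URL in the footer above to /testmultipleruns.html, whose "Copyright" page drives the second nuclei run checked below -->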
+ +""" + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": self.test_html} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + expect_args = {"method": "GET", "uri": "/testmultipleruns.html"} + respond_args = {"response_data": "Copyright 1984"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + first_run_detect = False + second_run_detect = False + for e in events: + if e.type == "FINDING": + if "Directory listing enabled" in e.data["description"]: + first_run_detect = True + elif "Copyright" in e.data["description"]: + second_run_detect = True + assert first_run_detect + assert second_run_detect + + +class TestNucleiSevere(TestNucleiManual): + modules_overrides = ["httpx", "nuclei"] + config_overrides = { + "modules": { + "nuclei": { + "mode": "severe", + "concurrency": 1, + "templates": "/tmp/.bbot_test/tools/nuclei-templates/vulnerabilities/generic/generic-linux-lfi.yaml", + } + }, + "interactsh_disable": True, + } + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/etc/passwd"} + respond_args = {"response_data": "root:.*:0:0:"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any( + e.type == "VULNERABILITY" and "Generic Linux - Local File Inclusion" in e.data["description"] + for e in events + ) + + +class TestNucleiTechnology(TestNucleiManual): + config_overrides = { + "interactsh_disable": True, + "modules": {"nuclei": {"mode": "technology", "concurrency": 2, "tags": "apache"}}, + } + + def setup_before_prep(self, module_test): + self.caplog = module_test.request_fixture.getfixturevalue("caplog") + expect_args = {"method": "GET", "uri": "/"} + respond_args = { + "response_data": "", + "headers": {"Server": "Apache/2.4.52 (Ubuntu)"}, + } + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + if "Using Interactsh Server" in self.caplog.text: + return False + assert any(e.type == "FINDING" and "apache" in e.data["description"] for e in events) + + +class TestNucleiBudget(TestNucleiManual): + config_overrides = { + "modules": { + "nuclei": { + "mode": "budget", + "concurrency": 1, + "tags": "spiderfoot", + "templates": "/tmp/.bbot_test/tools/nuclei-templates/exposed-panels/spiderfoot.yaml", + "interactsh_disable": True, + } + } + } + + def setup_before_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "SpiderFoot

+<p>support@spiderfoot.net</p>

"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any(e.type == "FINDING" and "SpiderFoot" in e.data["description"] for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_otx.py b/bbot/test/test_step_1/module_tests/test_module_otx.py index e69de29bb2..7481e29056 100644 --- a/bbot/test/test_step_1/module_tests/test_module_otx.py +++ b/bbot/test/test_step_1/module_tests/test_module_otx.py @@ -0,0 +1,27 @@ +from .base import ModuleTestBase + + +class TestOTX(ModuleTestBase): + def setup_after_prep(self, module_test): + module_test.httpx_mock.add_response( + url=f"https://otx.alienvault.com/api/v1/indicators/domain/blacklanternsecurity.com/passive_dns", + json={ + "passive_dns": [ + { + "address": "2606:50c0:8000::153", + "first": "2021-10-28T20:23:08", + "last": "2022-08-24T18:29:49", + "hostname": "asdf.blacklanternsecurity.com", + "record_type": "AAAA", + "indicator_link": "/indicator/hostname/www.blacklanternsecurity.com", + "flag_url": "assets/images/flags/us.png", + "flag_title": "United States", + "asset_type": "hostname", + "asn": "AS54113 fastly", + } + ] + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py b/bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py index e69de29bb2..c0ebbb3e04 100644 --- a/bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py +++ b/bbot/test/test_step_1/module_tests/test_module_paramminer_cookies.py @@ -0,0 +1,46 @@ +from .test_module_paramminer_headers import * + + +class TestParamminer_Cookies(TestParamminer_Headers): + modules_overrides = ["httpx", "paramminer_cookies"] + config_overrides = {"modules": {"paramminer_cookies": {"wordlist": tempwordlist(["junkcookie", "admincookie"])}}} + + cookies_body = """ + + the title + +

+    <p>Hello null!</p>
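+    <!-- baseline response: without the canary cookie the page greets "null" -->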

'; + + + """ + + cookies_body_match = """ + + the title + +

+    <p>Hello AAAAAAAAAAAAAA!</p>

'; + + + """ + + def setup_after_prep(self, module_test): + module_test.scan.modules["paramminer_cookies"].rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" + module_test.monkeypatch.setattr( + helper.HttpCompare, "gen_cache_buster", lambda *args, **kwargs: {"AAAAAA": "1"} + ) + expect_args = dict(headers={"Cookie": "admincookie=AAAAAAAAAAAAAA"}) + respond_args = {"response_data": self.cookies_body_match} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + respond_args = {"response_data": self.cookies_body} + module_test.set_expect_requests(respond_args=respond_args) + + def check(self, module_test, events): + assert any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [admincookie] Reasons: [body]" + for e in events + ) + assert not any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Cookie: [junkcookie] Reasons: [body]" + for e in events + ) diff --git a/bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py b/bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py index e69de29bb2..f6cbdebeac 100644 --- a/bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py +++ b/bbot/test/test_step_1/module_tests/test_module_paramminer_getparams.py @@ -0,0 +1,45 @@ +from .test_module_paramminer_headers import * + + +class TestParamminer_Getparams(TestParamminer_Headers): + modules_overrides = ["httpx", "paramminer_getparams"] + config_overrides = {"modules": {"paramminer_getparams": {"wordlist": tempwordlist(["canary", "id"])}}} + getparam_body = """ + + the title + +

+    <p>Hello null!</p>

'; + + + """ + + getparam_body_match = """ + + the title + +

+    <p>Hello AAAAAAAAAAAAAA!</p>

'; + + + """ + + def setup_after_prep(self, module_test): + module_test.scan.modules["paramminer_getparams"].rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" + module_test.monkeypatch.setattr( + helper.HttpCompare, "gen_cache_buster", lambda *args, **kwargs: {"AAAAAA": "1"} + ) + expect_args = {"query_string": b"id=AAAAAAAAAAAAAA&AAAAAA=1"} + respond_args = {"response_data": self.getparam_body_match} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + respond_args = {"response_data": self.getparam_body} + module_test.set_expect_requests(respond_args=respond_args) + + def check(self, module_test, events): + assert any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [id] Reasons: [body]" + for e in events + ) + assert not any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Getparam: [canary] Reasons: [body]" + for e in events + ) diff --git a/bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py b/bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py index e69de29bb2..7fc2e63959 100644 --- a/bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py +++ b/bbot/test/test_step_1/module_tests/test_module_paramminer_headers.py @@ -0,0 +1,49 @@ +from bbot.core.helpers import helper + +from .base import ModuleTestBase, tempwordlist + + +class TestParamminer_Headers(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "paramminer_headers"] + config_overrides = {"modules": {"paramminer_headers": {"wordlist": tempwordlist(["junkword1", "tracestate"])}}} + + headers_body = """ + + the title + +

+    <p>Hello null!</p>

'; + + + """ + + headers_body_match = """ + + the title + +

+    <p>Hello AAAAAAAAAAAAAA!</p>
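+    <!-- "AAAAAAAAAAAAAA" matches the rand_string value pinned in setup_after_prep, so its reflection here is what marks the parameter as discovered -->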

'; + + + """ + + def setup_after_prep(self, module_test): + module_test.scan.modules["paramminer_headers"].rand_string = lambda *args, **kwargs: "AAAAAAAAAAAAAA" + module_test.monkeypatch.setattr( + helper.HttpCompare, "gen_cache_buster", lambda *args, **kwargs: {"AAAAAA": "1"} + ) + expect_args = dict(headers={"tracestate": "AAAAAAAAAAAAAA"}) + respond_args = {"response_data": self.headers_body_match} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + respond_args = {"response_data": self.headers_body} + module_test.set_expect_requests(respond_args=respond_args) + + def check(self, module_test, events): + assert any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [tracestate] Reasons: [body]" + for e in events + ) + assert not any( + e.type == "FINDING" and e.data["description"] == "[Paramminer] Header: [junkword1] Reasons: [body]" + for e in events + ) From c915b557e34f1a062074728ff2effa28ec0eb44f Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sun, 21 May 2023 16:49:23 -0400 Subject: [PATCH 033/387] tests for passivetotal, pgp --- bbot/core/event/helpers.py | 4 +-- bbot/core/helpers/dns.py | 8 ++--- bbot/core/helpers/misc.py | 11 ++++++ bbot/core/helpers/regexes.py | 3 +- bbot/core/helpers/validators.py | 2 +- bbot/modules/crobat.py | 7 ++-- bbot/modules/passivetotal.py | 12 +++---- bbot/modules/pgp.py | 14 ++++---- .../module_tests/test_module_passivetotal.py | 21 +++++++++++ .../module_tests/test_module_pgp.py | 35 +++++++++++++++++++ bbot/test/test_step_2/test_helpers.py | 6 ++++ 11 files changed, 100 insertions(+), 23 deletions(-) diff --git a/bbot/core/event/helpers.py b/bbot/core/event/helpers.py index 5820183ec2..7213bc57b5 100644 --- a/bbot/core/event/helpers.py +++ b/bbot/core/event/helpers.py @@ -4,7 +4,7 @@ from bbot.core.errors import ValidationError from bbot.core.helpers import sha1, smart_decode, smart_decode_punycode -from bbot.core.helpers.regexes import event_type_regexes, event_id_regex, _hostname_regex +from bbot.core.helpers.regexes import event_type_regexes, event_id_regex, hostname_regex log = logging.getLogger("bbot.core.event.helpers") @@ -36,7 +36,7 @@ def get_event_type(data): return t # Assume DNS_NAME for basic words - if _hostname_regex.match(data): + if hostname_regex.match(data): return "DNS_NAME" raise ValidationError(f'Unable to autodetect event type from "{data}"') diff --git a/bbot/core/helpers/dns.py b/bbot/core/helpers/dns.py index 8135151ac2..48bb444cc4 100644 --- a/bbot/core/helpers/dns.py +++ b/bbot/core/helpers/dns.py @@ -9,7 +9,7 @@ from .regexes import dns_name_regex from bbot.core.helpers.async_helpers import NamedLock from bbot.core.errors import ValidationError, DNSError -from .misc import is_ip, is_domain, domain_parents, parent_domain, rand_string, cloudcheck +from .misc import is_ip, is_domain, is_dns_name, domain_parents, parent_domain, rand_string, cloudcheck log = logging.getLogger("bbot.core.helpers.dns") @@ -432,8 +432,8 @@ async def is_wildcard(self, query, ips=None, rdtype=None): """ result = {} - if is_ip(query): - return result + if not is_dns_name(query): + return {} # skip check if the query's parent domain is excluded in the config for d in self.wildcard_ignore: @@ -521,7 +521,7 @@ async def is_wildcard_domain(self, domain, log_info=False): wildcard_domain_results = {} domain = self._clean_dns_record(domain) - if is_ip(domain): + if not is_dns_name(domain): return {} # skip check if the query's parent domain is excluded in the config diff --git 
a/bbot/core/helpers/misc.py b/bbot/core/helpers/misc.py index 9f2fa15db8..ec4b9b20ec 100644 --- a/bbot/core/helpers/misc.py +++ b/bbot/core/helpers/misc.py @@ -214,6 +214,17 @@ def is_port(p): return p and p.isdigit() and 0 <= int(p) <= 65535 +def is_dns_name(d): + if is_ip(d): + return False + d = smart_decode(d) + if regexes.hostname_regex.match(d): + return True + if regexes.dns_name_regex.match(d): + return True + return False + + def is_ip(d, version=None): """ "192.168.1.1" --> True diff --git a/bbot/core/helpers/regexes.py b/bbot/core/helpers/regexes.py index c739ebb029..634257ca5f 100644 --- a/bbot/core/helpers/regexes.py +++ b/bbot/core/helpers/regexes.py @@ -22,7 +22,7 @@ _ipv6_regex = r"[A-F0-9:]*:[A-F0-9:]*:[A-F0-9:]*" ipv6_regex = re.compile(_ipv6_regex, re.I) _dns_name_regex = r"(?:(?:[\w-]+)\.)+(?:[^\W_0-9]{2,20})" -_hostname_regex = re.compile(r"^[\w-]+$") +_hostname_regex = r"^[\w-]+$" _email_regex = r"(?:[^\W_][\w\-\.\+]{,100})@(?:\w[\w\-\._]{,100})\.(?:[^\W_0-9]{2,8})" email_regex = re.compile(_email_regex, re.I) _ptr_regex = r"(?:[0-9]{1,3}[-_\.]){3}[0-9]{1,3}" @@ -61,3 +61,4 @@ event_id_regex = re.compile(r"[0-9a-f]{40}:[A-Z0-9_]+") dns_name_regex = re.compile(_dns_name_regex, re.I) scan_name_regex = re.compile(r"[a-z]{3,20}_[a-z]{3,20}") +hostname_regex = re.compile(_hostname_regex, re.I) diff --git a/bbot/core/helpers/validators.py b/bbot/core/helpers/validators.py index a1945802a5..5082a2dd31 100644 --- a/bbot/core/helpers/validators.py +++ b/bbot/core/helpers/validators.py @@ -62,7 +62,7 @@ def validate_host(host): for r in regexes.event_type_regexes["DNS_NAME"]: if r.match(host): return host - if regexes._hostname_regex.match(host): + if regexes.hostname_regex.match(host): return host assert False, f'Invalid hostname: "{host}"' diff --git a/bbot/modules/crobat.py b/bbot/modules/crobat.py index da4191911f..1db822eb8d 100644 --- a/bbot/modules/crobat.py +++ b/bbot/modules/crobat.py @@ -29,9 +29,10 @@ async def setup(self): return True async def _is_wildcard(self, query): - for domain, wildcard_rdtypes in (await self.helpers.is_wildcard_domain(query)).items(): - if any(t in wildcard_rdtypes for t in ("A", "AAAA", "CNAME")): - return True + if self.helpers.is_dns_name(query): + for domain, wildcard_rdtypes in (await self.helpers.is_wildcard_domain(query)).items(): + if any(t in wildcard_rdtypes for t in ("A", "AAAA", "CNAME")): + return True return False async def filter_event(self, event): diff --git a/bbot/modules/passivetotal.py b/bbot/modules/passivetotal.py index 27220bca35..83ebd1d7ae 100644 --- a/bbot/modules/passivetotal.py +++ b/bbot/modules/passivetotal.py @@ -11,15 +11,15 @@ class passivetotal(shodan_dns): base_url = "https://api.passivetotal.org/v2" - def setup(self): + async def setup(self): self.username = self.config.get("username", "") self.api_key = self.config.get("api_key", "") self.auth = (self.username, self.api_key) - return super().setup() + return await super().setup() - def ping(self): + async def ping(self): url = f"{self.base_url}/account/quota" - j = self.request_with_fail_count(url, auth=self.auth).json() + j = (await self.request_with_fail_count(url, auth=self.auth)).json() limit = j["user"]["limits"]["search_api"] used = j["user"]["counts"]["search_api"] assert used < limit, "No quota remaining" @@ -28,9 +28,9 @@ def abort_if(self, event): # RiskIQ is famous for their junk data return super().abort_if(event) or "unresolved" in event.tags - def request_url(self, query): + async def request_url(self, query): url = 
f"{self.base_url}/enrichment/subdomains?query={self.helpers.quote(query)}" - return self.request_with_fail_count(url, auth=self.auth) + return await self.request_with_fail_count(url, auth=self.auth) def parse_results(self, r, query): for subdomain in r.json().get("subdomains", []): diff --git a/bbot/modules/pgp.py b/bbot/modules/pgp.py index fe967cbe22..ce7098e27d 100644 --- a/bbot/modules/pgp.py +++ b/bbot/modules/pgp.py @@ -14,20 +14,22 @@ class pgp(crobat): } options_desc = {"search_urls": "PGP key servers to search"} - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - results = self.query(query) + results = await self.query(query) if results: for hostname in results: if not hostname == event: self.emit_event(hostname, "EMAIL_ADDRESS", event, abort_if=self.abort_if) - def query(self, query): + async def query(self, query): + results = set() for url in self.config.get("search_urls", []): url = url.replace("", self.helpers.quote(query)) - response = self.helpers.request(url) + response = await self.helpers.request(url) if response is not None: for email in self.helpers.extract_emails(response.text): email = email.lower() - if email.lower().endswith(query): - yield email + if email.endswith(query): + results.add(email) + return results diff --git a/bbot/test/test_step_1/module_tests/test_module_passivetotal.py b/bbot/test/test_step_1/module_tests/test_module_passivetotal.py index e69de29bb2..5d2835979b 100644 --- a/bbot/test/test_step_1/module_tests/test_module_passivetotal.py +++ b/bbot/test/test_step_1/module_tests/test_module_passivetotal.py @@ -0,0 +1,21 @@ +from .base import ModuleTestBase + + +class TestPassiveTotal(ModuleTestBase): + config_overrides = {"modules": {"passivetotal": {"username": "jon@bls.fakedomain", "api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.passivetotal.org/v2/account/quota", + json={"user": {"counts": {"search_api": 10}, "limits": {"search_api": 20}}}, + ) + module_test.httpx_mock.add_response( + url="https://api.passivetotal.org/v2/enrichment/subdomains?query=blacklanternsecurity.com", + json={"subdomains": ["asdf"]}, + ) + + def setup_after_prep(self, module_test): + module_test.monkeypatch.setattr(module_test.scan.modules["passivetotal"], "abort_if", lambda e: False) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_pgp.py b/bbot/test/test_step_1/module_tests/test_module_pgp.py index e69de29bb2..dac4152577 100644 --- a/bbot/test/test_step_1/module_tests/test_module_pgp.py +++ b/bbot/test/test_step_1/module_tests/test_module_pgp.py @@ -0,0 +1,35 @@ +from .base import ModuleTestBase + + +class TestPGP(ModuleTestBase): + web_body = """ + + +Search results for 'blacklanternsecurity.com' + + +

+<h1>Search results for 'blacklanternsecurity.com'</h1>
+<pre>
+Type bits/keyID            cr. time   exp time   key expir
+
+pub eddsa263/0xd4e98af823deadbeef 2022-09-14T15:11:31Z
+
+uid Asdf <asdf@blacklanternsecurity.com>
+sig  sig  0xd4e98af823deadbeef 2022-09-14T15:11:31Z 2024-09-14T17:00:00Z ____________________ [selfsig]
+</pre>
+</body>
+</html>
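+<!-- the pgp module extracts every address ending in the query domain from this page -->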
+""" + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://keyserver.ubuntu.com/pks/lookup?fingerprint=on&op=vindex&search=blacklanternsecurity.com", + text=self.web_body, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf@blacklanternsecurity.com" for e in events), "Failed to detect email" diff --git a/bbot/test/test_step_2/test_helpers.py b/bbot/test/test_step_2/test_helpers.py index 9639f6110c..ec91009b67 100644 --- a/bbot/test/test_step_2/test_helpers.py +++ b/bbot/test/test_step_2/test_helpers.py @@ -79,6 +79,12 @@ async def test_helpers(helpers, scan, bbot_scanner, bbot_config, bbot_httpserver ] assert helpers.is_ip("127.0.0.1") assert not helpers.is_ip("127.0.0.0.1") + assert helpers.is_dns_name("evilcorp.com") + assert helpers.is_dns_name("evilcorp") + assert helpers.is_dns_name("ドメイン.テスト") + assert not helpers.is_dns_name("127.0.0.1") + assert not helpers.is_dns_name("dead::beef") + assert not helpers.is_dns_name("bob@evilcorp.com") assert helpers.domain_stem("evilcorp.co.uk") == "evilcorp" assert helpers.domain_stem("www.evilcorp.co.uk") == "www.evilcorp" From ca55a854c9b50ca45ec7a2ead2ea2ad63ca9b825 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sun, 21 May 2023 20:47:41 -0400 Subject: [PATCH 034/387] tests for riddler, rapiddns, python --- bbot/modules/rapiddns.py | 5 +++-- bbot/modules/riddler.py | 5 +++-- .../module_tests/test_module_python.py | 6 ++++++ .../module_tests/test_module_rapiddns.py | 16 ++++++++++++++++ .../module_tests/test_module_riddler.py | 16 ++++++++++++++++ 5 files changed, 44 insertions(+), 4 deletions(-) diff --git a/bbot/modules/rapiddns.py b/bbot/modules/rapiddns.py index 61bfa767dd..0af7e39306 100644 --- a/bbot/modules/rapiddns.py +++ b/bbot/modules/rapiddns.py @@ -9,9 +9,10 @@ class rapiddns(crobat): base_url = "https://rapiddns.io" - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/subdomain/{self.helpers.quote(query)}?full=1#result" - return self.request_with_fail_count(url) + response = await self.request_with_fail_count(url) + return response def parse_results(self, r, query): results = set() diff --git a/bbot/modules/riddler.py b/bbot/modules/riddler.py index a7128943c8..c6f865ee10 100644 --- a/bbot/modules/riddler.py +++ b/bbot/modules/riddler.py @@ -9,9 +9,10 @@ class riddler(crobat): base_url = "https://riddler.io" - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/search/exportcsv?q=pld:{self.helpers.quote(query)}" - return self.request_with_fail_count(url) + response = await self.request_with_fail_count(url) + return response def parse_results(self, r, query): results = set() diff --git a/bbot/test/test_step_1/module_tests/test_module_python.py b/bbot/test/test_step_1/module_tests/test_module_python.py index e69de29bb2..eb1628437b 100644 --- a/bbot/test/test_step_1/module_tests/test_module_python.py +++ b/bbot/test/test_step_1/module_tests/test_module_python.py @@ -0,0 +1,6 @@ +from .base import ModuleTestBase + + +class TestPython(ModuleTestBase): + def check(self, module_test, events): + assert any(e.data == "blacklanternsecurity.com" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_rapiddns.py b/bbot/test/test_step_1/module_tests/test_module_rapiddns.py index e69de29bb2..e324a5ac14 100644 --- a/bbot/test/test_step_1/module_tests/test_module_rapiddns.py +++ b/bbot/test/test_step_1/module_tests/test_module_rapiddns.py @@ -0,0 +1,16 @@ +from .base import 
ModuleTestBase + + +class TestRapidDNS(ModuleTestBase): + web_body = """12 +asdf.blacklanternsecurity.com +asdf.blacklanternsecurity.com.""" + + def setup_after_prep(self, module_test): + module_test.module.abort_if = lambda e: False + module_test.httpx_mock.add_response( + url=f"https://rapiddns.io/subdomain/blacklanternsecurity.com?full=1#result", text=self.web_body + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_riddler.py b/bbot/test/test_step_1/module_tests/test_module_riddler.py index e69de29bb2..f06a0513b0 100644 --- a/bbot/test/test_step_1/module_tests/test_module_riddler.py +++ b/bbot/test/test_step_1/module_tests/test_module_riddler.py @@ -0,0 +1,16 @@ +from .base import ModuleTestBase + + +class TestRiddler(ModuleTestBase): + web_body = """12 +asdf.blacklanternsecurity.com +asdf.blacklanternsecurity.com.""" + + def setup_after_prep(self, module_test): + module_test.module.abort_if = lambda e: False + module_test.httpx_mock.add_response( + url=f"https://riddler.io/search/exportcsv?q=pld:blacklanternsecurity.com", text=self.web_body + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" From 29845eb21ac3669e5b1b898cd49f603f0229dd4b Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Sun, 21 May 2023 21:33:38 -0400 Subject: [PATCH 035/387] skymem, shodan, securitytrails, secretsdb tests --- bbot/modules/securitytrails.py | 14 +- bbot/modules/shodan_dns.py | 8 +- bbot/modules/skymem.py | 11 +- .../module_tests/test_module_robots.py | 42 + .../module_tests/test_module_secretsdb.py | 22 + .../test_module_securitytrails.py | 21 + .../module_tests/test_module_shodan_dns.py | 21 + .../module_tests/test_module_skymem.py | 1222 +++++++++++++++++ 8 files changed, 1347 insertions(+), 14 deletions(-) diff --git a/bbot/modules/securitytrails.py b/bbot/modules/securitytrails.py index 592616ae55..d58b227e50 100644 --- a/bbot/modules/securitytrails.py +++ b/bbot/modules/securitytrails.py @@ -11,18 +11,20 @@ class securitytrails(shodan_dns): base_url = "https://api.securitytrails.com/v1" - def setup(self): + async def setup(self): self.limit = 100 - return super().setup() + return await super().setup() - def ping(self): - r = self.request_with_fail_count(f"{self.base_url}/ping?apikey={self.api_key}") + async def ping(self): + url = f"{self.base_url}/ping?apikey={self.api_key}" + r = await self.request_with_fail_count(url) resp_content = getattr(r, "text", "") assert getattr(r, "status_code", 0) == 200, resp_content - def request_url(self, query): + async def request_url(self, query): url = f"{self.base_url}/domain/{query}/subdomains?apikey={self.api_key}" - return self.request_with_fail_count(url) + response = await self.request_with_fail_count(url) + return response def parse_results(self, r, query): j = r.json() diff --git a/bbot/modules/shodan_dns.py b/bbot/modules/shodan_dns.py index 5323e74a40..c94d0ac203 100644 --- a/bbot/modules/shodan_dns.py +++ b/bbot/modules/shodan_dns.py @@ -21,16 +21,18 @@ async def setup(self): return await self.require_api_key() async def ping(self): - r = await self.request_with_fail_count(f"{self.base_url}/api-info?key={self.api_key}") + url = f"{self.base_url}/api-info?key={self.api_key}" + r = await self.request_with_fail_count(url) resp_content = getattr(r, "text", "") assert getattr(r, "status_code", 0) == 200, 
resp_content async def request_url(self, query): url = f"{self.base_url}/dns/domain/{self.helpers.quote(query)}?key={self.api_key}" - return await self.request_with_fail_count(url) + response = await self.request_with_fail_count(url) + return response def parse_results(self, r, query): json = r.json() if json: - for hostname in json.get("subdomains"): + for hostname in json.get("subdomains", []): yield f"{hostname}.{query}" diff --git a/bbot/modules/skymem.py b/bbot/modules/skymem.py index e319cc6dba..56f5e39f65 100644 --- a/bbot/modules/skymem.py +++ b/bbot/modules/skymem.py @@ -11,14 +11,14 @@ class skymem(emailformat): base_url = "https://www.skymem.info" - def handle_event(self, event): + async def handle_event(self, event): _, query = self.helpers.split_domain(event.data) # get first page url = f"{self.base_url}/srch?q={self.helpers.quote(query)}" - r = self.request_with_fail_count(url) + r = await self.request_with_fail_count(url) if not r: return - for email in self.extract_emails(r.text): + for email in self.helpers.extract_emails(r.text): self.emit_event(email, "EMAIL_ADDRESS", source=event) # iterate through other pages @@ -27,12 +27,13 @@ def handle_event(self, event): return domain_id = domain_ids[0] for page in range(2, 22): - r2 = self.request_with_fail_count(f"{self.base_url}/domain/{domain_id}?p={page}") + r2 = await self.request_with_fail_count(f"{self.base_url}/domain/{domain_id}?p={page}") if not r2: continue - for email in self.extract_emails(r2.text): + for email in self.helpers.extract_emails(r2.text): self.emit_event(email, "EMAIL_ADDRESS", source=event) pages = re.findall(r"/domain/" + domain_id + r"\?p=(\d+)", r2.text) + self.critical(pages) if not pages: break last_page = max([int(p) for p in pages]) diff --git a/bbot/test/test_step_1/module_tests/test_module_robots.py b/bbot/test/test_step_1/module_tests/test_module_robots.py index e69de29bb2..aba68778fc 100644 --- a/bbot/test/test_step_1/module_tests/test_module_robots.py +++ b/bbot/test/test_step_1/module_tests/test_module_robots.py @@ -0,0 +1,42 @@ +import re +from .base import ModuleTestBase + + +class TestRobots(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "robots"] + config_overrides = {"modules": {"robots": {"include_sitemap": True}}} + + def setup_after_prep(self, module_test): + sample_robots = f"Allow: /allow/\nDisallow: /disallow/\nJunk: test.com\nDisallow: /*/wildcard.txt\nSitemap: {self.targets[0]}/sitemap.txt" + + expect_args = {"method": "GET", "uri": "/robots.txt"} + respond_args = {"response_data": sample_robots} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + allow_bool = False + disallow_bool = False + sitemap_bool = False + wildcard_bool = False + + for e in events: + if e.type == "URL_UNVERIFIED": + if str(e.module) != "TARGET": + assert "spider-danger" in e.tags, f"{e} doesn't have spider-danger tag" + if e.data == "http://127.0.0.1:8888/allow/": + allow_bool = True + + if e.data == "http://127.0.0.1:8888/disallow/": + disallow_bool = True + + if e.data == "http://127.0.0.1:8888/sitemap.txt": + sitemap_bool = True + + if re.match(r"http://127\.0\.0\.1:8888/\w+/wildcard\.txt", e.data): + wildcard_bool = True + + assert allow_bool + assert disallow_bool + assert sitemap_bool + assert wildcard_bool diff --git a/bbot/test/test_step_1/module_tests/test_module_secretsdb.py b/bbot/test/test_step_1/module_tests/test_module_secretsdb.py index e69de29bb2..5c0d1a00df 100644 --- 
a/bbot/test/test_step_1/module_tests/test_module_secretsdb.py +++ b/bbot/test/test_step_1/module_tests/test_module_secretsdb.py @@ -0,0 +1,22 @@ +from .base import ModuleTestBase + + +class TestSecretsDB(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "secretsdb"] + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://raw.githubusercontent.com/blacklanternsecurity/secrets-patterns-db/master/db/rules-stable.yml", + text="""patterns: +- pattern: + confidence: 99 + name: Asymmetric Private Key + regex: '-----BEGIN ((EC|PGP|DSA|RSA|OPENSSH) )?PRIVATE KEY( BLOCK)?-----'""", + ) + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "-----BEGIN PGP PRIVATE KEY BLOCK-----"} + module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args) + + def check(self, module_test, events): + assert any(e.type == "FINDING" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_securitytrails.py b/bbot/test/test_step_1/module_tests/test_module_securitytrails.py index e69de29bb2..8e015baf88 100644 --- a/bbot/test/test_step_1/module_tests/test_module_securitytrails.py +++ b/bbot/test/test_step_1/module_tests/test_module_securitytrails.py @@ -0,0 +1,21 @@ +from .base import ModuleTestBase + + +class TestSecurityTrails(ModuleTestBase): + config_overrides = {"modules": {"securitytrails": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.securitytrails.com/v1/ping?apikey=asdf", + ) + module_test.httpx_mock.add_response( + url="https://api.securitytrails.com/v1/domain/blacklanternsecurity.com/subdomains?apikey=asdf", + json={ + "subdomains": [ + "asdf", + ], + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_shodan_dns.py b/bbot/test/test_step_1/module_tests/test_module_shodan_dns.py index e69de29bb2..dfe19dfaec 100644 --- a/bbot/test/test_step_1/module_tests/test_module_shodan_dns.py +++ b/bbot/test/test_step_1/module_tests/test_module_shodan_dns.py @@ -0,0 +1,21 @@ +from .base import ModuleTestBase + + +class TestShodan_DNS(ModuleTestBase): + config_overrides = {"modules": {"shodan_dns": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://api.shodan.io/api-info?key=asdf", + ) + module_test.httpx_mock.add_response( + url="https://api.shodan.io/dns/domain/blacklanternsecurity.com?key=asdf", + json={ + "subdomains": [ + "asdf", + ], + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_skymem.py b/bbot/test/test_step_1/module_tests/test_module_skymem.py index e69de29bb2..a7c7268b1a 100644 --- a/bbot/test/test_step_1/module_tests/test_module_skymem.py +++ b/bbot/test/test_step_1/module_tests/test_module_skymem.py @@ -0,0 +1,1222 @@ +from .base import ModuleTestBase + + +class TestSkymem(ModuleTestBase): + targets = ["blacklanternsecurity.com"] + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://www.skymem.info/srch?q=blacklanternsecurity.com", + text=page_1_body, + ) + module_test.httpx_mock.add_response( + 
url="https://www.skymem.info/domain/5679236812ad5b3f748a413d?p=2", + text=page_2_body, + ) + module_test.httpx_mock.add_response( + url="https://www.skymem.info/domain/5679236812ad5b3f748a413d?p=3", + text=page_3_body, + ) + + def check(self, module_test, events): + assert any(e.data == "page1email@blacklanternsecurity.com" for e in events), "Failed to detect first email" + assert any(e.data == "page2email@blacklanternsecurity.com" for e in events), "Failed to detect second email" + assert any(e.data == "page3email@blacklanternsecurity.com" for e in events), "Failed to detect third email" + + +page_1_body = """ + + + + + + + q=blacklanternsecurity.com - blacklanternsecurity.com=1768 emails + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
+<body>
+<h1>Emails of blacklanternsecurity.com</h1>
+<table>
+<tr><td><a href="mailto:page1email@blacklanternsecurity.com">page1email@blacklanternsecurity.com</a></td></tr>
+</table>
+<a href="/domain/5679236812ad5b3f748a413d?p=2">More emails of blacklanternsecurity.com</a>
+</body>
+</html>
+"""
+page_2_body = """
+<html>
+<head>
+<title>q=blacklanternsecurity.com - blacklanternsecurity.com=1768 emails</title>
+</head>
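+<!-- page 2 of the paginated results; the ?p=3 link below keeps the module paging -->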
+<body>
+<h1>Emails of blacklanternsecurity.com</h1>
+<table>
+<tr><td><a href="mailto:page2email@blacklanternsecurity.com">page2email@blacklanternsecurity.com</a></td></tr>
+</table>
+<a href="/domain/5679236812ad5b3f748a413d?p=3">Next page</a>
+</body>
+</html>
+"""
+page_3_body = """
+<html>
+<head>
+<title>q=blacklanternsecurity.com - blacklanternsecurity.com=1768 emails</title>
+</head>
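+<!-- final page: no further ?p= links, so pagination stops after the third email -->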
+<body>
+<h1>Emails of blacklanternsecurity.com</h1>
+<table>
+<tr><td><a href="mailto:page3email@blacklanternsecurity.com">page3email@blacklanternsecurity.com</a></td></tr>
+</table>
+</body>
+</html>
+ + + + + + + + + + + + + + + + +""" From 516bf8d3ad97a0ad4321d37932f002d2ea328150 Mon Sep 17 00:00:00 2001 From: TheTechromancer Date: Mon, 22 May 2023 01:18:00 -0400 Subject: [PATCH 036/387] tests for ntlm, social, speculate, sublist3r, telerik, threatminer, url_manipulation, urlscan, viewdns, virustotal, wafw00f, wappalyzer --- bbot/core/helpers/web.py | 5 +- bbot/modules/ntlm.py | 3 +- bbot/modules/threatminer.py | 8 +- bbot/modules/url_manipulation.py | 2 +- bbot/modules/urlscan.py | 21 +- bbot/modules/viewdns.py | 13 +- bbot/modules/virustotal.py | 11 +- bbot/modules/wappalyzer.py | 8 +- .../module_tests/test_module_social.py | 14 + .../module_tests/test_module_speculate.py | 22 ++ .../test_module_subdomain_hijack.py | 44 +++ .../module_tests/test_module_sublist3r.py | 13 + .../module_tests/test_module_telerik.py | 74 ++++ .../module_tests/test_module_threatminer.py | 12 + .../test_module_url_manipulation.py | 39 ++ .../module_tests/test_module_urlscan.py | 58 +++ .../module_tests/test_module_viewdns.py | 333 ++++++++++++++++++ .../module_tests/test_module_virustotal.py | 51 +++ .../module_tests/test_module_wafw00f.py | 14 + .../module_tests/test_module_wappalyzer.py | 20 ++ 20 files changed, 733 insertions(+), 32 deletions(-) diff --git a/bbot/core/helpers/web.py b/bbot/core/helpers/web.py index d47b6289f2..f111071273 100644 --- a/bbot/core/helpers/web.py +++ b/bbot/core/helpers/web.py @@ -119,7 +119,7 @@ async def download(self, url, **kwargs): cache_hrs = float(kwargs.pop("cache_hrs", -1)) log.debug(f"Downloading file from {url} with cache_hrs={cache_hrs}") if cache_hrs > 0 and self.parent_helper.is_cached(url): - log.debug(f"{url} is cached") + log.debug(f"{url} is cached at {self.parent_helper.cache_filename(url)}") success = True else: # kwargs["raise_error"] = True @@ -175,9 +175,6 @@ async def api_page_iter(self, url, page_size=100, json=True, **requests_kwargs): offset = 0 while 1: new_url = url.format(page=page, page_size=page_size, offset=offset) - data = requests_kwargs.get("data", None) - if data is not None: - requests_kwargs["data"] = requests_kwargs["data"].format(page=page, page_size=page_size, offset=offset) result = await self.request(new_url, **requests_kwargs) try: if json: diff --git a/bbot/modules/ntlm.py b/bbot/modules/ntlm.py index a5d2fed372..6f5f535d0e 100644 --- a/bbot/modules/ntlm.py +++ b/bbot/modules/ntlm.py @@ -3,7 +3,8 @@ ntlm_discovery_endpoints = [ "", - "autodiscover/autodiscover.xml" "ecp/", + "autodiscover/autodiscover.xml", + "ecp/", "ews/", "ews/exchange.asmx", "exchange/", diff --git a/bbot/modules/threatminer.py b/bbot/modules/threatminer.py index 3f6c99f2fe..066e4c3bb1 100644 --- a/bbot/modules/threatminer.py +++ b/bbot/modules/threatminer.py @@ -11,9 +11,11 @@ class threatminer(crobat): base_url = "https://api.threatminer.org/v2" - def request_url(self, query): - return self.request_with_fail_count(f"{self.base_url}/domain.php?q={self.helpers.quote(query)}&rt=5") + async def request_url(self, query): + url = f"{self.base_url}/domain.php?q={self.helpers.quote(query)}&rt=5" + r = await self.request_with_fail_count(url) + return r def parse_results(self, r, query): j = r.json() - yield from j.get("results", []) + return list(j.get("results", [])) diff --git a/bbot/modules/url_manipulation.py b/bbot/modules/url_manipulation.py index 851761dc2a..1af1316ccc 100644 --- a/bbot/modules/url_manipulation.py +++ b/bbot/modules/url_manipulation.py @@ -78,7 +78,7 @@ async def handle_event(self, event): else: self.debug("Ignoring positive result due to 
presence of parameter name in result") - def filter_event(self, event): + async def filter_event(self, event): accepted_status_codes = ["200", "301", "302"] for c in accepted_status_codes: diff --git a/bbot/modules/urlscan.py b/bbot/modules/urlscan.py index 2b3b92400d..320c327618 100644 --- a/bbot/modules/urlscan.py +++ b/bbot/modules/urlscan.py @@ -13,13 +13,13 @@ class urlscan(crobat): base_url = "https://urlscan.io/api/v1" - def setup(self): + async def setup(self): self.urls = self.config.get("urls", False) - return super().setup() + return await super().setup() - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - for domain, url in self.query(query): + for domain, url in await self.query(query): source_event = event if domain and domain != query: domain_event = self.make_event(domain, "DNS_NAME", source=event) @@ -38,10 +38,12 @@ def handle_event(self, event): else: self.debug(f"{url_event.host} does not match {query}") - def query(self, query): - results = self.helpers.request(f"{self.base_url}/search/?q={self.helpers.quote(query)}") + async def query(self, query): + results = set() + url = f"{self.base_url}/search/?q={self.helpers.quote(query)}" + r = await self.helpers.request(url) try: - json = results.json() + json = r.json() if json and type(json) == dict: for result in json.get("results", []): if result and type(result) == dict: @@ -50,14 +52,15 @@ def query(self, query): domain = task.get("domain", "") url = task.get("url", "") if domain or url: - yield domain, url + results.add((domain, url)) page = result.get("page", {}) if page and type(page) == dict: domain = page.get("domain", "") url = page.get("url", "") if domain or url: - yield domain, url + results.add((domain, url)) else: self.debug(f'No results for "{query}"') except Exception: self.verbose(f"Error retrieving urlscan results") + return results diff --git a/bbot/modules/viewdns.py b/bbot/modules/viewdns.py index 0714bdc8e5..8ddc3e818c 100644 --- a/bbot/modules/viewdns.py +++ b/bbot/modules/viewdns.py @@ -39,6 +39,7 @@ async def handle_event(self, event): # todo: registrar? 
     async def query(self, query):
+        results = set()
         url = f"{self.base_url}/reversewhois/?q={query}"
         r = await self.helpers.request(url)
         status_code = getattr(r, "status_code", 0)
@@ -47,7 +48,7 @@ async def query(self, query):
         content = getattr(r, "content", b"")
         html = BeautifulSoup(content, features="lxml")
-        yielded = set()
+        found = set()
         for table_row in html.findAll("tr"):
             table_cells = table_row.findAll("td")
             # make double-sure we're in the right table by checking the date field
@@ -58,10 +59,12 @@ async def query(self, query):
                 # registrar == last cell
                 registrar = table_cells[-1].text.strip()
                 if domain and not domain == query:
-                    to_yield = (domain, registrar)
-                    to_yield_hash = hash(to_yield)
-                    if to_yield_hash not in yielded:
-                        yield to_yield
+                    result = (domain, registrar)
+                    result_hash = hash(result)
+                    if result_hash not in found:
+                        found.add(result_hash)
+                        results.add(result)
             except IndexError:
                 self.debug(f"Invalid row {str(table_row)[:40]}...")
                 continue
+        return results
diff --git a/bbot/modules/virustotal.py b/bbot/modules/virustotal.py
index 1a15985620..dac8ee6335 100644
--- a/bbot/modules/virustotal.py
+++ b/bbot/modules/virustotal.py
@@ -11,18 +11,19 @@ class virustotal(shodan_dns):
 
     base_url = "https://www.virustotal.com/api/v3"
 
-    def setup(self):
+    async def setup(self):
         self.api_key = self.config.get("api_key", "")
         self.headers = {"x-apikey": self.api_key}
-        return super().setup()
+        return await super().setup()
 
-    def ping(self):
+    async def ping(self):
         # virustotal does not have a ping function
         return
 
-    def request_url(self, query):
+    async def request_url(self, query):
         url = f"{self.base_url}/domains/{self.helpers.quote(query)}/subdomains"
-        return self.request_with_fail_count(url, headers=self.headers)
+        r = await self.request_with_fail_count(url, headers=self.headers)
+        return r
 
     def parse_results(self, r, query):
         results = set()
diff --git a/bbot/modules/wappalyzer.py b/bbot/modules/wappalyzer.py
index 5d4e51fa54..a372d1791d 100644
--- a/bbot/modules/wappalyzer.py
+++ b/bbot/modules/wappalyzer.py
@@ -22,12 +22,12 @@ class wappalyzer(BaseModule):
     scope_distance_modifier = None
     max_event_handlers = 5
 
-    def setup(self):
-        self.wappalyzer = Wappalyzer.latest()
+    async def setup(self):
+        self.wappalyzer = await self.scan.run_in_executor(Wappalyzer.latest)
         return True
 
-    def handle_event(self, event):
-        for res in self.wappalyze(event.data):
+    async def handle_event(self, event):
+        for res in await self.scan.run_in_executor(self.wappalyze, event.data):
             self.emit_event(
                 {"technology": res.lower(), "url": event.data["url"], "host": str(event.host)}, "TECHNOLOGY", event
             )
diff --git a/bbot/test/test_step_1/module_tests/test_module_social.py b/bbot/test/test_step_1/module_tests/test_module_social.py
index e69de29bb2..caded2ec78 100644
--- a/bbot/test/test_step_1/module_tests/test_module_social.py
+++ b/bbot/test/test_step_1/module_tests/test_module_social.py
@@ -0,0 +1,14 @@
+from .base import ModuleTestBase
+
+
+class TestSocial(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    modules_overrides = ["httpx", "excavate", "social"]
+
+    def setup_after_prep(self, module_test):
+        expect_args = {"method": "GET", "uri": "/"}
+        respond_args = {"response_data": '<html><a href="https://discord.gg/asdf"></a></html>'}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+    def check(self, module_test, events):
+        assert any(e.type == "SOCIAL" and e.data["platform"] == "discord" for e in events)
diff --git a/bbot/test/test_step_1/module_tests/test_module_speculate.py b/bbot/test/test_step_1/module_tests/test_module_speculate.py
index e69de29bb2..27156707bf 100644
--- a/bbot/test/test_step_1/module_tests/test_module_speculate.py
+++ b/bbot/test/test_step_1/module_tests/test_module_speculate.py
@@ -0,0 +1,22 @@
+from .base import ModuleTestBase
+
+
+class TestSpeculate_Subdirectories(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888/subdir1/subdir2/"]
+    modules_overrides = ["httpx", "speculate"]
+
+    def setup_after_prep(self, module_test):
+        expect_args = {"method": "GET", "uri": "/"}
+        respond_args = {"response_data": "alive"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/subdir1/"}
+        respond_args = {"response_data": "alive"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/subdir1/subdir2/"}
+        respond_args = {"response_data": "alive"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+    def check(self, module_test, events):
+        assert any(e.type == "URL_UNVERIFIED" and e.data == "http://127.0.0.1:8888/subdir1/" for e in events)
diff --git a/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py b/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py
index e69de29bb2..c0c1006279 100644
--- a/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py
+++ b/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py
@@ -0,0 +1,44 @@
+from .base import ModuleTestBase
+
+
+class TestSubdomain_Hijack(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    modules_overrides = ["httpx", "excavate", "subdomain_hijack"]
+
+    def setup_before_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url="https://raw.githubusercontent.com/EdOverflow/can-i-take-over-xyz/master/fingerprints.json",
+            json=[
+                {
+                    "cicd_pass": True,
+                    "cname": ["us-east-1.elasticbeanstalk.com"],
+                    "discussion": "[Issue #194](https://github.com/EdOverflow/can-i-take-over-xyz/issues/194)",
+                    "documentation": "",
+                    "fingerprint": "NXDOMAIN",
+                    "http_status": None,
+                    "nxdomain": True,
+                    "service": "AWS/Elastic Beanstalk",
+                    "status": "Vulnerable",
+                    "vulnerable": True,
+                }
+            ],
+        )
+
+    def setup_after_prep(self, module_test):
+        fingerprints = module_test.module.fingerprints
+        assert fingerprints, "No subdomain hijacking fingerprints available"
+        fingerprint = next(iter(fingerprints))
+        rand_string = module_test.scan.helpers.rand_string(length=15, digits=False)
+        self.rand_subdomain = f"{rand_string}.{next(iter(fingerprint.domains))}"
+        module_test.log.critical(self.rand_subdomain)
+        respond_args = {"response_data": f'<a href="https://{self.rand_subdomain}"/>'}
+        module_test.set_expect_requests(respond_args=respond_args)
+
+    def check(self, module_test, events):
+        assert any(
+            event.type == "FINDING"
+            and event.data["description"].startswith("Hijackable Subdomain")
+            and self.rand_subdomain in event.data["description"]
+            and event.data["host"] == self.rand_subdomain
+            for event in events
+        ), f"No hijackable subdomains in {events}"
diff --git a/bbot/test/test_step_1/module_tests/test_module_sublist3r.py b/bbot/test/test_step_1/module_tests/test_module_sublist3r.py
index e69de29bb2..a7cacd2310 100644
--- a/bbot/test/test_step_1/module_tests/test_module_sublist3r.py
+++ b/bbot/test/test_step_1/module_tests/test_module_sublist3r.py
@@ -0,0 +1,13 @@
+from .base import ModuleTestBase
+
+
+class TestSublist3r(ModuleTestBase):
+    def setup_after_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url=f"https://api.sublist3r.com/search.php?domain=blacklanternsecurity.com",
+            json=["asdf.blacklanternsecurity.com", "zzzz.blacklanternsecurity.com"],
+        )
+
+    def check(self, module_test, events):
+        assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain"
+        assert any(e.data == "zzzz.blacklanternsecurity.com" for e in events), "Failed to detect subdomain"
diff --git a/bbot/test/test_step_1/module_tests/test_module_telerik.py b/bbot/test/test_step_1/module_tests/test_module_telerik.py
index e69de29bb2..3e6dba2299 100644
--- a/bbot/test/test_step_1/module_tests/test_module_telerik.py
+++ b/bbot/test/test_step_1/module_tests/test_module_telerik.py
@@ -0,0 +1,74 @@
+import re
+from .base import ModuleTestBase
+
+
+class TestTelerik(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    modules_overrides = ["httpx", "telerik"]
+    config_overrides = {"modules": {"telerik": {"exploit_RAU_crypto": True}}}
+
+    def setup_before_prep(self, module_test):
+        # Simulate Telerik.Web.UI.WebResource.axd?type=rau detection
+        expect_args = {"method": "GET", "uri": "/Telerik.Web.UI.WebResource.axd", "query_string": "type=rau"}
+        respond_args = {
+            "response_data": '{ "message" : "RadAsyncUpload handler is registered succesfully, however, it may not be accessed directly." }'
+        }
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        # Simulate Vulnerable Telerik.Web.UI.WebResource.axd
+        vuln_data = "ATTu5i4R+ViNFYO6kst0jC11wM/1iqH+W/isjhaDjNuCI7eJ/BY5d1E9eqZK27CJCMuon9u8/hgRIM/cTlgLlv4qOYjPBjs81Y3dAZAdtIr3TXiCmZi9M09a1BYMxjvGKfVky3b7PoOppeWS/3rglTwL1e8oyqLGx2NKUH5y8Cd+kLKV2f31J1sV4I5HTDKgDmvziJp3zlDrCb0Fi9ilKH+O1cbVx6SdBop/U30FxLaB/QIbt2N1rQHREJ5Skpgo7dilPxzBaTObdBhCVyB/FiJhenS/0u3h0Mpi6+A40SylICcyyxQha7+Uh7lEJ8Ne+2eTs4WqcaaQbvIhy7oHc+D0soxRKMZRjo7Up+UWHQJJh6KtWSCxUESNSdNcxjPQZE9HqsPlldVlkeC+ehSGce5bR0Ylots6Iz1OoCgMEWwxByeG3VzgxF6XpitL61A1hFcNo9euSTnCfOWh0vrQHON7DN5LpM9xr7SoD0Dnu01hZ9NS1PHhPLyN5WS87u5qdZp/z3Sxwc3wawIdo62RNf4Iz2gAKJZnPfxrE1mRn5kBe7f6O44rcuv6lcdao/DGlwbERKwRI6/n+FxGmc7H5iEKyihIwS2XUoOgsYTx5CWCDM8CuOXTk+H5fPYp9APRPbkD1IS9I/vRmvNPwWsgv8/7DzttqdBsGxiZJfCw1uZ7KSVmbItgXPAcscNxGEMaHXyJzkAl/mlM5/t/YSejwYoSW6jFfQcLdaVx2dpIpl5UmmQjFedzKeiNqpZDCk4yzXFHX24XUODYMJDtIJK2Hz1KTZmFG+LAOJjB9QOI58hFAnytcKay+JWFrzah/IvoNZxJUtlYdxw0YEyKs/ExET7AXgYQN0S+8j2PfaMMpzDSctTqpp5XBFV4Mt718GiqVnQJtWQv2p9Xl8XXOerBthbzzAciVcB8AV2WfZ51W3e4aX4kcyT/sCJhm7NR5WrNG5mX/ns0TTnGnzlPYhJcbu8uMFjMGDpXuhVyroJ7wmZucaIvesg0h5Y9cMEFviqsdy15vjMzFh+v9uO9Vicf6n9Z9JGSpWKE8wer2JU5b53Zw0cTfulAAffLWXnzOnfu&6R/cGaqQeHVAzdJ9wTFOyCsrMSTtqcjLe8AHwiPckPDUwecnJyNlkDYwDQpxGYQ9hs6YxhupK310sbCbtXB4H6Dz5rGNL40nkkyo4j2clmRr08jtFsPQ0RpE5BGsulPT3l0MxyAvPFMs8bMybUyAP+9RB9LoHE3Xo8BqDadX3HQakpPfGtiDMp+wxkWRgaNpCnXeY1QewWTF6z/duLzbu6CT6s+H4HgBHrOLTpemC2PvP2bDm0ySPHLdpapLYxU8nIYjLKIyYJgwv9S9jNckIVpcGVTWVul7CauCKxAB2mMnM9jJi8zfFwKajT5d2d9XfpkiVMrdlmikSB/ehyX1wQ=="
+        expect_args = {
+            "method": "POST",
+            "uri": "/Telerik.Web.UI.WebResource.axd",
+            "query_string": "type=rau",
+            "data": vuln_data,
+        }
+        respond_args = {
+            "response_data": '{"fileInfo":{"FileName":"RAU_crypto.bypass","ContentType":"text/html","ContentLength":5,"DateJson":"2019-01-02T03:04:05.067Z","Index":0}, "metaData":"CS8S/Z0J/b2982DRxDin0BBslA7fI0cWMuWlPu4W3FkE4tKaVoIEiAOtVlJ6D+0RQsfu8ox6gvMYxceQ0LtWyTkQBaIUa8LgLQg05DMaQuufHNx0YQ2ACi5neqDBvduj2MGiSGC0hNKzSWsHystZGUfFPLTZuJXYnff+WXurecuRzSI7d4Q1aj0bcTKKvfyQtH+fsTEafWRRZ99X/xgi4ON2OsRZ738uQHw7pQT2e1v7AtN46mxO/BmhEuZQr6m6HEvxK0pJRNkBhFUiQ+poeu8j3JzicOjvPDwFE4Rjqf3RVILt83XZrju2VpRIJqAEtf//znhH8BhT5BWvhnRo+J3ML5qoZLa2joE/QK8Ctf3UPvAFkHIUMdOH2mLNgZ+U87tdVE6fYfzvphZsLxmJRG45H8ZTZuYhJbOfei2LQ4fqHmr7p8KpJNVqoz/ev1dnBclAf5ayb40qJKEVsGXIbWEbIZwg7TTsLFc29aP7DPg=" }'
+        }
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        # Simulate DialogHandler detection
+        expect_args = {"method": "GET", "uri": "Telerik.Web.UI.SpellCheckHandler.axd"}
+        respond_args = {"status": 500}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        # Simulate DialogHandler detection
+        expect_args = {"method": "GET", "uri": "/App_Master/Telerik.Web.UI.DialogHandler.aspx"}
+        respond_args = {
+            "response_data": 'Cannot deserialize dialog parameters. Please refresh the editor page. Error Message:Invalid length for a Base-64 char array or string.'
+        }
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        # Fallback
+        expect_args = {"uri": re.compile(r"^/\w{10}$")}
+        respond_args = {"status": 200}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+    def check(self, module_test, events):
+        telerik_axd_detection = False
+        telerik_axd_vulnerable = False
+        telerik_spellcheck_detection = False
+        telerik_dialoghandler_detection = False
+
+        for e in events:
+            if e.type == "FINDING" and "Telerik RAU AXD Handler detected" in e.data["description"]:
+                telerik_axd_detection = True
+                continue
+
+            if (
+                e.type == "VULNERABILITY"
+                and "Confirmed Vulnerable Telerik (version: 2014.3.1024)" in e.data["description"]
+            ):
+                telerik_axd_vulnerable = True
+                continue
+
+            if e.type == "FINDING" and "Telerik DialogHandler detected" in e.data["description"]:
+                telerik_dialoghandler_detection = True
+                continue
+
+            if e.type == "FINDING" and "Telerik SpellCheckHandler detected" in e.data["description"]:
+                telerik_spellcheck_detection = True
+                continue
+
+        assert telerik_axd_detection, "Telerik AXD detection failed"
+        assert telerik_axd_vulnerable, "Telerik vulnerable AXD detection failed"
+        assert telerik_spellcheck_detection, "Telerik spellcheck detection failed"
+        assert telerik_dialoghandler_detection, "Telerik dialoghandler detection failed"
diff --git a/bbot/test/test_step_1/module_tests/test_module_threatminer.py b/bbot/test/test_step_1/module_tests/test_module_threatminer.py
index e69de29bb2..71864f1b25 100644
--- a/bbot/test/test_step_1/module_tests/test_module_threatminer.py
+++ b/bbot/test/test_step_1/module_tests/test_module_threatminer.py
@@ -0,0 +1,12 @@
+from .base import ModuleTestBase
+
+
+class TestThreatminer(ModuleTestBase):
+    def setup_after_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url="https://api.threatminer.org/v2/domain.php?q=blacklanternsecurity.com&rt=5",
+            json={"results": ["asdf.blacklanternsecurity.com"]},
+        )
+
+    def check(self, module_test, events):
+        assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain"
diff --git a/bbot/test/test_step_1/module_tests/test_module_url_manipulation.py b/bbot/test/test_step_1/module_tests/test_module_url_manipulation.py
index e69de29bb2..8a197dbe7b 100644
--- a/bbot/test/test_step_1/module_tests/test_module_url_manipulation.py
+++ b/bbot/test/test_step_1/module_tests/test_module_url_manipulation.py
@@ -0,0 +1,39 @@
+from .base import ModuleTestBase
+
+
+class TestUrl_Manipulation(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    modules_overrides = ["httpx", "url_manipulation"]
+    body = """
+    <html>
+    <title>the title</title>
+    <body>
+    <p>Hello null!</p>';
+    </body>
+    </html>
+    """
+
+    body_match = """
+    <html>
+    <title>the title</title>
+    <body>
+    <p>Hello AAAAAAAAAAAAAA!</p>';
+    </body>
+    </html>
+    """
+
+    def setup_after_prep(self, module_test):
+        expect_args = {"query_string": f"{module_test.module.rand_string}=.xml".encode()}
+        respond_args = {"response_data": self.body_match}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        respond_args = {"response_data": self.body}
+        module_test.set_expect_requests(respond_args=respond_args)
+
+    def check(self, module_test, events):
+        assert any(
+            e.type == "FINDING"
+            and e.data["description"]
+            == f"Url Manipulation: [body] Sig: [Modified URL: http://127.0.0.1:8888/?{module_test.module.rand_string}=.xml]"
+            for e in events
+        )
diff --git a/bbot/test/test_step_1/module_tests/test_module_urlscan.py b/bbot/test/test_step_1/module_tests/test_module_urlscan.py
index e69de29bb2..51ec290fcf 100644
--- a/bbot/test/test_step_1/module_tests/test_module_urlscan.py
+++ b/bbot/test/test_step_1/module_tests/test_module_urlscan.py
@@ -0,0 +1,58 @@
+from .base import ModuleTestBase
+
+
+class TestUrlScan(ModuleTestBase):
+    config_overrides = {"modules": {"urlscan": {"urls": True}}}
+
+    def setup_after_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url="https://urlscan.io/api/v1/search/?q=blacklanternsecurity.com",
+            json={
+                "results": [
+                    {
+                        "task": {
+                            "visibility": "public",
+                            "method": "api",
+                            "domain": "asdf.blacklanternsecurity.com",
+                            "apexDomain": "blacklanternsecurity.com",
+                            "time": "2023-05-17T01:45:11.391Z",
+                            "uuid": "c558b3b3-b274-4339-99ef-301eb043741f",
+                            "url": "https://asdf.blacklanternsecurity.com/cna.html",
+                        },
+                        "stats": {
+                            "uniqIPs": 6,
+                            "uniqCountries": 3,
+                            "dataLength": 926713,
+                            "encodedDataLength": 332213,
+                            "requests": 22,
+                        },
+                        "page": {
+                            "country": "US",
+                            "server": "GitHub.com",
+                            "ip": "2606:50c0:8002::153",
+                            "mimeType": "text/html",
+                            "title": "Vulnerability Program | Black Lantern Security",
+                            "url": "https://asdf.blacklanternsecurity.com/cna.html",
+                            "tlsValidDays": 89,
+                            "tlsAgeDays": 25,
+                            "tlsValidFrom": "2023-04-21T19:16:58.000Z",
+                            "domain": "asdf.blacklanternsecurity.com",
+                            "apexDomain": "blacklanternsecurity.com",
+                            "asnname": "FASTLY, US",
+                            "asn": "AS54113",
+                            "tlsIssuer": "R3",
+                            "status": "200",
+                        },
+                        "_id": "c558b3b3-b274-4339-99ef-301eb043741f",
+                        "_score": None,
+                        "sort": [1684287911391, "c558b3b3-b274-4339-99ef-301eb043741f"],
+                        "result": "https://urlscan.io/api/v1/result/c558b3b3-b274-4339-99ef-301eb043741f/",
+                        "screenshot": "https://urlscan.io/screenshots/c558b3b3-b274-4339-99ef-301eb043741f.png",
+                    }
+                ]
+            },
+        )
+
+    def check(self, module_test, events):
+        assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain"
+        assert any(e.data == "https://asdf.blacklanternsecurity.com/cna.html" for e in events), "Failed to detect URL"
diff --git a/bbot/test/test_step_1/module_tests/test_module_viewdns.py b/bbot/test/test_step_1/module_tests/test_module_viewdns.py
index e69de29bb2..d40960e483 100644
--- a/bbot/test/test_step_1/module_tests/test_module_viewdns.py
+++ b/bbot/test/test_step_1/module_tests/test_module_viewdns.py
@@ -0,0 +1,333 @@
+from .base import ModuleTestBase
+
+
+class TestViewDNS(ModuleTestBase):
+    def setup_after_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url="https://viewdns.info/reversewhois/?q=blacklanternsecurity.com",
+            text=web_body,
+        )
+
+    def check(self, module_test, events):
+        assert any(
+            e.data == "hyperloop.com" and "affiliate" in e.tags for e in events
+        ), "Failed to detect affiliate domain"
+
+
+web_body = """
+<html>
+<head>
+<title>Reverse Whois Lookup - ViewDNS.info</title>
+</head>
+<body>
+<h2>ViewDNS.info - Your one source for DNS related tools!</h2>
+<p>ViewDNS.info > Tools ></p>
+<h1>Reverse Whois Lookup</h1>
+<p>This free tool will allow you to find domain names owned by an individual person or company. Simply enter the email address or name of the person or company to find other domains registered using those same details. FAQ.</p>
+<p>Registrant Name or Email Address:</p>
+<p>Reverse Whois results for blacklanternsecurity.com<br>
+==============<br>
+There are 20 domains that matched this search query.<br>
+These are listed below:</p>
+<table border="1">
+<tr><td>Domain Name</td><td>Creation Date</td><td>Registrar</td></tr>
+<tr><td>hyperloop.com</td><td>2003-12-04</td><td>NETWORK SOLUTIONS, LLC.</td></tr>
+</table>
+<p>All content © 2023 ViewDNS.info<br>
+Feedback / Suggestions / Contact Us - Privacy Policy</p>
+</body>
+</html>
+ + +""" diff --git a/bbot/test/test_step_1/module_tests/test_module_virustotal.py b/bbot/test/test_step_1/module_tests/test_module_virustotal.py index e69de29bb2..88663bdfaa 100644 --- a/bbot/test/test_step_1/module_tests/test_module_virustotal.py +++ b/bbot/test/test_step_1/module_tests/test_module_virustotal.py @@ -0,0 +1,51 @@ +from .base import ModuleTestBase + + +class TestVirusTotal(ModuleTestBase): + config_overrides = {"modules": {"virustotal": {"api_key": "asdf"}}} + + def setup_before_prep(self, module_test): + module_test.httpx_mock.add_response( + url="https://www.virustotal.com/api/v3/domains/blacklanternsecurity.com/subdomains", + json={ + "meta": {"count": 25, "cursor": "eyJsaW1pdCI6IDEwLCAib2Zmc2V0IjogMTB9"}, + "data": [ + { + "attributes": { + "last_dns_records": [{"type": "A", "value": "168.62.180.225", "ttl": 3600}], + "whois": "Creation Date: 2013-07-30T20:14:50Z\nDNSSEC: unsigned\nDomain Name: BLACKLANTERNSECURITY.COM\nDomain Status: clientDeleteProhibited https://icann.org/epp#clientDeleteProhibited\nDomain Status: clientRenewProhibited https://icann.org/epp#clientRenewProhibited\nDomain Status: clientTransferProhibited https://icann.org/epp#clientTransferProhibited\nDomain Status: clientUpdateProhibited https://icann.org/epp#clientUpdateProhibited\nName Server: NS01.DOMAINCONTROL.COM\nName Server: NS02.DOMAINCONTROL.COM\nRegistrar Abuse Contact Email: abuse@godaddy.com\nRegistrar Abuse Contact Phone: 480-624-2505\nRegistrar IANA ID: 146\nRegistrar URL: http://www.godaddy.com\nRegistrar WHOIS Server: whois.godaddy.com\nRegistrar: GoDaddy.com, LLC\nRegistry Domain ID: 1818679075_DOMAIN_COM-VRSN\nRegistry Expiry Date: 2023-07-30T20:14:50Z\nUpdated Date: 2022-09-14T16:28:14Z", + "tags": [], + "popularity_ranks": {}, + "last_dns_records_date": 1657734301, + "last_analysis_stats": { + "harmless": 0, + "malicious": 0, + "suspicious": 0, + "undetected": 86, + "timeout": 0, + }, + "creation_date": 1375215290, + "reputation": 0, + "registrar": "GoDaddy.com, LLC", + "last_analysis_results": {}, + "last_update_date": 1663172894, + "last_modification_date": 1657734301, + "tld": "com", + "categories": {}, + "total_votes": {"harmless": 0, "malicious": 0}, + }, + "type": "domain", + "id": "asdf.blacklanternsecurity.com", + "links": {"self": "https://www.virustotal.com/api/v3/domains/asdf.blacklanternsecurity.com"}, + "context_attributes": {"timestamp": 1657734301}, + } + ], + "links": { + "self": "https://www.virustotal.com/api/v3/domains/blacklanternsecurity.com/subdomains?limit=10", + "next": "https://www.virustotal.com/api/v3/domains/blacklanternsecurity.com/subdomains?cursor=eyJsaW1pdCI6IDEwLCAib2Zmc2V0IjogMTB9&limit=10", + }, + }, + ) + + def check(self, module_test, events): + assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain" diff --git a/bbot/test/test_step_1/module_tests/test_module_wafw00f.py b/bbot/test/test_step_1/module_tests/test_module_wafw00f.py index e69de29bb2..2b69c8b894 100644 --- a/bbot/test/test_step_1/module_tests/test_module_wafw00f.py +++ b/bbot/test/test_step_1/module_tests/test_module_wafw00f.py @@ -0,0 +1,14 @@ +from .base import ModuleTestBase + + +class TestWafw00f(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + modules_overrides = ["httpx", "wafw00f"] + + def setup_after_prep(self, module_test): + expect_args = {"method": "GET", "uri": "/"} + respond_args = {"response_data": "Proudly powered by litespeed web server"} + module_test.set_expect_requests(expect_args=expect_args, 
+
+    def check(self, module_test, events):
+        assert any(e.type == "WAF" and "LiteSpeed" in e.data["WAF"] for e in events)
diff --git a/bbot/test/test_step_1/module_tests/test_module_wappalyzer.py b/bbot/test/test_step_1/module_tests/test_module_wappalyzer.py
index e69de29bb2..47e456b860 100644
--- a/bbot/test/test_step_1/module_tests/test_module_wappalyzer.py
+++ b/bbot/test/test_step_1/module_tests/test_module_wappalyzer.py
@@ -0,0 +1,20 @@
+from .base import ModuleTestBase
+
+
+class TestWappalyzer(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    modules_overrides = ["httpx", "wappalyzer"]
+
+    def setup_after_prep(self, module_test):
+        respond_args = {
+            "response_data": """<html><title>BBOT is life</title>
+<link rel="stylesheet" href="https://fonts.googleapis.com/css?family=Open+Sans">
+<body>
+</body>
+</html>""",
+            "headers": {"Server": "Apache/2.4.41 (Ubuntu)"},
+        }
+        module_test.set_expect_requests(respond_args=respond_args)
+
+    def check(self, module_test, events):
+        assert any(e.type == "TECHNOLOGY" and e.data["technology"].lower() == "google font api" for e in events)

From 6fdb598e2e6bcfbb7d3c47106f7c98a4d6aa2908 Mon Sep 17 00:00:00 2001
From: TheTechromancer
Date: Mon, 22 May 2023 01:20:26 -0400
Subject: [PATCH 037/387] removed services test

---
 bbot/test/test_step_1/module_tests/test_module_services.py | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 delete mode 100644 bbot/test/test_step_1/module_tests/test_module_services.py

diff --git a/bbot/test/test_step_1/module_tests/test_module_services.py b/bbot/test/test_step_1/module_tests/test_module_services.py
deleted file mode 100644
index e69de29bb2..0000000000

From b8000f4ffccced1fca4518e3de16fb5f1ec0e777 Mon Sep 17 00:00:00 2001
From: TheTechromancer
Date: Mon, 22 May 2023 12:53:46 -0400
Subject: [PATCH 038/387] more module tests!

---
 bbot/modules/bucket_gcp.py                    |  1 -
 bbot/modules/builtwith.py                     |  1 -
 bbot/modules/emailformat.py                   |  1 -
 bbot/modules/leakix.py                        |  1 -
 bbot/modules/output/web_report.py             |  7 +-
 bbot/modules/skymem.py                        |  1 -
 bbot/modules/smuggler.py                      |  6 +-
 bbot/modules/wayback.py                       | 18 ++---
 bbot/modules/zoomeye.py                       | 35 ++++++----
 bbot/test/conftest.py                         |  4 +-
 bbot/test/test_step_1/module_tests/base.py    | 10 ---
 .../module_tests/test_module_aggregate.py     |  1 -
 .../module_tests/test_module_dnscommonsrv.py  | 13 ++--
 .../test_module_dnszonetransfer.py            |  2 +-
 .../module_tests/test_module_generic_ssrf.py  |  5 +-
 .../module_tests/test_module_host_header.py   |  5 +-
 .../module_tests/test_module_ipneighbor.py    | 23 ++++---
 .../module_tests/test_module_smuggler.py      |  9 +++
 .../test_module_subdomain_hijack.py           |  1 -
 .../module_tests/test_module_vhost.py         | 65 +++++++++++++++++++
 .../module_tests/test_module_wayback.py       | 12 ++++
 .../module_tests/test_module_web_report.py    | 65 +++++++++++++++++++
 .../module_tests/test_module_websocket.py     | 35 ++++++++++
 .../module_tests/test_module_zoomeye.py       | 36 ++++++++++
 24 files changed, 296 insertions(+), 61 deletions(-)

diff --git a/bbot/modules/bucket_gcp.py b/bbot/modules/bucket_gcp.py
index d4ac880a9c..b7e96d5b1d 100644
--- a/bbot/modules/bucket_gcp.py
+++ b/bbot/modules/bucket_gcp.py
@@ -50,5 +50,4 @@ async def check_bucket_exists(self, bucket_name, url):
         response = await self.helpers.request(url)
         status_code = getattr(response, "status_code", 0)
         existent_bucket = status_code not in (0, 400, 404)
-        self.critical(f"{bucket_name}: {url}: {existent_bucket}")
         return existent_bucket, set(), bucket_name, url
diff --git a/bbot/modules/builtwith.py b/bbot/modules/builtwith.py
index 6fabcd2833..6c5a305c1a 100644
--- a/bbot/modules/builtwith.py
+++ b/bbot/modules/builtwith.py
@@ -61,7 +61,6 @@ def parse_domains(self, r, query):
             query (string): The query used against the API
         """
         results_set = set()
-        self.critical(r.content)
         json = r.json()
         if json:
             results = json.get("Results", [])
diff --git a/bbot/modules/emailformat.py b/bbot/modules/emailformat.py
index f28e19f9d9..82b5797445 100644
--- a/bbot/modules/emailformat.py
+++ b/bbot/modules/emailformat.py
@@ -14,7 +14,6 @@ async def handle_event(self, event):
         _, query = self.helpers.split_domain(event.data)
         url = f"{self.base_url}/d/{self.helpers.quote(query)}/"
         r = await self.request_with_fail_count(url)
-        self.hugesuccess(r.content)
         if not r:
             return
         for email in self.helpers.extract_emails(r.text):
diff --git a/bbot/modules/leakix.py b/bbot/modules/leakix.py
index 6622242e83..4ebf895703 100644
--- a/bbot/modules/leakix.py
+++ b/bbot/modules/leakix.py
@@ -31,7 +31,6 @@ async def ping(self):
 
     async def request_url(self, query):
         url = f"{self.base_url}/api/subdomains/{self.helpers.quote(query)}"
         response = await self.request_with_fail_count(url, headers=self.headers)
-        self.hugewarning(response.json())
         return response
 
     def parse_results(self, r, query=None):
diff --git a/bbot/modules/output/web_report.py b/bbot/modules/output/web_report.py
index da973a6e38..793f26c329 100644
--- a/bbot/modules/output/web_report.py
+++ b/bbot/modules/output/web_report.py
@@ -32,7 +32,7 @@ async def setup(self):
         self._prep_output_dir("web_report.html")
         return True
 
-    def handle_event(self, event):
+    async def handle_event(self, event):
         if event.type == "URL":
             parsed = event.parsed
             host = f"{parsed.scheme}://{parsed.netloc}/"
@@ -74,7 +74,7 @@ def handle_event(self, event):
         else:
             self.web_assets[host][event.type].append(html.escape(event.pretty_string))
 
-    def report(self):
+    async def report(self):
         for host in self.web_assets.keys():
             self.markdown += f"# {host}\n\n"
@@ -93,5 +93,4 @@ def report(self):
         self.file.write(markdown.markdown(self.markdown))
         self.file.write(self.html_footer)
         self.file.flush()
-        with self._report_lock:
-            self.info(f"Web Report saved to {self.output_file}")
+        self.info(f"Web Report saved to {self.output_file}")
diff --git a/bbot/modules/skymem.py b/bbot/modules/skymem.py
index 56f5e39f65..71d0e883e7 100644
--- a/bbot/modules/skymem.py
+++ b/bbot/modules/skymem.py
@@ -33,7 +33,6 @@ async def handle_event(self, event):
             for email in self.helpers.extract_emails(r2.text):
                 self.emit_event(email, "EMAIL_ADDRESS", source=event)
             pages = re.findall(r"/domain/" + domain_id + r"\?p=(\d+)", r2.text)
-            self.critical(pages)
             if not pages:
                 break
             last_page = max([int(p) for p in pages])
diff --git a/bbot/modules/smuggler.py b/bbot/modules/smuggler.py
index 7284ccec60..f478a63641 100644
--- a/bbot/modules/smuggler.py
+++ b/bbot/modules/smuggler.py
@@ -23,11 +23,11 @@ class smuggler(BaseModule):
         }
     ]
 
-    def setup(self):
+    async def setup(self):
         self.scanned_hosts = set()
         return True
 
-    def handle_event(self, event):
+    async def handle_event(self, event):
         host = f"{event.parsed.scheme}://{event.parsed.netloc}/"
         host_hash = hash(host)
         if host_hash in self.scanned_hosts:
@@ -44,7 +44,7 @@ def handle_event(self, event):
             "-u",
             event.data,
         ]
-        for f in self.helpers.run_live(command):
+        async for f in self.helpers.run_live(command):
             if "Issue Found" in f:
                 technique = f.split(":")[0].rstrip()
                 text = f.split(":")[1].split("-")[0].strip()
diff --git a/bbot/modules/wayback.py b/bbot/modules/wayback.py
index 6ce7751526..133dc27e7b 100644
--- a/bbot/modules/wayback.py
+++ b/bbot/modules/wayback.py
@@ -17,19 +17,20 @@ class wayback(crobat):
 
     base_url = "http://web.archive.org"
"http://web.archive.org" - def setup(self): + async def setup(self): self.urls = self.config.get("urls", False) self.garbage_threshold = self.config.get("garbage_threshold", 10) - return super().setup() + return await super().setup() - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - for result, event_type in self.query(query): + for result, event_type in await self.query(query): self.emit_event(result, event_type, event, abort_if=self.abort_if) - def query(self, query): + async def query(self, query): + results = set() waybackurl = f"{self.base_url}/cdx/search/cdx?url={self.helpers.quote(query)}&matchType=domain&output=json&fl=original&collapse=original" - r = self.helpers.request(waybackurl, timeout=self.http_timeout + 10) + r = await self.helpers.request(waybackurl, timeout=self.http_timeout + 10) if not r: self.warning(f'Error connecting to archive.org for query "{query}"') return @@ -55,6 +56,7 @@ def query(self, query): h = hash(dns_name) if h not in dns_names: dns_names.add(h) - yield dns_name, "DNS_NAME" + results.add((dns_name, "DNS_NAME")) else: - yield parsed_url.geturl(), "URL_UNVERIFIED" + results.add((parsed_url.geturl(), "URL_UNVERIFIED")) + return results diff --git a/bbot/modules/zoomeye.py b/bbot/modules/zoomeye.py index 5ebfad9fef..83f9bd641f 100644 --- a/bbot/modules/zoomeye.py +++ b/bbot/modules/zoomeye.py @@ -15,19 +15,20 @@ class zoomeye(shodan_dns): base_url = "https://api.zoomeye.org" - def setup(self): + async def setup(self): self.max_pages = self.config.get("max_pages", 20) self.headers = {"API-KEY": self.config.get("api_key", "")} self.include_related = self.config.get("include_related", False) - return super().setup() + return await super().setup() - def ping(self): - r = self.helpers.request(f"{self.base_url}/resources-info", headers=self.headers) + async def ping(self): + url = f"{self.base_url}/resources-info" + r = await self.helpers.request(url, headers=self.headers) assert int(r.json()["quota_info"]["remain_total_quota"]) > 0, "No quota remaining" - def handle_event(self, event): + async def handle_event(self, event): query = self.make_query(event) - results = self.query(query) + results = await self.query(query) if results: for hostname in results: if hostname == event: @@ -37,15 +38,23 @@ def handle_event(self, event): tags = ["affiliate"] self.emit_event(hostname, "DNS_NAME", event, tags=tags) - def query(self, query): + async def query(self, query): + results = set() query_type = 0 if self.include_related else 1 url = f"{self.base_url}/domain/search?q={self.helpers.quote(query)}&type={query_type}&page=" + "{page}" - for i, j in enumerate(self.helpers.api_page_iter(url, headers=self.headers)): - results = list(self.parse_results(j)) - if results: - yield from results - if not results or i >= (self.max_pages - 1) or self.scan.stopping: - break + i = 0 + agen = self.helpers.api_page_iter(url, headers=self.headers) + try: + async for j in agen: + r = list(self.parse_results(j)) + if r: + results.update(set(r)) + if not r or i >= (self.max_pages - 1): + break + i += 1 + finally: + agen.aclose() + return results def parse_results(self, r): for entry in r.get("list", []): diff --git a/bbot/test/conftest.py b/bbot/test/conftest.py index 0aca0ff1bd..e2495e3221 100644 --- a/bbot/test/conftest.py +++ b/bbot/test/conftest.py @@ -3,6 +3,8 @@ import logging from pytest_httpserver import HTTPServer +from bbot.core.helpers.interactsh import server_list as interactsh_servers + @pytest.hookimpl(tryfirst=True, 
 def pytest_sessionfinish(session, exitstatus):
@@ -21,7 +23,7 @@ def pytest_sessionfinish(session, exitstatus):
 
 @pytest.fixture
 def non_mocked_hosts() -> list:
-    return ["127.0.0.1"]
+    return ["127.0.0.1"] + interactsh_servers
 
 
 @pytest.fixture
diff --git a/bbot/test/test_step_1/module_tests/base.py b/bbot/test/test_step_1/module_tests/base.py
index 41294b2c6c..99a069a395 100644
--- a/bbot/test/test_step_1/module_tests/base.py
+++ b/bbot/test/test_step_1/module_tests/base.py
@@ -39,16 +39,6 @@ def to_text(self):
         return str(self)
 
 
-class TestClass:
-    @pytest_asyncio.fixture
-    async def my_fixture(self, bbot_httpserver):
-        yield bbot_httpserver
-
-    @pytest.mark.asyncio
-    async def test_asdf(self, my_fixture):
-        log.critical(my_fixture)
-
-
 class ModuleTestBase:
     targets = ["blacklanternsecurity.com"]
     scan_name = None
diff --git a/bbot/test/test_step_1/module_tests/test_module_aggregate.py b/bbot/test/test_step_1/module_tests/test_module_aggregate.py
index b3d72c57e9..1049fb2a22 100644
--- a/bbot/test/test_step_1/module_tests/test_module_aggregate.py
+++ b/bbot/test/test_step_1/module_tests/test_module_aggregate.py
@@ -5,7 +5,6 @@ class TestAggregate(ModuleTestBase):
     config_overrides = {"dns_resolution": True}
 
     def check(self, module_test, events):
-        module_test.log.critical(events)
         filename = next(module_test.scan.home.glob("scan-stats-table*.txt"))
         with open(filename) as f:
            assert "| A " in f.read()
diff --git a/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py b/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py
index 4b2617a6bb..a77630ecd9 100644
--- a/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py
+++ b/bbot/test/test_step_1/module_tests/test_module_dnscommonsrv.py
@@ -2,18 +2,23 @@
 
 
 class TestDNSCommonSRV(ModuleTestBase):
+    targets = ["blacklanternsecurity.notreal"]
+
     def setup_after_prep(self, module_test):
         old_resolve_fn = module_test.scan.helpers.dns.resolve
 
         async def resolve(query, **kwargs):
-            if query == "_ldap._tcp.gc._msdcs.blacklanternsecurity.com" and kwargs.get("type", "").upper() == "SRV":
-                return {"asdf.blacklanternsecurity.com"}
+            if (
+                query == "_ldap._tcp.gc._msdcs.blacklanternsecurity.notreal"
+                and kwargs.get("type", "").upper() == "SRV"
+            ):
+                return {"asdf.blacklanternsecurity.notreal"}
             return await old_resolve_fn(query, **kwargs)
 
         module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "resolve", resolve)
 
     def check(self, module_test, events):
         assert any(
-            e.data == "_ldap._tcp.gc._msdcs.blacklanternsecurity.com" for e in events
+            e.data == "_ldap._tcp.gc._msdcs.blacklanternsecurity.notreal" for e in events
         ), "Failed to detect subdomain"
-        assert not any(e.data == "_ldap._tcp.dc._msdcs.blacklanternsecurity.com" for e in events), "False positive"
+        assert not any(e.data == "_ldap._tcp.dc._msdcs.blacklanternsecurity.notreal" for e in events), "False positive"
diff --git a/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py b/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py
index 40f450a974..212fce0d6b 100644
--- a/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py
+++ b/bbot/test/test_step_1/module_tests/test_module_dnszonetransfer.py
@@ -15,7 +15,7 @@ def setup_after_prep(self, module_test):
         async def _resolve_hostname(query, **kwargs):
             if query == "blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() == "NS":
                 return [module_test.mock_record("ns01.blacklanternsecurity.fakedomain", "NS")], []
-            if query == "ns01.blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() in "A":
and kwargs.get("rdtype", "").upper() in "A": + if query == "ns01.blacklanternsecurity.fakedomain" and kwargs.get("rdtype", "").upper() == "A": return [module_test.mock_record("127.0.0.1", "A")], [] return await old_resolve_fn(query, **kwargs) diff --git a/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py b/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py index 2d9cb1a7ae..9e5ed6264b 100644 --- a/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py +++ b/bbot/test/test_step_1/module_tests/test_module_generic_ssrf.py @@ -2,5 +2,8 @@ class TestGeneric_SSRF(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + # PAUL TODO - pass + def check(self, module_test, events): + pass diff --git a/bbot/test/test_step_1/module_tests/test_module_host_header.py b/bbot/test/test_step_1/module_tests/test_module_host_header.py index 75f24378e7..43d6bc6a0d 100644 --- a/bbot/test/test_step_1/module_tests/test_module_host_header.py +++ b/bbot/test/test_step_1/module_tests/test_module_host_header.py @@ -2,5 +2,8 @@ class TestHost_Header(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + # PAUL TODO - pass + def check(self, module_test, events): + pass diff --git a/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py b/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py index 6463c2cfaf..be3e234e29 100644 --- a/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py +++ b/bbot/test/test_step_1/module_tests/test_module_ipneighbor.py @@ -3,18 +3,25 @@ class TestIPNeighbor(ModuleTestBase): targets = ["127.0.0.15", "www.bls.notreal"] - config_overrides = {"scope_report_distance": 1, "dns_resolution": True} + config_overrides = {"scope_report_distance": 1, "dns_resolution": True, "scope_dns_search_distance": 2} def setup_after_prep(self, module_test): - old_resolve_fn = module_test.scan.helpers.dns.resolve + old_resolve_ip = module_test.scan.helpers.dns._resolve_ip + old_resolve_hostname = module_test.scan.helpers.dns._resolve_hostname - async def resolve(query, **kwargs): - module_test.log.critical(f"{query}: {kwargs}") - if query == "127.0.0.3" and kwargs.get("type", "").upper() == "PTR": - return {"www.bls.notreal"} - return await old_resolve_fn(query, **kwargs) + async def _resolve_ip(query, **kwargs): + if query == "127.0.0.3": + return [module_test.mock_record("asdf.www.bls.notreal", "PTR")], [] + return await old_resolve_ip(query, **kwargs) - module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "resolve", resolve) + async def _resolve_hostname(query, **kwargs): + if query == "asdf.www.bls.notreal" and kwargs.get("rdtype", "") == "A": + return [module_test.mock_record("127.0.0.3", "A")], [] + return await old_resolve_hostname(query, **kwargs) + + module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "_resolve_ip", _resolve_ip) + module_test.monkeypatch.setattr(module_test.scan.helpers.dns, "_resolve_hostname", _resolve_hostname) def check(self, module_test, events): assert any(e.data == "127.0.0.3" for e in events) + assert not any(e.data == "127.0.0.4" for e in events) diff --git a/bbot/test/test_step_1/module_tests/test_module_smuggler.py b/bbot/test/test_step_1/module_tests/test_module_smuggler.py index e69de29bb2..955fcffde4 100644 --- a/bbot/test/test_step_1/module_tests/test_module_smuggler.py +++ b/bbot/test/test_step_1/module_tests/test_module_smuggler.py @@ -0,0 +1,9 @@ +from .base import ModuleTestBase + + +class TestSmuggler(ModuleTestBase): + targets = ["http://127.0.0.1:8888"] + + # PAUL TODO + def check(self, 
+        pass
diff --git a/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py b/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py
index c0c1006279..7349fb187c 100644
--- a/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py
+++ b/bbot/test/test_step_1/module_tests/test_module_subdomain_hijack.py
@@ -30,7 +30,6 @@ def setup_after_prep(self, module_test):
         fingerprint = next(iter(fingerprints))
         rand_string = module_test.scan.helpers.rand_string(length=15, digits=False)
         self.rand_subdomain = f"{rand_string}.{next(iter(fingerprint.domains))}"
-        module_test.log.critical(self.rand_subdomain)
         respond_args = {"response_data": f'<a href="https://{self.rand_subdomain}"/>'}
         module_test.set_expect_requests(respond_args=respond_args)
 
diff --git a/bbot/test/test_step_1/module_tests/test_module_vhost.py b/bbot/test/test_step_1/module_tests/test_module_vhost.py
index e69de29bb2..bfd8037196 100644
--- a/bbot/test/test_step_1/module_tests/test_module_vhost.py
+++ b/bbot/test/test_step_1/module_tests/test_module_vhost.py
@@ -0,0 +1,65 @@
+from .base import ModuleTestBase, tempwordlist
+
+
+class TestVhost(ModuleTestBase):
+    targets = ["http://localhost:8888", "secret.localhost"]
+    modules_overrides = ["httpx", "vhost"]
+    test_wordlist = ["11111111", "admin", "cloud", "junkword1", "zzzjunkword2"]
+    config_overrides = {
+        "modules": {
+            "vhost": {
+                "wordlist": tempwordlist(test_wordlist),
+            }
+        }
+    }
+
+    def setup_after_prep(self, module_test):
+        expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "admin.localhost:8888"}}
+        respond_args = {"response_data": "Alive vhost admin"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "cloud.localhost:8888"}}
+        respond_args = {"response_data": "Alive vhost cloud"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "q-cloud.localhost:8888"}}
+        respond_args = {"response_data": "Alive vhost q-cloud"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "secret.localhost:8888"}}
+        respond_args = {"response_data": "Alive vhost secret"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/", "headers": {"Host": "host.docker.internal"}}
+        respond_args = {"response_data": "Alive vhost host.docker.internal"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+        expect_args = {"method": "GET", "uri": "/"}
+        respond_args = {"response_data": "alive"}
+        module_test.set_expect_requests(expect_args=expect_args, respond_args=respond_args)
+
+    def check(self, module_test, events):
+        basic_detection = False
+        mutation_of_detected = False
+        basehost_mutation = False
+        special_vhost_list = False
+        wordcloud_detection = False
+
+        for e in events:
+            if e.type == "VHOST":
+                if e.data["vhost"] == "admin":
+                    basic_detection = True
+                if e.data["vhost"] == "cloud":
+                    mutation_of_detected = True
+                if e.data["vhost"] == "q-cloud":
+                    basehost_mutation = True
+                if e.data["vhost"] == "host.docker.internal":
+                    special_vhost_list = True
+                if e.data["vhost"] == "secret":
+                    wordcloud_detection = True
+
+        assert basic_detection
+        assert mutation_of_detected
+        assert basehost_mutation
+        assert special_vhost_list
+        assert wordcloud_detection
diff --git a/bbot/test/test_step_1/module_tests/test_module_wayback.py b/bbot/test/test_step_1/module_tests/test_module_wayback.py
index e69de29bb2..3395e0052a 100644
--- a/bbot/test/test_step_1/module_tests/test_module_wayback.py
+++ b/bbot/test/test_step_1/module_tests/test_module_wayback.py
@@ -0,0 +1,12 @@
+from .base import ModuleTestBase
+
+
+class TestWayback(ModuleTestBase):
+    def setup_after_prep(self, module_test):
+        module_test.httpx_mock.add_response(
+            url=f"http://web.archive.org/cdx/search/cdx?url=blacklanternsecurity.com&matchType=domain&output=json&fl=original&collapse=original",
+            json=[["original"], ["http://asdf.blacklanternsecurity.com"]],
+        )
+
+    def check(self, module_test, events):
+        assert any(e.data == "asdf.blacklanternsecurity.com" for e in events), "Failed to detect subdomain"
diff --git a/bbot/test/test_step_1/module_tests/test_module_web_report.py b/bbot/test/test_step_1/module_tests/test_module_web_report.py
index e69de29bb2..14b911c19f 100644
--- a/bbot/test/test_step_1/module_tests/test_module_web_report.py
+++ b/bbot/test/test_step_1/module_tests/test_module_web_report.py
@@ -0,0 +1,65 @@
+from .base import ModuleTestBase
+
+
+class TestWebReport(ModuleTestBase):
+    targets = ["http://127.0.0.1:8888"]
+    modules_overrides = ["httpx", "wappalyzer", "badsecrets", "web_report", "secretsdb"]
+
+    def setup_before_prep(self, module_test):
+        # secretsdb --> FINDING
+        module_test.httpx_mock.add_response(
+            url="https://raw.githubusercontent.com/blacklanternsecurity/secrets-patterns-db/master/db/rules-stable.yml",
+            text="""patterns:
+- pattern:
+    confidence: 99
+    name: Asymmetric Private Key
+    regex: '-----BEGIN ((EC|PGP|DSA|RSA|OPENSSH) )?PRIVATE KEY( BLOCK)?-----'""",
+        )
+        # wappalyzer --> TECHNOLOGY
+        # badsecrets --> VULNERABILITY
+        respond_args = {"response_data": web_body}
+        module_test.set_expect_requests(respond_args=respond_args)
+        module_test.httpx_mock.assert_all_responses_were_requested = False
+
+    def check(self, module_test, events):
+        report_file = module_test.scan.home / "web_report.html"
+        with open(report_file) as f:
+            report_content = f.read()
+        assert "• [HIGH] Known Secret Found" in report_content
+        assert (
+            """

    URL

    +