mirror of
https://github.com/zeek/zeek.git
synced 2025-10-02 14:48:21 +00:00
Merge 7e638a41f2
into 0700427bac
This commit is contained in:
commit
372b70a8ca
1077 changed files with 169219 additions and 29 deletions
24
.github/workflows/generate-docs.yml
vendored
24
.github/workflows/generate-docs.yml
vendored
|
@ -34,15 +34,6 @@ jobs:
|
|||
with:
|
||||
submodules: "recursive"
|
||||
|
||||
# Only reset the submodule pointer for scheduled builds. The reason to do
|
||||
# this is to pick up any merge commits or anything that may have been
|
||||
# missed in a merge, but not have any actual content. We don't want to do
|
||||
# it otherwise because PRs should just use the submodule they're pointing
|
||||
# at.
|
||||
- name: Switch doc submodule to master
|
||||
if: github.event_name == 'schedule'
|
||||
run: cd doc && git checkout master
|
||||
|
||||
- name: Fetch Dependencies
|
||||
run: |
|
||||
sudo apt-get update
|
||||
|
@ -119,9 +110,6 @@ jobs:
|
|||
|
||||
cd doc
|
||||
|
||||
echo "*** Running pre-commit ***"
|
||||
pre-commit run -a --show-diff-on-failure --color=always
|
||||
|
||||
echo "*** Generating Sphinx Docs ***"
|
||||
make > make.out 2>&1
|
||||
make_status=$?
|
||||
|
@ -132,7 +120,7 @@ jobs:
|
|||
grep -q WARNING make.out && exit 1
|
||||
rm make.out
|
||||
|
||||
- name: Push zeek-docs Changes
|
||||
- name: Push docs Changes
|
||||
if: github.event_name == 'schedule'
|
||||
run: |
|
||||
cd doc
|
||||
|
@ -142,16 +130,6 @@ jobs:
|
|||
# with a check that detects whether there's anything staged.
|
||||
git diff-index --cached --quiet HEAD || { git commit -m "Generate docs" && git push; }
|
||||
|
||||
- name: Update zeek-docs Submodule
|
||||
if: github.event_name == 'schedule'
|
||||
run: |
|
||||
git config --global user.name zeek-bot
|
||||
git config --global user.email info@zeek.org
|
||||
git add doc
|
||||
git status
|
||||
# Similar logic here: proceed only if there's a change in the submodule.
|
||||
git diff-index --cached --quiet HEAD || { git commit -m 'Update doc submodule [nomail] [skip ci]' && git push; }
|
||||
|
||||
- name: Send email
|
||||
# Only send notifications for scheduled runs. Runs from pull requests
|
||||
# show failures in the GitHub UI.
|
||||
|
|
3
.gitignore
vendored
3
.gitignore
vendored
|
@ -3,6 +3,9 @@
|
|||
build*
|
||||
!ci/windows/build.cmd
|
||||
|
||||
# Don't ignore things in the docs directory
|
||||
!doc/**
|
||||
|
||||
tmp
|
||||
*.gcov
|
||||
|
||||
|
|
3
.gitmodules
vendored
3
.gitmodules
vendored
|
@ -16,9 +16,6 @@
|
|||
[submodule "auxil/netcontrol-connectors"]
|
||||
path = auxil/netcontrol-connectors
|
||||
url = https://github.com/zeek/zeek-netcontrol
|
||||
[submodule "doc"]
|
||||
path = doc
|
||||
url = https://github.com/zeek/zeek-docs
|
||||
[submodule "auxil/paraglob"]
|
||||
path = auxil/paraglob
|
||||
url = https://github.com/zeek/paraglob
|
||||
|
|
|
@ -10,7 +10,7 @@ repos:
|
|||
language: python
|
||||
files: '\.(h|c|cpp|cc|spicy|evt)$'
|
||||
types: [file]
|
||||
exclude: '^(testing/btest/(Baseline|plugins|spicy|scripts)/.*|testing/builtin-plugins/.*|src/3rdparty/.*)$'
|
||||
exclude: '^(testing/btest/(Baseline|plugins|spicy|scripts)/.*|testing/builtin-plugins/.*|src/3rdparty/.*|doc/.*)$'
|
||||
|
||||
- id: btest-command-commented
|
||||
name: Check that all BTest command lines are commented out
|
||||
|
@ -56,4 +56,4 @@ repos:
|
|||
rev: v0.26.0
|
||||
hooks:
|
||||
- id: spicy-format
|
||||
exclude: '^testing/.*'
|
||||
exclude: '^(testing/.*|doc/devel/spicy/autogen/.*)'
|
||||
|
|
16
.readthedocs.yml
Normal file
16
.readthedocs.yml
Normal file
|
@ -0,0 +1,16 @@
|
|||
version: 2
|
||||
|
||||
formats:
|
||||
- htmlzip
|
||||
|
||||
build:
|
||||
os: ubuntu-24.04
|
||||
tools:
|
||||
python: "3.13"
|
||||
|
||||
python:
|
||||
install:
|
||||
- requirements: doc/requirements.txt
|
||||
|
||||
sphinx:
|
||||
configuration: doc/conf.py
|
1
doc
1
doc
|
@ -1 +0,0 @@
|
|||
Subproject commit 2731def9159247e6da8a3191783c89683363689c
|
2
doc/.gitignore
vendored
Normal file
2
doc/.gitignore
vendored
Normal file
|
@ -0,0 +1,2 @@
|
|||
build
|
||||
*.pyc
|
66
doc/.typos.toml
Normal file
66
doc/.typos.toml
Normal file
|
@ -0,0 +1,66 @@
|
|||
[default]
|
||||
extend-ignore-re = [
|
||||
# seh too close to she
|
||||
"registered SEH to support IDL",
|
||||
# ALLO is a valid FTP command
|
||||
"\"ALLO\".*[0-9]{3}",
|
||||
"des-ede3-cbc-Env-OID",
|
||||
# On purpose
|
||||
"\"THE NETBIOS NAM\"",
|
||||
# NFS stuff.
|
||||
"commited :zeek:type:`NFS3::stable_how_t`",
|
||||
"\\/fo\\(o",
|
||||
" nd\\.<br",
|
||||
"\"BaR\"",
|
||||
"Not-ECT",
|
||||
"Ninteenth: Ninteenth",
|
||||
|
||||
# Connecton and file UIDs
|
||||
"[CF][a-zA-Z0-9]{17}",
|
||||
|
||||
# Smoot
|
||||
"Smoot",
|
||||
|
||||
"SIEM",
|
||||
]
|
||||
|
||||
extend-ignore-identifiers-re = [
|
||||
"TLS_.*_EDE.*_.*",
|
||||
"SSL.*_EDE.*_.*",
|
||||
"_3DES_EDE_CBC_SHA",
|
||||
"GOST_R_.*",
|
||||
"icmp6_nd_.*",
|
||||
"pn", # Use for `PoolNode` variables
|
||||
"complte_flag", # Existing use in exported record in base.
|
||||
"VidP(n|N)", # In SMB.
|
||||
"iin", # In DNP3.
|
||||
"(ScValidatePnPService|ScSendPnPMessage)", # In DCE-RPC.
|
||||
"snet", # Used as shorthand for subnet in base scripts.
|
||||
"typ",
|
||||
"tpe",
|
||||
]
|
||||
|
||||
[default.extend-identifiers]
|
||||
MCA_OCCURED = "MCA_OCCURED"
|
||||
MNT3ERR_ACCES = "MNT3ERR_ACCES"
|
||||
ND_QUEUE_OVERFLOW = "ND_QUEUE_OVERFLOW"
|
||||
ND_REDIRECT = "ND_REDIRECT"
|
||||
NFS3ERR_ACCES = "NFS3ERR_ACCES"
|
||||
NO_SEH = "NO_SEH"
|
||||
RPC_NT_CALL_FAILED_DNE = "RPC_NT_CALL_FAILED_DNE"
|
||||
RpcAddPrintProvidor = "RpcAddPrintProvidor"
|
||||
RpcDeletePrintProvidor = "RpcDeletePrintProvidor"
|
||||
THA = "THA"
|
||||
tha = "tha"
|
||||
uses_seh = "uses_seh"
|
||||
exat = "exat"
|
||||
EXAT = "EXAT"
|
||||
tpe = "tpe"
|
||||
|
||||
[default.extend-words]
|
||||
caf = "caf"
|
||||
helo = "helo"
|
||||
# Seems we use this in the management framework
|
||||
requestor = "requestor"
|
||||
# `inout` is used as a keyword in Spicy, but looks like a typo of `input`.
|
||||
inout = "inout"
|
5
doc/LICENSE
Normal file
5
doc/LICENSE
Normal file
|
@ -0,0 +1,5 @@
|
|||
This work is licensed under the Creative Commons
|
||||
Attribution 4.0 International License. To view a copy of this
|
||||
license, visit https://creativecommons.org/licenses/by/4.0/ or send
|
||||
a letter to Creative Commons, 444 Castro Street, Suite 900, Mountain
|
||||
View, California, 94041, USA.
|
37
doc/Makefile
Normal file
37
doc/Makefile
Normal file
|
@ -0,0 +1,37 @@
|
|||
SPHINXOPTS =
|
||||
|
||||
NUMJOBS ?= auto
|
||||
|
||||
all: html
|
||||
|
||||
doc: html
|
||||
|
||||
builddir:
|
||||
mkdir -p build/html
|
||||
|
||||
clean:
|
||||
rm -rf build/html
|
||||
|
||||
html: builddir
|
||||
sphinx-build -j $(NUMJOBS) -b html $(SPHINXOPTS) . ./build/html
|
||||
|
||||
livehtml: builddir
|
||||
sphinx-autobuild --ignore "*.git/*" --ignore "*.lock" --ignore "*.pyc" --ignore "*.swp" --ignore "*.swpx" --ignore "*.swx" -b html $(SPHINXOPTS) . ./build/html
|
||||
|
||||
commit:
|
||||
git add * && git commit -m 'Update generated docs'
|
||||
|
||||
spicy-%:
|
||||
git clone https://github.com/zeek/$@
|
||||
|
||||
check-spicy-docs: spicy-tftp
|
||||
@echo Refreshing checkouts
|
||||
@for REPO in $^; do (cd $$REPO && git pull && git reset HEAD --hard)>/dev/null; done
|
||||
@
|
||||
@echo Checking whether docs for Spicy integration are up-to-date
|
||||
@./devel/spicy/autogen-spicy-docs spicy-tftp
|
||||
@
|
||||
@git diff --quiet devel/spicy/autogen/ \
|
||||
|| (echo "Spicy docs are not up-to-date, rerun './devel/spicy/autogen-spicy-docs'." && exit 1)
|
||||
|
||||
.PHONY : all doc builddir clean html livehtml
|
132
doc/README
Normal file
132
doc/README
Normal file
|
@ -0,0 +1,132 @@
|
|||
.. _zeek-docs: https://github.com/zeek/zeek-docs
|
||||
.. _Read the Docs: https://docs.readthedocs.io/en/stable/index.html
|
||||
.. _Zeek repo: https://github.com/zeek/zeek
|
||||
.. _Sphinx: https://www.sphinx-doc.org/en/master
|
||||
.. _pip: https://pypi.org/project/pip
|
||||
|
||||
Zeek Documentation
|
||||
==================
|
||||
|
||||
The documentation repo at zeek-docs_
|
||||
contains version-specific Zeek documentation source files that are ultimately
|
||||
used as the basis for content hosted at https://docs.zeek.org.
|
||||
|
||||
Markup Format, Style, and Conventions
|
||||
-------------------------------------
|
||||
|
||||
For general guidance on the basics of how the documentation is written,
|
||||
consult this Zeek wiki:
|
||||
|
||||
https://github.com/zeek/zeek/wiki/Documentation-Style-and-Conventions
|
||||
|
||||
Source-Tree Organization
|
||||
------------------------
|
||||
|
||||
The zeek-docs_ repo containing this README file is the root of a Sphinx_ source
|
||||
tree and can be modified to add more documentation, style sheets, JavaScript,
|
||||
etc. The Sphinx config file is ``conf.py``. The typical way new documents get
|
||||
integrated is from them being referenced directly in ``index.rst`` or
|
||||
indirectly from something in the ``toctree`` (Table of Contents Tree) specified
|
||||
in that main index.
|
||||
|
||||
There is also a custom Sphinx domain implemented in ``ext/zeek.py`` which adds
|
||||
some reStructureText (reST) directives and roles that aid in generating useful
|
||||
index entries and cross-references. This primarily supports integration with
|
||||
the script-reference sections, some of which are auto-generated by Zeek's
|
||||
Doxygen-like feature, named "Zeekygen". The bulk of auto-generated content
|
||||
lives under the ``scripts/`` directory or has a file name starting with
|
||||
"autogenerated", so if you find yourself wanting to change those, you should
|
||||
actually look at at doing those changes within the `Zeek repo`_ itself rather
|
||||
than here, so see the next section for how Zeekygen docs can be (re)generated.
|
||||
|
||||
Generating Zeekygen Reference Docs
|
||||
----------------------------------
|
||||
|
||||
All Zeekygen-generated docs get committed into Git, so if you don't have to
|
||||
perform any changes on it and just want to preview what's already existing,
|
||||
you can skip down to the next :ref:`Local Previewing <local-doc-preview>` section.
|
||||
|
||||
The Zeekygen documentation-generation feature is a part of Zeek itself, so
|
||||
you'll want to obtain the `Zeek repo`_ from Git, read the :doc:`INSTALL
|
||||
</install>` file directions to install required dependencies, and build Zeek::
|
||||
|
||||
git clone --recursive https://github.com/zeek/zeek
|
||||
cd zeek
|
||||
# Read INSTALL file and get dependencies here
|
||||
./configure && make -j $(nproc)
|
||||
# Make desired edits to scripts/, src/, etc.
|
||||
./ci/update-zeekygen-docs.sh
|
||||
|
||||
The last command runs a script to generate documentation, which will end up in
|
||||
the ``doc/`` subdirectory. Note that ``doc/`` is just a Git submodule of this
|
||||
this zeek-docs_ repository, so you can run ``git status`` there to find exactly
|
||||
what changed.
|
||||
|
||||
Also note that the documentation-generation script is run automatically
|
||||
on a daily basis to incorporate up any documentation changes that people make
|
||||
in Zeek itself without them having to necessarily be aware of the full
|
||||
documentation process. The GitHub Action that does that daily task is
|
||||
located in the Zeek repo's ``.github/workflows/generate-docs.yml`` file.
|
||||
|
||||
.. _local-doc-preview:
|
||||
|
||||
Local Previewing (How To Build)
|
||||
-------------------------------
|
||||
|
||||
First make sure you have the required dependencies used for building docs:
|
||||
|
||||
* Python interpreter >= 3.9
|
||||
* Sphinx: https://www.sphinx-doc.org/en/master/
|
||||
* Read the Docs Sphinx Theme: https://github.com/rtfd/sphinx_rtd_theme
|
||||
* GitPython: https://github.com/gitpython-developers/GitPython
|
||||
|
||||
If you have pip_, you may just use the command ``pip3 install -r
|
||||
requirements.txt`` to install all the dependencies using the
|
||||
``requirements.txt`` from zeek-docs_.
|
||||
|
||||
Now run ``make`` within the zeek-docs_ repository's top-level to locally render
|
||||
its reST files into HTML. After the build completes, HTML documentation is
|
||||
symlinked in ``build/html`` and you can open the ``index.html`` found there in
|
||||
your web browser.
|
||||
|
||||
There's also a ``make livehtml`` (requires ``pip3 install sphinx-autobuild``)
|
||||
target in the top-level Makefile that is useful for editing the reST files and
|
||||
seeing changes rendered out live to a separate browser.
|
||||
|
||||
Hosting
|
||||
-------
|
||||
|
||||
Documentation is hosted by `Read the Docs`_ (RTD), so you can generally read
|
||||
about how it works there. The web-interface is accessible via
|
||||
https://readthedocs.org/projects/zeek-docs.
|
||||
|
||||
How zeek-docs_ is configured to use RTD is a combination of some custom
|
||||
settings in its ``.readthedocs.yml`` file and others only accessible through
|
||||
RTD's web-interface (e.g. domain and subproject settings). Most config
|
||||
settings are likely understandable just by browsing the web-interface and
|
||||
RTD's guides, but a few particular points to mention:
|
||||
|
||||
* There is an associated, always-failing project at
|
||||
https://readthedocs.org/projects/zeek. It's always-failing because
|
||||
RTD redirects only activate when pages 404 and this project exists so that
|
||||
all attempts to use https://zeek.rtfd.io or https://zeek.readthedocs.io
|
||||
get redirected to https://docs.zeek.org. Those would have been the project
|
||||
URLs if ownership of the RTD 'zeek' project was had from the start, but
|
||||
it was only obtained later, after documentation already started development
|
||||
in the 'zeek-docs' RTD project slug.
|
||||
|
||||
* Over time, page redirects have accrued into ``redirects.yml`` as a way to
|
||||
help document what they are and why they happened and also as a potential
|
||||
way to automate addition/reinstantiation of a large number of redirects,
|
||||
but typically redirects can be manually added via the RTD web interface
|
||||
first and then noted in ``redirects.yml``
|
||||
|
||||
* There are RTD subprojects for things like Broker, Package Manager,
|
||||
and Spicy. The use of subprojects simply allows access to their RTD
|
||||
docs via the custom domain of https://docs.zeek.org
|
||||
|
||||
* RTD will auto-build any newly-pushed commits to zeek-docs_ (i.e. a webhook is
|
||||
configured), but if a tag is changed to point somewhere different, you'll
|
||||
typically have to go into the RTD web interface, "Edit" the associated
|
||||
version under "Versions", "wipe" the existing docs, and then manually trigger
|
||||
a rebuild of that version tag under "Builds".
|
132
doc/README.rst
Normal file
132
doc/README.rst
Normal file
|
@ -0,0 +1,132 @@
|
|||
.. _zeek-docs: https://github.com/zeek/zeek-docs
|
||||
.. _Read the Docs: https://docs.readthedocs.io/en/stable/index.html
|
||||
.. _Zeek repo: https://github.com/zeek/zeek
|
||||
.. _Sphinx: https://www.sphinx-doc.org/en/master
|
||||
.. _pip: https://pypi.org/project/pip
|
||||
|
||||
Zeek Documentation
|
||||
==================
|
||||
|
||||
The documentation repo at zeek-docs_
|
||||
contains version-specific Zeek documentation source files that are ultimately
|
||||
used as the basis for content hosted at https://docs.zeek.org.
|
||||
|
||||
Markup Format, Style, and Conventions
|
||||
-------------------------------------
|
||||
|
||||
For general guidance on the basics of how the documentation is written,
|
||||
consult this Zeek wiki:
|
||||
|
||||
https://github.com/zeek/zeek/wiki/Documentation-Style-and-Conventions
|
||||
|
||||
Source-Tree Organization
|
||||
------------------------
|
||||
|
||||
The zeek-docs_ repo containing this README file is the root of a Sphinx_ source
|
||||
tree and can be modified to add more documentation, style sheets, JavaScript,
|
||||
etc. The Sphinx config file is ``conf.py``. The typical way new documents get
|
||||
integrated is from them being referenced directly in ``index.rst`` or
|
||||
indirectly from something in the ``toctree`` (Table of Contents Tree) specified
|
||||
in that main index.
|
||||
|
||||
There is also a custom Sphinx domain implemented in ``ext/zeek.py`` which adds
|
||||
some reStructureText (reST) directives and roles that aid in generating useful
|
||||
index entries and cross-references. This primarily supports integration with
|
||||
the script-reference sections, some of which are auto-generated by Zeek's
|
||||
Doxygen-like feature, named "Zeekygen". The bulk of auto-generated content
|
||||
lives under the ``scripts/`` directory or has a file name starting with
|
||||
"autogenerated", so if you find yourself wanting to change those, you should
|
||||
actually look at at doing those changes within the `Zeek repo`_ itself rather
|
||||
than here, so see the next section for how Zeekygen docs can be (re)generated.
|
||||
|
||||
Generating Zeekygen Reference Docs
|
||||
----------------------------------
|
||||
|
||||
All Zeekygen-generated docs get committed into Git, so if you don't have to
|
||||
perform any changes on it and just want to preview what's already existing,
|
||||
you can skip down to the next :ref:`Local Previewing <local-doc-preview>` section.
|
||||
|
||||
The Zeekygen documentation-generation feature is a part of Zeek itself, so
|
||||
you'll want to obtain the `Zeek repo`_ from Git, read the :doc:`INSTALL
|
||||
</install>` file directions to install required dependencies, and build Zeek::
|
||||
|
||||
git clone --recursive https://github.com/zeek/zeek
|
||||
cd zeek
|
||||
# Read INSTALL file and get dependencies here
|
||||
./configure && make -j $(nproc)
|
||||
# Make desired edits to scripts/, src/, etc.
|
||||
./ci/update-zeekygen-docs.sh
|
||||
|
||||
The last command runs a script to generate documentation, which will end up in
|
||||
the ``doc/`` subdirectory. Note that ``doc/`` is just a Git submodule of this
|
||||
this zeek-docs_ repository, so you can run ``git status`` there to find exactly
|
||||
what changed.
|
||||
|
||||
Also note that the documentation-generation script is run automatically
|
||||
on a daily basis to incorporate up any documentation changes that people make
|
||||
in Zeek itself without them having to necessarily be aware of the full
|
||||
documentation process. The GitHub Action that does that daily task is
|
||||
located in the Zeek repo's ``.github/workflows/generate-docs.yml`` file.
|
||||
|
||||
.. _local-doc-preview:
|
||||
|
||||
Local Previewing (How To Build)
|
||||
-------------------------------
|
||||
|
||||
First make sure you have the required dependencies used for building docs:
|
||||
|
||||
* Python interpreter >= 3.9
|
||||
* Sphinx: https://www.sphinx-doc.org/en/master/
|
||||
* Read the Docs Sphinx Theme: https://github.com/rtfd/sphinx_rtd_theme
|
||||
* GitPython: https://github.com/gitpython-developers/GitPython
|
||||
|
||||
If you have pip_, you may just use the command ``pip3 install -r
|
||||
requirements.txt`` to install all the dependencies using the
|
||||
``requirements.txt`` from zeek-docs_.
|
||||
|
||||
Now run ``make`` within the zeek-docs_ repository's top-level to locally render
|
||||
its reST files into HTML. After the build completes, HTML documentation is
|
||||
symlinked in ``build/html`` and you can open the ``index.html`` found there in
|
||||
your web browser.
|
||||
|
||||
There's also a ``make livehtml`` (requires ``pip3 install sphinx-autobuild``)
|
||||
target in the top-level Makefile that is useful for editing the reST files and
|
||||
seeing changes rendered out live to a separate browser.
|
||||
|
||||
Hosting
|
||||
-------
|
||||
|
||||
Documentation is hosted by `Read the Docs`_ (RTD), so you can generally read
|
||||
about how it works there. The web-interface is accessible via
|
||||
https://readthedocs.org/projects/zeek-docs.
|
||||
|
||||
How zeek-docs_ is configured to use RTD is a combination of some custom
|
||||
settings in its ``.readthedocs.yml`` file and others only accessible through
|
||||
RTD's web-interface (e.g. domain and subproject settings). Most config
|
||||
settings are likely understandable just by browsing the web-interface and
|
||||
RTD's guides, but a few particular points to mention:
|
||||
|
||||
* There is an associated, always-failing project at
|
||||
https://readthedocs.org/projects/zeek. It's always-failing because
|
||||
RTD redirects only activate when pages 404 and this project exists so that
|
||||
all attempts to use https://zeek.rtfd.io or https://zeek.readthedocs.io
|
||||
get redirected to https://docs.zeek.org. Those would have been the project
|
||||
URLs if ownership of the RTD 'zeek' project was had from the start, but
|
||||
it was only obtained later, after documentation already started development
|
||||
in the 'zeek-docs' RTD project slug.
|
||||
|
||||
* Over time, page redirects have accrued into ``redirects.yml`` as a way to
|
||||
help document what they are and why they happened and also as a potential
|
||||
way to automate addition/reinstantiation of a large number of redirects,
|
||||
but typically redirects can be manually added via the RTD web interface
|
||||
first and then noted in ``redirects.yml``
|
||||
|
||||
* There are RTD subprojects for things like Broker, Package Manager,
|
||||
and Spicy. The use of subprojects simply allows access to their RTD
|
||||
docs via the custom domain of https://docs.zeek.org
|
||||
|
||||
* RTD will auto-build any newly-pushed commits to zeek-docs_ (i.e. a webhook is
|
||||
configured), but if a tag is changed to point somewhere different, you'll
|
||||
typically have to go into the RTD web interface, "Edit" the associated
|
||||
version under "Versions", "wipe" the existing docs, and then manually trigger
|
||||
a rebuild of that version tag under "Builds".
|
32
doc/_static/theme_overrides.css
vendored
Normal file
32
doc/_static/theme_overrides.css
vendored
Normal file
|
@ -0,0 +1,32 @@
|
|||
/* override table width restrictions */
|
||||
@media screen and (min-width: 767px) {
|
||||
|
||||
.wy-table-responsive table td {
|
||||
/* !important prevents the common CSS stylesheets from overriding
|
||||
this as on RTD they are loaded after this stylesheet */
|
||||
white-space: normal !important;
|
||||
}
|
||||
|
||||
.wy-table-responsive {
|
||||
overflow: visible !important;
|
||||
}
|
||||
}
|
||||
|
||||
h1, h2, h3, h4, h5, h6 {
|
||||
color: #294488;
|
||||
font-family: 'Open Sans',Helvetica,Arial,Lucida,sans-serif!important;
|
||||
}
|
||||
|
||||
a {
|
||||
color: #2ea3f2;
|
||||
}
|
||||
|
||||
body {
|
||||
font-family: "Open Sans",Arial,sans-serif;
|
||||
color: #666;
|
||||
}
|
||||
|
||||
div.highlight pre strong {
|
||||
font-weight: 800;
|
||||
background-color: #ffffcc;
|
||||
}
|
15
doc/_templates/breadcrumbs.html
vendored
Normal file
15
doc/_templates/breadcrumbs.html
vendored
Normal file
|
@ -0,0 +1,15 @@
|
|||
{% extends "!breadcrumbs.html" %}
|
||||
|
||||
{% block breadcrumbs_aside %}
|
||||
<li class="wy-breadcrumbs-aside">
|
||||
{% if pagename != "search" %}
|
||||
{% if display_github %}
|
||||
{% if github_version == "master" %}
|
||||
<a href="https://{{ github_host|default("github.com") }}/{{ github_user }}/{{ github_repo }}/edit/{{ github_version }}{{ conf_py_path }}{{ pagename }}{{ page_source_suffix }}" class="fa fa-github"> {{ _('Edit on GitHub') }}</a>
|
||||
{% endif %}
|
||||
{% elif show_source and has_source and sourcename %}
|
||||
<a href="{{ pathto('_sources/' + sourcename, true)|e }}" rel="nofollow"> {{ _('View page source') }}</a>
|
||||
{% endif %}
|
||||
{% endif %}
|
||||
</li>
|
||||
{% endblock %}
|
14
doc/_templates/layout.html
vendored
Normal file
14
doc/_templates/layout.html
vendored
Normal file
|
@ -0,0 +1,14 @@
|
|||
{% extends "!layout.html" %}
|
||||
|
||||
{% if READTHEDOCS and current_version %}
|
||||
{% if current_version == "latest" or current_version == "stable"
|
||||
or current_version == "master" or current_version == "current"
|
||||
or current_version == "lts" or current_version == "LTS" %}
|
||||
{% set current_version = current_version ~ " (" ~ version ~ ")" %}
|
||||
{% endif %}
|
||||
{% endif %}
|
||||
|
||||
{% block menu %}
|
||||
{{ super() }}
|
||||
<a href="{{pathto('genindex.html', 1)}}">Index</a>
|
||||
{% endblock %}
|
256
doc/about.rst
Normal file
256
doc/about.rst
Normal file
|
@ -0,0 +1,256 @@
|
|||
==========
|
||||
About Zeek
|
||||
==========
|
||||
|
||||
What Is Zeek?
|
||||
=============
|
||||
|
||||
Zeek is a passive, open-source network traffic analyzer. Many operators use
|
||||
Zeek as a network security monitor (NSM) to support investigations of
|
||||
suspicious or malicious activity. Zeek also supports a wide range of traffic
|
||||
analysis tasks beyond the security domain, including performance measurement
|
||||
and troubleshooting.
|
||||
|
||||
The first benefit a new user derives from Zeek is the extensive set of logs
|
||||
describing network activity. These logs include not only a comprehensive record
|
||||
of every connection seen on the wire, but also application-layer transcripts.
|
||||
These include all HTTP sessions with their requested URIs, key headers, MIME
|
||||
types, and server responses; DNS requests with replies; SSL certificates; key
|
||||
content of SMTP sessions; and much more. By default, Zeek writes all this
|
||||
information into well-structured tab-separated or JSON log files suitable for
|
||||
post-processing with external software. Users can also choose to have external
|
||||
databases or SIEM products consume, store, process, and present the data for
|
||||
querying.
|
||||
|
||||
In addition to the logs, Zeek comes with built-in functionality for a range of
|
||||
analysis and detection tasks, including extracting files from HTTP sessions,
|
||||
detecting malware by interfacing to external registries, reporting vulnerable
|
||||
versions of software seen on the network, identifying popular web applications,
|
||||
detecting SSH brute-forcing, validating SSL certificate chains, and much more.
|
||||
|
||||
In addition to shipping such powerful functionality “out of the box,” Zeek is a
|
||||
fully customizable and extensible platform for traffic analysis. Zeek provides
|
||||
users a domain-specific, Turing-complete scripting language for expressing
|
||||
arbitrary analysis tasks. Think of the Zeek language as a “domain-specific
|
||||
Python” (or Perl): just like Python, the system comes with a large set of
|
||||
pre-built functionality (the “standard library”), yet users can also put Zeek
|
||||
to use in novel ways by writing custom code. Indeed, all of Zeek’s default
|
||||
analyses, including logging, are done via scripts; no specific analysis is
|
||||
hard-coded into the core of the system.
|
||||
|
||||
Zeek runs on commodity hardware and hence provides a low-cost alternative to
|
||||
expensive proprietary solutions. In many ways Zeek exceeds the capabilities of
|
||||
other network monitoring tools, which typically remain limited to a small set
|
||||
of hard-coded analysis tasks. Zeek is not a classic signature-based intrusion
|
||||
detection system (IDS); while it supports such standard functionality as well,
|
||||
Zeek’s scripting language facilitates a much broader spectrum of very different
|
||||
approaches to finding malicious activity. These include semantic misuse
|
||||
detection, anomaly detection, and behavioral analysis.
|
||||
|
||||
A large variety of sites deploy Zeek to protect their infrastructure, including
|
||||
many universities, research labs, supercomputing centers, open-science
|
||||
communities, major corporations, and government agencies. Zeek specifically
|
||||
targets high-speed, high-volume network monitoring, and an increasing number of
|
||||
sites are now using the system to monitor their 10GE networks, with some
|
||||
already moving on to 100GE links.
|
||||
|
||||
Zeek accommodates high-performance settings by supporting scalable
|
||||
load-balancing. Large sites typically run “Zeek Clusters” in which a high-speed
|
||||
front end load balancer distributes the traffic across an appropriate number of
|
||||
back end PCs, all running dedicated Zeek instances on their individual traffic
|
||||
slices. A central manager system coordinates the process, synchronizing state
|
||||
across the back ends and providing the operators with a central management
|
||||
interface for configuration and access to aggregated logs. Zeek’s integrated
|
||||
management framework, ZeekControl, supports such cluster setups out-of-the-box.
|
||||
|
||||
Zeek’s cluster features support single-system and multi-system setups. That's
|
||||
part of Zeek’s scalability advantages. For example, administrators can scale
|
||||
Zeek within one system for as long as possible, and then transparently add more
|
||||
systems when necessary.
|
||||
|
||||
In brief, Zeek is optimized for interpreting network traffic and generating
|
||||
logs based on that traffic. It is not optimized for byte matching, and users
|
||||
seeking signature detection approaches would be better served by trying
|
||||
intrusion detection systems such as Suricata. Zeek is also not a protocol
|
||||
analyzer in the sense of Wireshark, seeking to depict every element of network
|
||||
traffic at the frame level, or a system for storing traffic in packet capture
|
||||
(PCAP) form. Rather, Zeek sits at the “happy medium” representing compact yet
|
||||
high fidelity network logs, generating better understanding of network traffic
|
||||
and usage.
|
||||
|
||||
Why Zeek?
|
||||
=========
|
||||
|
||||
Zeek offers many advantages for security and network teams who want to better
|
||||
understand how their infrastructure is being used.
|
||||
|
||||
Security teams generally depend upon four sorts of data sources when trying to
|
||||
detect and respond to suspicious and malicious activity. These include *third
|
||||
party* sources such as law enforcement, peers, and commercial or nonprofit
|
||||
threat intelligence organizations; *network data*; *infrastructure and
|
||||
application data*, including logs from cloud environments; and *endpoint data*.
|
||||
Zeek is primarily a platform for collecting and analyzing the second form of
|
||||
data -- network data. All four are important elements of any security team’s
|
||||
program, however.
|
||||
|
||||
When looking at data derived from the network, there are four types of data
|
||||
available to analysts. As defined by the `network security monitoring paradigm
|
||||
<https://corelight.blog/2019/04/30/do-you-know-your-nsm-data-types/>`_, these
|
||||
four data types are *full content*, *transaction data*, *extracted content*,
|
||||
and *alert data*. Using these data types, one can record traffic, summarize
|
||||
traffic, extract traffic (or perhaps more accurately, extract content
|
||||
in the form of files), and judge traffic, respectively.
|
||||
|
||||
It’s critical to collect and analyze the four types of network security
|
||||
monitoring data. The question becomes one of determining the best way to
|
||||
accomplish this goal. Thankfully, Zeek as a NSM platform enables collection of
|
||||
at least two, and in some ways three, of these data forms, namely transaction
|
||||
data, extracted content, and alert data.
|
||||
|
||||
Zeek is best known for its transaction data. By default, when run and told to
|
||||
watch a network interface, Zeek will generate a compact,
|
||||
high-fidelity, richly-annotated set of transaction logs. These logs describe
|
||||
the protocols and activity seen on the wire, in a judgement-free,
|
||||
policy-neutral manner. This documentation will spend a considerable amount of
|
||||
time describing the most common Zeek log files such that readers will become
|
||||
comfortable with the format and learn to apply them to their environment.
|
||||
|
||||
Zeek can also easily carve files from network traffic, thanks to its file
|
||||
extraction capabilities. Analysts can then send those files to execution
|
||||
sandboxes or other file examination tools for additional investigation. Zeek
|
||||
has some capability to perform classical byte-centric intrusion detection, but
|
||||
that job is best suited for packages like the open source Snort or Suricata
|
||||
engines. Zeek has other capabilities, however, that can provide
|
||||
judgements in the form of alerts, through its notice mechanism.
|
||||
|
||||
Zeek is not optimized for writing traffic to disk in the spirit of a full
|
||||
content data collection, and that task is best handled by software written to
|
||||
fulfill that requirement.
|
||||
|
||||
Beyond the forms of network data that Zeek can natively collect and generate,
|
||||
Zeek has advantages that appeared in the `What Is Zeek?`_ section. These
|
||||
include its built-in functionality for a range of analysis and detection
|
||||
tasks, and its status as a fully customizable and extensible platform for
|
||||
traffic analysis. Zeek is also attractive because of its ability to run on
|
||||
commodity hardware, giving users of all types the ability to at least try Zeek
|
||||
in a low-cost manner.
|
||||
|
||||
History
|
||||
=======
|
||||
|
||||
Zeek has a rich history stretching back to the 1990s. `Vern Paxson
|
||||
<http://www.icir.org/vern/>`_ designed and implemented the initial version in
|
||||
1995 as a researcher at the `Lawrence Berkeley National Laboratory (LBNL)
|
||||
<http://www.lbl.gov/>`_. The original software was called “Bro,” as an
|
||||
“Orwellian reminder that monitoring comes hand in hand with the potential
|
||||
for privacy violations”.
|
||||
|
||||
LBNL first deployed Zeek in 1996, and the USENIX Security Symposium published
|
||||
Vern’s original paper on Zeek in 1998, and awarded it the Best Paper Award that
|
||||
year. He published a refined version of the paper in 1999 as `Bro: A System for
|
||||
Detecting Network Intruders in Real-Time
|
||||
<http://www.icir.org/vern/papers/bro-CN99.pdf>`_.
|
||||
|
||||
In 2003, the `National Science Foundation (NSF) <http://www.nsf.gov/>`_ began
|
||||
supporting research and advanced development on Bro at the `International
|
||||
Computer Science Institute (ICSI) <http://www.icsi.berkeley.edu/>`_. (Vern
|
||||
still leads the ICSI `Networking and Security group <http://www.icir.org/>`_.)
|
||||
|
||||
Over the years, a growing team of ICSI researchers and students kept adding
|
||||
novel functions to Zeek, while LBNL continued its support with funding from the
|
||||
`Department of Energy (DOE) <http://www.doe.gov/>`_. Much of Zeek’s
|
||||
capabilities originate in academic research projects, with results often
|
||||
published at top-tier conferences. A key to Zeek’s success was the project’s
|
||||
ability to bridge the gap between academia and operations. This relationship
|
||||
helped ground research on Zeek in real-world challenges.
|
||||
|
||||
With a growing operational user community, the research-centric development
|
||||
model eventually became a bottleneck to the system’s evolution. Research
|
||||
grants did not support the more mundane parts of software development and
|
||||
maintenance. However, those elements were crucial for the end-user experience.
|
||||
As a result, deploying Zeek required overcoming a steep learning curve.
|
||||
|
||||
In 2010, NSF sought to address this challenge by awarding ICSI a grant from its
|
||||
Software Development for Cyberinfrastructure fund. The `National Center for
|
||||
Supercomputing Applications (NCSA) <http://www.ncsa.illinois.edu/>`_ joined the
|
||||
team as a core partner, and the Zeek project began to overhaul many of the
|
||||
user-visible parts of the system for the 2.0 release in 2012.
|
||||
|
||||
After Zeek 2.0, the project enjoyed tremendous growth in new deployments across
|
||||
a diverse range of settings, and the ongoing collaboration between ICSI (co-PI
|
||||
Robin Sommer) and NCSA (co-PI Adam Slagell) brought a number of important
|
||||
features. In 2012, Zeek added native IPv6 support, long before many enterprise
|
||||
network monitoring tools. In 2013, NSF renewed its support with a second
|
||||
grant that established the Bro Center of Expertise at ICSI and NCSA, promoting
|
||||
Zeek as a comprehensive, low-cost security capability for research and
|
||||
education communities. To facilitate both debugging and education,
|
||||
`try.zeek.org <https://try.zeek.org>`_ (formerly try.bro.org) was launched in
|
||||
2014. This provided an interactive way for users to test a script with their
|
||||
own packet captures against a variety of Zeek versions and easily share
|
||||
sample code with others. For Zeek clusters and external communication,
|
||||
the Broker communication framework was added. Last, but not least, the
|
||||
Zeek package manager was created in 2016, funded by an additional grant
|
||||
from the Mozilla Foundation.
|
||||
|
||||
In the fall of 2018, the project leadership team decided to change the name of
|
||||
the software from Bro to Zeek. The leadership team desired a name that better
|
||||
reflected the values of the community while avoiding the negative connotations
|
||||
of so-called “bro culture” outside the computing world. The project released
|
||||
version 3.0 in the fall of 2019, the first release bearing the name Zeek. The
|
||||
year 2020 saw a renewed focus on community and growing the Zeek community, with
|
||||
increased interaction via social media, webinars, Slack channels, and related
|
||||
outreach efforts.
|
||||
|
||||
For a history of the project from 1995 to 2015, see Vern Paxson’s talk from
|
||||
BroCon 2015, `Reflecting on Twenty Years of Bro
|
||||
<https://www.youtube.com/watch?v=pb9HlmV0s2A>`_.
|
||||
|
||||
For background on the decision to rename Bro to Zeek, see Vern Paxson’s talk
|
||||
from BroCon 2018, `Renaming Bro
|
||||
<https://www.youtube.com/watch?v=L88ZYfjPzyk>`_.
|
||||
|
||||
Architecture
|
||||
============
|
||||
|
||||
.. image:: /images/architecture.png
|
||||
:align: center
|
||||
:scale: 75%
|
||||
|
||||
At a very high level, Zeek is architecturally layered into two major
|
||||
components. Its *event engine* (or *core*) reduces the incoming packet stream
|
||||
into a series of higher-level *events*. These events reflect network activity
|
||||
in policy-neutral terms, i.e., they describe *what* has been seen, but not
|
||||
*why*, or whether it is significant.
|
||||
|
||||
For example, every HTTP request on the wire turns into a corresponding
|
||||
:zeek:see:`http_request` event that carries with it the involved IP addresses
|
||||
and ports, the URI being requested, and the HTTP version in use. The event
|
||||
however does not convey any further *interpretation*, such as whether that URI
|
||||
corresponds to a known malware site.
|
||||
|
||||
The event engine component comprises a number of subcomponents, including in
|
||||
particular the packet processing pipeline consisting of: input sources,
|
||||
packet analysis, session analysis, and file analysis. Input sources ingest
|
||||
incoming network traffic from network interfaces. Packet analysis processes
|
||||
lower-level protocols, starting all the way down at the link layer. Session
|
||||
analysis handles application-layer protocols, such as HTTP, FTP, etc. File
|
||||
analysis dissects the content of files transferred over sessions. The event
|
||||
engine provides a plugin architecture for adding any of these from outside
|
||||
of the core Zeek code base, making it possible to expand Zeek’s capabilities as
|
||||
needed.
|
||||
|
||||
Semantics related to the events are derived by Zeek’s second main component,
|
||||
the *script interpreter*, which executes a set of *event handlers* written in
|
||||
Zeek’s custom scripting language. These scripts can express a site’s
|
||||
security policy, such as what actions to take when the monitor detects
|
||||
different types of activity.
|
||||
|
||||
More generally scripts can derive any desired properties and statistics from
|
||||
the input traffic. In fact, all of Zeek’s default output comes from scripts
|
||||
included in the distribution. Zeek’s language comes with extensive
|
||||
domain-specific types and support functionality. Crucially, Zeek’s language
|
||||
allows scripts to maintain state over time, enabling them to track and
|
||||
correlate the evolution of what they observe across connection and host
|
||||
boundaries. Zeek scripts can generate real-time alerts and also execute
|
||||
arbitrary external programs on demand. One might use this functionality to
|
||||
trigger an active response to an attack.
|
22
doc/acknowledgements.rst
Normal file
22
doc/acknowledgements.rst
Normal file
|
@ -0,0 +1,22 @@
|
|||
================
|
||||
Acknowledgements
|
||||
================
|
||||
|
||||
Thanks to everyone who contributed to making Zeek's documentation
|
||||
(alphabetically):
|
||||
|
||||
* Johanna Amann
|
||||
* Richard Bejtlich
|
||||
* Michael Dopheide
|
||||
* Amber Graner
|
||||
* Jan Grashöfer
|
||||
* Christian Kreibich
|
||||
* Terry Leach
|
||||
* Aashish Sharma
|
||||
* Jon Siwek
|
||||
* Stephen Smoot
|
||||
* Robin Sommer
|
||||
* Aaron Soto
|
||||
* Nick Turley
|
||||
* Fatema Bannat Wala
|
||||
* Tim Wojtulewicz
|
392
doc/building-from-source.rst
Normal file
392
doc/building-from-source.rst
Normal file
|
@ -0,0 +1,392 @@
|
|||
|
||||
.. _CMake: https://www.cmake.org
|
||||
.. _SWIG: https://www.swig.org
|
||||
.. _Xcode: https://developer.apple.com/xcode/
|
||||
.. _MacPorts: https://www.macports.org
|
||||
.. _Fink: https://www.finkproject.org
|
||||
.. _Homebrew: https://brew.sh
|
||||
.. _downloads page: https://zeek.org/get-zeek
|
||||
.. _devtoolset: https://developers.redhat.com/products/developertoolset/hello-world
|
||||
.. _zkg package manager: https://docs.zeek.org/projects/package-manager/en/stable/
|
||||
.. _crosstool-NG: https://crosstool-ng.github.io/
|
||||
.. _CMake toolchain: https://cmake.org/cmake/help/latest/manual/cmake-toolchains.7.html
|
||||
.. _contribute: https://github.com/zeek/zeek/wiki/Contribution-Guide
|
||||
.. _Chocolatey: https://chocolatey.org
|
||||
.. _Npcap: https://npcap.com/
|
||||
|
||||
.. _building-from-source:
|
||||
|
||||
====================
|
||||
Building from Source
|
||||
====================
|
||||
|
||||
Building Zeek from source provides the most control over your build and is the
|
||||
preferred approach for advanced users. We support a wide range of operating
|
||||
systems and distributions. Our `support policy
|
||||
<https://github.com/zeek/zeek/wiki/Platform-Support-Policy>`_ is informed by
|
||||
what we can run in our CI pipelines with reasonable effort, with the current
|
||||
status captured in our `support matrix
|
||||
<https://github.com/zeek/zeek/wiki/Zeek-Operating-System-Support-Matrix>`_.
|
||||
|
||||
Required Dependencies
|
||||
---------------------
|
||||
|
||||
Building Zeek from source requires the following dependencies, including
|
||||
development headers for libraries:
|
||||
|
||||
* Bash (for ZeekControl and BTest)
|
||||
* BIND8 library or greater (if not covered by system's libresolv)
|
||||
* Bison 3.3 or greater (https://www.gnu.org/software/bison/)
|
||||
* C/C++ compiler with C++17 support (GCC 8+ or Clang 9+)
|
||||
* CMake 3.15 or greater (https://www.cmake.org)
|
||||
* Flex (lexical analyzer generator) 2.6 or greater (https://github.com/westes/flex)
|
||||
* Libpcap (https://www.tcpdump.org)
|
||||
* Make
|
||||
* OpenSSL (https://www.openssl.org)
|
||||
* Python 3.9 or greater (https://www.python.org/)
|
||||
* SWIG (https://www.swig.org)
|
||||
* ZeroMQ (https://zeromq.org)
|
||||
* Zlib (https://zlib.net/)
|
||||
|
||||
To install these, you can use:
|
||||
|
||||
* RPM/RedHat-based Linux:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo dnf install bison cmake cppzmq-devel gcc gcc-c++ flex libpcap-devel make openssl-devel python3 python3-devel swig zlib-devel
|
||||
|
||||
On pre-``dnf`` systems, use ``yum`` instead. Additionally, on RHEL/CentOS 7,
|
||||
you can install and activate a devtoolset_ to get access to recent GCC
|
||||
versions. You will also have to install and activate CMake 3. For example:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo yum install cmake3 devtoolset-7
|
||||
scl enable devtoolset-7 bash
|
||||
|
||||
* DEB/Debian-based Linux:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo apt-get install bison cmake cppzmq-dev gcc g++ flex libfl-dev libpcap-dev libssl-dev make python3 python3-dev swig zlib1g-dev
|
||||
|
||||
If your platform doesn't offer ``cppzmq-dev``, try ``libzmq3-dev``
|
||||
instead. Zeek's build will fall back to an in-tree version of C++
|
||||
bindings to ZeroMQ in that case.
|
||||
|
||||
* FreeBSD:
|
||||
|
||||
Most required dependencies should come with a minimal FreeBSD install
|
||||
except for the following.
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo pkg install -y base64 bash bison cmake cppzmq git python3 swig
|
||||
pyver=`python3 -c 'import sys; print(f"py{sys.version_info[0]}{sys.version_info[1]}")'`
|
||||
sudo pkg install -y $pyver-sqlite3
|
||||
|
||||
* macOS:
|
||||
|
||||
Compiling source code on Macs requires first installing either Xcode_
|
||||
or the "Command Line Tools" (which is a much smaller download). To check
|
||||
if either is installed, run the ``xcode-select -p`` command. If you see
|
||||
an error message, then neither is installed and you can then run
|
||||
``xcode-select --install`` which will prompt you to either get Xcode (by
|
||||
clicking "Get Xcode") or to install the command line tools (by
|
||||
clicking "Install").
|
||||
|
||||
macOS comes with all required dependencies except for CMake_, SWIG_,
|
||||
Bison, Flex, and OpenSSL (OpenSSL headers were removed in macOS 10.11,
|
||||
therefore OpenSSL must be installed manually for macOS versions 10.11
|
||||
or newer).
|
||||
|
||||
Distributions of these dependencies can likely be obtained from your
|
||||
preferred macOS package management system (e.g. Homebrew_,
|
||||
MacPorts_, or Fink_). Specifically for Homebrew, the ``bison``, ``cmake``,
|
||||
``cppzmq``, ``flex``, ``swig``, and ``openssl`` packages
|
||||
provide the required dependencies. For MacPorts, use the ``bison``, ``cmake``,
|
||||
``cppzmq``, ``flex``, ``swig``, ``swig-python``, and ``openssl`` packages.
|
||||
|
||||
* Windows
|
||||
|
||||
Windows support is experimental. These instructions are meant as a starting
|
||||
point for development on that platform, and might have issues or be missing
|
||||
steps. Notify the Zeek team if any such problems arise.
|
||||
|
||||
Compiling on Windows requires the installation of a development environment.
|
||||
Zeek currently builds on Visual Studio 2019, and you can either install the
|
||||
full version including the UI tools or you can install the command-line tools
|
||||
and build from a shell. The instructions below describe how to install the
|
||||
command-line tools, but are not necessary if you install the full VS2019
|
||||
package. You will need to install Chocolatey_ in order to install the
|
||||
dependencies as instructed below. It's possible to install them from other
|
||||
sources (msys2, cygwin, etc), which we leave to the reader.
|
||||
|
||||
Cloning the repository will also require Developer Mode to be enabled in
|
||||
Windows. This is due to the existence of a number of symbolic links in the
|
||||
repository. Without Developer Mode, ``git`` on Windows will ignore these
|
||||
links and builds will fail. There are a couple of different ways to enable
|
||||
it, and the settings may differ depending on the version of Windows.
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
choco install -y --no-progress visualstudio2019buildtools --version=16.11.11.0
|
||||
choco install -y --no-progress visualstudio2019-workload-vctools --version=1.0.0 --package-parameters '--add Microsoft.VisualStudio.Component.VC.ATLMFC'
|
||||
choco install -y --no-progress sed
|
||||
choco install -y --no-progress winflexbison3
|
||||
choco install -y --no-progress msysgit
|
||||
choco install -y --no-progress python
|
||||
choco install -y --no-progress openssl --version=3.1.1
|
||||
|
||||
Once the dependencies are installed, you will need to add the Git installation
|
||||
to your PATH (``C:\Program Files\Git\bin`` by default). This is needed for the
|
||||
``sh`` command to be available during the build. Once all of the dependencies
|
||||
are in place, you will need to open a shell (PowerShell or cmd) and add the
|
||||
development environment to it. The following command is for running on an
|
||||
x86_64 host.
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
C:\Program Files (x86)\Microsoft Visual Studio\2019\BuildTools\VC\Auxiliary\Build\vcvarsall.bat x86_amd64
|
||||
|
||||
Now you can build via cmake:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
mkdir build
|
||||
cd build
|
||||
cmake.exe .. -DCMAKE_BUILD_TYPE=release -DENABLE_ZEEK_UNIT_TESTS=yes -DENABLE_CLUSTER_BACKEND_ZEROMQ=no -DVCPKG_TARGET_TRIPLET="x64-windows-static" -G Ninja
|
||||
cmake.exe --build .
|
||||
|
||||
All of this is duplicated in the CI configuration for Windows which lives in
|
||||
the ``ci/windows`` directory, and can be used as a reference for running the
|
||||
commands by hand.
|
||||
|
||||
Note: By default, Windows links against the standard libpcap library from
|
||||
vcpkg. This version of libpcap does not support packet capture on Windows,
|
||||
unlike other platforms. In order to capture packets from live interfaces on
|
||||
Windows, you will need to link against the Npcap_ library. This library is free
|
||||
for personal use, but requires a paid license for commercial use or
|
||||
redistribution. To link against Npcap, download the SDK from their website,
|
||||
unzip it, and then pass ``-DPCAP_ROOT_DIR="<path to npcap sdk>"`` to the
|
||||
initial CMake invocation for Zeek.
|
||||
|
||||
Note also that the ZeroMQ cluster backend is not yet supported on Windows.
|
||||
|
||||
Optional Dependencies
|
||||
---------------------
|
||||
|
||||
Zeek can make use of some optional libraries and tools if they are found at
|
||||
build time:
|
||||
|
||||
* libmaxminddb (for geolocating IP addresses)
|
||||
* sendmail (enables Zeek and ZeekControl to send mail)
|
||||
* curl (used by a Zeek script that implements active HTTP)
|
||||
* gperftools (tcmalloc is used to improve memory and CPU usage)
|
||||
* jemalloc (https://github.com/jemalloc/jemalloc)
|
||||
* PF_RING (Linux only, see :ref:`pf-ring-config`)
|
||||
* krb5 libraries and headers
|
||||
* ipsumdump (for trace-summary; https://github.com/kohler/ipsumdump)
|
||||
* hiredis (for the Redis storage backend)
|
||||
|
||||
Geolocation is probably the most interesting and can be installed on most
|
||||
platforms by following the instructions for :ref:`address geolocation and AS
|
||||
lookups <geolocation>`.
|
||||
|
||||
The `zkg package manager`_, included in the Zeek installation, requires
|
||||
two external Python modules:
|
||||
|
||||
* GitPython: https://pypi.org/project/GitPython/
|
||||
* semantic-version: https://pypi.org/project/semantic-version/
|
||||
|
||||
These install easily via pip (``pip3 install GitPython
|
||||
semantic-version``) and also ship with some distributions:
|
||||
|
||||
* RPM/RedHat-based Linux:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo yum install python3-GitPython python3-semantic_version
|
||||
|
||||
* DEB/Debian-based Linux:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo apt-get install python3-git python3-semantic-version
|
||||
|
||||
``zkg`` also requires a ``git`` installation, which the above system packages
|
||||
pull in as a dependency. If you install via pip, remember that you also need
|
||||
``git`` itself.
|
||||
|
||||
Retrieving the Sources
|
||||
----------------------
|
||||
|
||||
Zeek releases are bundled into source packages for convenience and are
|
||||
available on the `downloads page`_. The source code can be manually downloaded
|
||||
from the link in the ``.tar.gz`` format to the target system for installation.
|
||||
|
||||
If you plan to `contribute`_ to Zeek or just want to try out the latest
|
||||
features under development, you should obtain Zeek's source code through its
|
||||
Git repositories hosted at https://github.com/zeek:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
git clone --recurse-submodules https://github.com/zeek/zeek
|
||||
|
||||
.. note:: If you choose to clone the ``zeek`` repository
|
||||
non-recursively for a "minimal Zeek experience", be aware that
|
||||
compiling it depends on several of the other submodules as well, so
|
||||
you'll likely have to build/install those independently first.
|
||||
|
||||
Configuring and Building
|
||||
------------------------
|
||||
|
||||
The typical way to build and install from source is as follows:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
./configure
|
||||
make
|
||||
make install
|
||||
|
||||
If the ``configure`` script fails, then it is most likely because it either
|
||||
couldn't find a required dependency or it couldn't find a sufficiently new
|
||||
version of a dependency. Assuming that you already installed all required
|
||||
dependencies, then you may need to use one of the ``--with-*`` options
|
||||
that can be given to the ``configure`` script to help it locate a dependency.
|
||||
To find out what all different options ``./configure`` supports, run
|
||||
``./configure --help``.
|
||||
|
||||
The default installation path is ``/usr/local/zeek``, which would typically
|
||||
require root privileges when doing the ``make install``. A different
|
||||
installation path can be chosen by specifying the ``configure`` script
|
||||
``--prefix`` option. Note that ``/usr``, ``/opt/bro/``, and ``/opt/zeek`` are
|
||||
the standard prefixes for binary Zeek packages to be installed, so those are
|
||||
typically not good choices unless you are creating such a package.
|
||||
|
||||
OpenBSD users, please see our `FAQ <https://zeek.org/faq/>`_ if you are having
|
||||
problems installing Zeek.
|
||||
|
||||
Depending on the Zeek package you downloaded, there may be auxiliary
|
||||
tools and libraries available in the ``auxil/`` directory. Some of them
|
||||
will be automatically built and installed along with Zeek. There are
|
||||
``--disable-*`` options that can be given to the configure script to
|
||||
turn off unwanted auxiliary projects that would otherwise be installed
|
||||
automatically. Finally, use ``make install-aux`` to install some of
|
||||
the other programs that are in the ``auxil/zeek-aux`` directory.
|
||||
|
||||
Finally, if you want to build the Zeek documentation (not required, because
|
||||
all of the documentation for the latest Zeek release is available at
|
||||
https://docs.zeek.org), there are instructions in ``doc/README`` in the source
|
||||
distribution.
|
||||
|
||||
Cross Compiling
|
||||
---------------
|
||||
|
||||
Prerequisites
|
||||
~~~~~~~~~~~~~
|
||||
|
||||
You need three things on the host system:
|
||||
|
||||
1. The Zeek source tree.
|
||||
2. A cross-compilation toolchain, such as one built via crosstool-NG_.
|
||||
3. Pre-built Zeek dependencies from the target system. This usually
|
||||
includes libpcap, zlib, OpenSSL, and Python development headers
|
||||
and libraries.
|
||||
|
||||
Configuration and Compiling
|
||||
~~~~~~~~~~~~~~~~~~~~~~~~~~~
|
||||
|
||||
You first need to compile a few build tools native to the host system
|
||||
for use during the later cross-compile build. In the root of your
|
||||
Zeek source tree:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
./configure --builddir=../zeek-buildtools
|
||||
( cd ../zeek-buildtools && make binpac bifcl )
|
||||
|
||||
Next configure Zeek to use your cross-compilation toolchain (this example
|
||||
uses a Raspberry Pi as the target system):
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
./configure --toolchain=/home/jon/x-tools/RaspberryPi-toolchain.cmake --with-binpac=$(pwd)/../zeek-buildtools/auxil/binpac/src/binpac --with-bifcl=$(pwd)/../zeek-buildtools/src/bifcl
|
||||
|
||||
Here, the :file:`RaspberryPi-toolchain.cmake` file specifies a `CMake
|
||||
toolchain`_. In the toolchain file, you need to point the toolchain and
|
||||
compiler at the cross-compilation toolchain. It might look something like the
|
||||
following:
|
||||
|
||||
.. code-block:: cmake
|
||||
|
||||
# Operating system that CMake is targeting.
|
||||
set(CMAKE_SYSTEM_NAME Linux)
|
||||
|
||||
# The CMAKE_STAGING_PREFIX option may not work.
|
||||
# Given that Zeek is configured:
|
||||
#
|
||||
# ``./configure --prefix=<dir>``
|
||||
#
|
||||
# The options are:
|
||||
#
|
||||
# (1) ``make install`` and then copy over the --prefix dir from host to
|
||||
# target system.
|
||||
#
|
||||
# (2) ``DESTDIR=<staging_dir> make install`` and then copy over the
|
||||
# contents of that staging directory.
|
||||
|
||||
set(toolchain /home/jon/x-tools/arm-rpi-linux-gnueabihf)
|
||||
set(CMAKE_C_COMPILER ${toolchain}/bin/arm-rpi-linux-gnueabihf-gcc)
|
||||
set(CMAKE_CXX_COMPILER ${toolchain}/bin/arm-rpi-linux-gnueabihf-g++)
|
||||
|
||||
# The cross-compiler/linker will use these paths to locate dependencies.
|
||||
set(CMAKE_FIND_ROOT_PATH
|
||||
/home/jon/x-tools/zeek-rpi-deps
|
||||
${toolchain}/arm-rpi-linux-gnueabihf/sysroot
|
||||
)
|
||||
|
||||
set(CMAKE_FIND_ROOT_PATH_MODE_PROGRAM NEVER)
|
||||
set(CMAKE_FIND_ROOT_PATH_MODE_LIBRARY ONLY)
|
||||
set(CMAKE_FIND_ROOT_PATH_MODE_INCLUDE ONLY)
|
||||
|
||||
If that configuration succeeds you are ready to build:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
make
|
||||
|
||||
And if that works, install on your host system:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
make install
|
||||
|
||||
Once installed, you can copy/move the files from the installation prefix on the
|
||||
host system to the target system and start running Zeek as usual.
|
||||
|
||||
Configuring the Run-Time Environment
|
||||
====================================
|
||||
|
||||
You may want to adjust your :envvar:`PATH` environment variable
|
||||
according to the platform/shell/package you're using since
|
||||
neither :file:`/usr/local/zeek/bin/` nor :file:`/opt/zeek/bin/`
|
||||
will reside in the default :envvar:`PATH`. For example:
|
||||
|
||||
Bourne-Shell Syntax:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
export PATH=/usr/local/zeek/bin:$PATH
|
||||
|
||||
C-Shell Syntax:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
setenv PATH /usr/local/zeek/bin:$PATH
|
||||
|
||||
Or substitute ``/opt/zeek/bin`` instead if you installed from a binary package.
|
||||
|
||||
Zeek supports several environment variables to adjust its behavior. Take a look
|
||||
at the ``zeek --help`` output for details.
|
507
doc/cluster-setup.rst
Normal file
507
doc/cluster-setup.rst
Normal file
|
@ -0,0 +1,507 @@
|
|||
|
||||
.. _ZeekControl documentation: https://github.com/zeek/zeekctl
|
||||
|
||||
==================
|
||||
Zeek Cluster Setup
|
||||
==================
|
||||
|
||||
.. TODO: integrate BoZ revisions
|
||||
|
||||
A *Zeek Cluster* is a set of systems jointly analyzing the traffic of
|
||||
a network link in a coordinated fashion. You can operate such a setup from
|
||||
a central manager system easily using ZeekControl because it
|
||||
hides much of the complexity of the multi-machine installation.
|
||||
|
||||
Cluster Architecture
|
||||
====================
|
||||
|
||||
Zeek is not multithreaded, so once the limitations of a single processor core
|
||||
are reached the only option currently is to spread the workload across many
|
||||
cores, or even many physical computers. The cluster deployment scenario for
|
||||
Zeek is the current solution to build these larger systems. The tools and
|
||||
scripts that accompany Zeek provide the structure to easily manage many Zeek
|
||||
processes examining packets and doing correlation activities but acting as
|
||||
a singular, cohesive entity. This section describes the Zeek cluster
|
||||
architecture. For information on how to configure a Zeek cluster,
|
||||
see the documentation for `ZeekControl <https://github.com/zeek/zeekctl>`_.
|
||||
|
||||
Architecture
|
||||
------------
|
||||
|
||||
The figure below illustrates the main components of a Zeek cluster.
|
||||
|
||||
.. image:: /images/deployment.png
|
||||
|
||||
For more specific information on the way Zeek processes are connected,
|
||||
how they function, and how they communicate with each other, see the
|
||||
:ref:`Broker Framework Documentation <broker-framework>`.
|
||||
|
||||
Tap
|
||||
***
|
||||
The tap is a mechanism that splits the packet stream in order to make a copy
|
||||
available for inspection. Examples include the monitoring port on a switch
|
||||
and an optical splitter on fiber networks.
|
||||
|
||||
Frontend
|
||||
********
|
||||
The frontend is a discrete hardware device or on-host technique that splits
|
||||
traffic into many streams or flows. The Zeek binary does not do this job.
|
||||
There are numerous ways to accomplish this task, some of which are described
|
||||
below in `Frontend Options`_.
|
||||
|
||||
Manager
|
||||
*******
|
||||
The manager is a Zeek process that has two primary jobs. It receives log
|
||||
messages and notices from the rest of the nodes in the cluster using the Zeek
|
||||
communications protocol (note that if you use a separate logger node, then the
|
||||
logger receives all logs instead of the manager). The result
|
||||
is a single log instead of many discrete logs that you have to
|
||||
combine in some manner with post-processing.
|
||||
The manager also supports other functionality and analysis which
|
||||
requires a centralized, global view of events or data.
|
||||
|
||||
Logger
|
||||
******
|
||||
A logger is an optional Zeek process that receives log messages from the
|
||||
rest of the nodes in the cluster using the Zeek communications protocol.
|
||||
The purpose of having a logger receive logs instead of the manager is
|
||||
to reduce the load on the manager. If no logger is needed, then the
|
||||
manager will receive logs instead.
|
||||
|
||||
Proxy
|
||||
*****
|
||||
A proxy is a Zeek process that may be used to offload data storage or
|
||||
any arbitrary workload. A cluster may contain multiple proxy nodes.
|
||||
The default scripts that come with Zeek make minimal use of proxies, so
|
||||
a single one may be sufficient, but customized use of them to partition
|
||||
data or workloads provides greater cluster scalability potential than
|
||||
just doing similar tasks on a single, centralized Manager node.
|
||||
|
||||
Zeek processes acting as proxies don't tend to be extremely hard on CPU
|
||||
or memory and users frequently run proxy processes on the same physical
|
||||
host as the manager.
|
||||
|
||||
Worker
|
||||
******
|
||||
The worker is the Zeek process that sniffs network traffic and does protocol
|
||||
analysis on the reassembled traffic streams. Most of the work of an active
|
||||
cluster takes place on the workers and as such, the workers typically
|
||||
represent the bulk of the Zeek processes that are running in a cluster.
|
||||
The fastest memory and CPU core speed you can afford is recommended
|
||||
since all of the protocol parsing and most analysis will take place here.
|
||||
There are no particular requirements for the disks in workers since almost all
|
||||
logging is done remotely to the manager, and normally very little is written
|
||||
to disk.
|
||||
|
||||
Frontend Options
|
||||
----------------
|
||||
|
||||
There are many options for setting up a frontend flow distributor. In many
|
||||
cases it is beneficial to do multiple stages of flow distribution
|
||||
on the network and on the host.
|
||||
|
||||
Discrete hardware flow balancers
|
||||
********************************
|
||||
|
||||
cPacket
|
||||
^^^^^^^
|
||||
|
||||
If you are monitoring one or more 10G physical interfaces, the recommended
|
||||
solution is to use either a cFlow or cVu device from cPacket because they
|
||||
are used successfully at a number of sites. These devices will perform
|
||||
layer-2 load balancing by rewriting the destination Ethernet MAC address
|
||||
to cause each packet associated with a particular flow to have the same
|
||||
destination MAC. The packets can then be passed directly to a monitoring
|
||||
host where each worker has a BPF filter to limit its visibility to only that
|
||||
stream of flows, or onward to a commodity switch to split the traffic out to
|
||||
multiple 1G interfaces for the workers. This greatly reduces
|
||||
costs since workers can use relatively inexpensive 1G interfaces.
|
||||
|
||||
On host flow balancing
|
||||
**********************
|
||||
|
||||
PF_RING
|
||||
^^^^^^^
|
||||
|
||||
The PF_RING software for Linux has a "clustering" feature which will do
|
||||
flow-based load balancing across a number of processes that are sniffing the
|
||||
same interface. This allows you to easily take advantage of multiple
|
||||
cores in a single physical host because Zeek's main event loop is single
|
||||
threaded and can't natively utilize all of the cores. If you want to use
|
||||
PF_RING, see the documentation on :ref:`how to configure Zeek with PF_RING
|
||||
<pf-ring-config>`.
|
||||
|
||||
|
||||
AF_PACKET
|
||||
^^^^^^^^^
|
||||
|
||||
On Linux, Zeek supports `AF_PACKET sockets <https://docs.kernel.org/networking/packet_mmap.html>`_ natively.
|
||||
Currently, this is provided by including the `external Zeek::AF_Packet plugin <https://github.com/zeek/zeek-af_packet-plugin>`_
|
||||
in default builds of Zeek for Linux. Additional information can be found in
|
||||
the project's README file.
|
||||
|
||||
To check the availability of the ``af_packet`` packet source, print its information using ``zeek -N``::
|
||||
|
||||
zeek -N Zeek::AF_Packet
|
||||
Zeek::AF_Packet - Packet acquisition via AF_Packet (dynamic, version 3.2.0)
|
||||
|
||||
On FreeBSD, MacOSX, or if Zeek was built with ``--disable-af-packet``, the
|
||||
plugin won't be available.
|
||||
|
||||
Single worker mode
|
||||
""""""""""""""""""
|
||||
|
||||
For the most basic usage, prefix the interface with ``af_packet::`` when invoking Zeek::
|
||||
|
||||
zeek -i af_packet::eth0
|
||||
|
||||
Generally, running Zeek this way requires a privileged user with CAP_NET_RAW
|
||||
and CAP_NET_ADMIN capabilities. Linux supports file-based capabilities: A
|
||||
process executing an executable with capabilities will receive these.
|
||||
Using this mechanism makes it possible to run Zeek as an unprivileged user once the file
|
||||
capabilities have been added::
|
||||
|
||||
sudo setcap cap_net_raw,cap_net_admin=+eip /path/to/zeek
|
||||
|
||||
Offloading and ethtool tuning
|
||||
"""""""""""""""""""""""""""""
|
||||
|
||||
While not specific to AF_PACKET, it is recommended to disable any offloading
|
||||
features provided by the network card or Linux networking stack when running
|
||||
Zeek. This allows Zeek to observe network packets as they arrive on the wire.
|
||||
See this `blog post <https://blog.securityonion.net/2011/10/when-is-full-packet-capture-not-full.html>`_
|
||||
for more background.
|
||||
|
||||
Toggling these features can be done with the ``ethtool -K`` command, for example::
|
||||
|
||||
IFACE=eth0
|
||||
for offload in rx tx sg tso ufo gso gro lro; do
|
||||
ethtool -K $IFACE $offload off
|
||||
done
|
||||
|
||||
Detailed statistics about the interface can be gathered via ``ethtool -S``.
|
||||
|
||||
For more details around the involved offloads consult the
|
||||
`ethtool manpage <https://man7.org/linux/man-pages/man8/ethtool.8.html>`_.
|
||||
|
||||
Load balancing
|
||||
""""""""""""""
|
||||
|
||||
The more interesting use-case is to use AF_PACKET to run multiple Zeek workers
|
||||
and have their packet sockets join what is called a fanout group.
|
||||
In such a setup, the network traffic is load-balanced across Zeek workers.
|
||||
By default load balancing is based on symmetric flow hashes [#]_.
|
||||
|
||||
For example, running two Zeek workers listening on the same network interface,
|
||||
each worker analyzing approximately half of the network traffic, can be done
|
||||
as follows::
|
||||
|
||||
zeek -i af_packet::eth0 &
|
||||
zeek -i af_packet::eth0 &
|
||||
|
||||
The fanout group is identified by an id and configurable using the
|
||||
``AF_Packet::fanout_id`` constant which defaults to 23. In the example
|
||||
above, both Zeek workers join the same fanout group.
|
||||
|
||||
|
||||
.. note::
|
||||
|
||||
As a caveat, within the same Linux network namespace, two Zeek processes can
|
||||
not use the same fanout group id for listening on different network interfaces.
|
||||
If this is a setup you're planning on running, configure the fanout group
|
||||
ids explicitly.
|
||||
For illustration purposes, the following starts two Zeek workers each using
|
||||
a different network interface and fanout group id::
|
||||
|
||||
zeek -i af_packet::eth0 AF_Packet::fanout_id=23 &
|
||||
zeek -i af_packet::eth1 AF_Packet::fanout_id=24 &
|
||||
|
||||
.. warning::
|
||||
|
||||
Zeek workers crashing or restarting due to running out of memory can,
|
||||
for a short period of time, disturb load balancing due to their packet
|
||||
sockets being removed and later rejoining the fanout group.
|
||||
This may be visible in Zeek logs as gaps and/or duplicated connection
|
||||
entries produced by different Zeek workers.
|
||||
|
||||
See :ref:`cluster-configuration` for instructions how to configure AF_PACKET
|
||||
with ZeekControl.
|
||||
|
||||
|
||||
Netmap
|
||||
^^^^^^
|
||||
|
||||
`Netmap <https://github.com/luigirizzo/netmap>`_ is a framework for fast
|
||||
packet I/O that is natively supported on FreeBSD since version 10.
|
||||
On Linux it can be installed as an out-of-tree kernel module.
|
||||
|
||||
FreeBSD
|
||||
"""""""
|
||||
FreeBSD's libpcap library supports netmap natively. This makes it possible to prefix
|
||||
interface names with ``netmap:`` to instruct libpcap to open the interface
|
||||
in netmap mode. For example, a single Zeek worker can leverage netmap
|
||||
transparently using Zeek's default packet source as follows::
|
||||
|
||||
zeek -i netmap:em0
|
||||
|
||||
.. warning::
|
||||
|
||||
Above command will put the em0 interface into kernel-bypass mode. Network
|
||||
packets will pass directly to Zeek without being interpreted by the kernel.
|
||||
If em0 is your primary network interface, this effectively disables
|
||||
networking, including SSH connectivity.
|
||||
|
||||
If your network card supports multiple rings, individual Zeek workers can be
|
||||
attached to these as well (this assumes the NIC does proper flow hashing in hardware)::
|
||||
|
||||
zeek -i netmap:em0-0
|
||||
zeek -i netmap:em0-1
|
||||
|
||||
For software load balancing support, the FreeBSD source tree includes the
|
||||
``lb`` tool to distribute packets into netmap pipes doing flow hashing
|
||||
in user-space.
|
||||
|
||||
To compile and install ``lb``, ensure ``/usr/src`` is available on your
|
||||
FreeBSD system, then run the following commands::
|
||||
|
||||
cd /usr/src/tools/tools/netmap/
|
||||
make
|
||||
# Installs lb into /usr/local/bin
|
||||
cp /usr/obj/usr/src/`uname -m`.`uname -m`/tools/tools/netmap/lb /usr/local/bin/
|
||||
|
||||
|
||||
To load-balance packets arriving on em0 into 4 different netmap pipes named
|
||||
``zeek}0`` through ``zeek}3``, run ``lb`` as follows::
|
||||
|
||||
lb -i em0 -p zeek:4
|
||||
410.154166 main [634] interface is em0
|
||||
411.377220 main [741] successfully opened netmap:em0
|
||||
411.377243 main [812] opening pipe named netmap:zeek{0/xT@1
|
||||
411.379200 main [829] successfully opened pipe #1 netmap:zeek{0/xT@1 (tx slots: 1024)
|
||||
411.379242 main [838] zerocopy enabled
|
||||
...
|
||||
|
||||
Now, Zeek workers can attach to these four netmap pipes. When starting Zeek
|
||||
workers manually, the respective invocations would be as follows. The ``/x``
|
||||
suffix specifies exclusive mode to prevent two Zeek processes consuming packets
|
||||
from the same netmap pipe::
|
||||
|
||||
zeek -i netmap:zeek}0/x
|
||||
zeek -i netmap:zeek}1/x
|
||||
zeek -i netmap:zeek}2/x
|
||||
zeek -i netmap:zeek}3/x
|
||||
|
||||
For packet-level debugging, you can attach ``tcpdump`` to any of the netmap
|
||||
pipes in read monitor mode even while Zeek workers are consuming from them::
|
||||
|
||||
tcpdump -i netmap:zeek}1/r
|
||||
|
||||
In case libpcap's netmap support is insufficient, the external
|
||||
`Zeek netmap plugin <https://github.com/zeek/zeek-netmap>`_ can be installed.
|
||||
|
||||
.. warning::
|
||||
|
||||
When using the zeek-netmap plugin on FreeBSD, the interface specification given to Zeek
|
||||
needs to change from ``netmap:zeek}0/x`` to ``netmap::zeek}0/x`` - a single colon more.
|
||||
In the first case, Zeek uses the default libpcap packet source and passes ``netmap:zeek}0``
|
||||
as interface name. In the second case, ``netmap::`` is interpreted by Zeek and
|
||||
the netmap packet source is instantiated. The ``zeek}0/x`` part is used as
|
||||
interface name.
|
||||
|
||||
Linux
|
||||
"""""
|
||||
|
||||
While netmap isn't included in the Linux kernel, it can be installed as
|
||||
an out-of-tree kernel module.
|
||||
See the project's `GitHub repository <https://github.com/luigirizzo/netmap>`_
|
||||
for detailed instructions. This includes the ``lb`` tool for load balancing.
|
||||
|
||||
On Linux, the external `zeek-netmap <https://github.com/zeek/zeek-netmap>`_
|
||||
packet source plugin is required, or the system's libpcap library as used by
|
||||
Zeek needs to be recompiled with native netmap support. With the netmap kernel
|
||||
module loaded and the Zeek plugin installed, running a Zeek worker as follows
|
||||
will leverage netmap on Linux::
|
||||
|
||||
zeek -i netmap::eth1
|
||||
|
||||
For using ``lb`` or libpcap with netmap support, refer to the commands shown
|
||||
in the FreeBSD section - these are essentially the same.
|
||||
|
||||
|
||||
.. _cluster-configuration:
|
||||
|
||||
Cluster Configuration
|
||||
=====================
|
||||
|
||||
A *Zeek Cluster* is a set of systems jointly analyzing the traffic of
|
||||
a network link in a coordinated fashion. You can operate such a setup from
|
||||
a central manager system easily using ZeekControl because it
|
||||
hides much of the complexity of the multi-machine installation.
|
||||
|
||||
This section gives examples of how to setup common cluster configurations
|
||||
using ZeekControl. For a full reference on ZeekControl, see the
|
||||
`ZeekControl documentation`_.
|
||||
|
||||
Preparing to Setup a Cluster
|
||||
----------------------------
|
||||
|
||||
We refer to the user account used to set up the cluster
|
||||
as the "Zeek user". When setting up a cluster the Zeek user must be set up
|
||||
on all hosts, and this user must have ssh access from the manager to all
|
||||
machines in the cluster, and it must work without being prompted for a
|
||||
password/passphrase (for example, using ssh public key authentication).
|
||||
Also, on the worker nodes this user must have access to the target
|
||||
network interface in promiscuous mode.
|
||||
|
||||
Additional storage must be available on all hosts under the same path,
|
||||
which we will call the cluster's prefix path. We refer to this directory
|
||||
as ``<prefix>``. If you build Zeek from source, then ``<prefix>`` is
|
||||
the directory specified with the ``--prefix`` configure option,
|
||||
or ``/usr/local/zeek`` by default. The Zeek user must be able to either
|
||||
create this directory or, where it already exists, must have write
|
||||
permission inside this directory on all hosts.
|
||||
|
||||
When trying to decide how to configure the Zeek nodes, keep in mind that
|
||||
there can be multiple Zeek instances running on the same host. For example,
|
||||
it's possible to run a proxy and the manager on the same host. However, it is
|
||||
recommended to run workers on a different machine than the manager because
|
||||
workers can consume a lot of CPU resources. The maximum recommended
|
||||
number of workers to run on a machine should be one or two less than
|
||||
the number of CPU cores available on that machine. Using a load-balancing
|
||||
method (such as PF_RING) along with CPU pinning can decrease the load on
|
||||
the worker machines. Also, in order to reduce the load on the manager
|
||||
process, it is recommended to have a logger in your configuration. If a
|
||||
logger is defined in your cluster configuration, then it will receive logs
|
||||
instead of the manager process.
|
||||
|
||||
Basic Cluster Configuration
|
||||
---------------------------
|
||||
|
||||
With all prerequisites in place, perform the following steps to setup
|
||||
a Zeek cluster (do this as the Zeek user on the manager host only):
|
||||
|
||||
- Edit the ZeekControl configuration file, ``<prefix>/etc/zeekctl.cfg``,
|
||||
and change the value of any options to be more suitable for
|
||||
your environment. You will most likely want to change the value of
|
||||
the ``MailTo`` and ``LogRotationInterval`` options. A complete
|
||||
reference of all ZeekControl options can be found in the
|
||||
`ZeekControl documentation`_.
|
||||
|
||||
- Edit the ZeekControl node configuration file, ``<prefix>/etc/node.cfg``
|
||||
to define where logger, manager, proxies, and workers are to run. For a
|
||||
cluster configuration, you must comment-out (or remove) the standalone node
|
||||
in that file, and either uncomment or add node entries for each node
|
||||
in your cluster (logger, manager, proxy, and workers). For example, if you
|
||||
wanted to run five Zeek nodes (two workers, one proxy, a logger, and a
|
||||
manager) on a cluster consisting of three machines, your cluster
|
||||
configuration would look like this::
|
||||
|
||||
[logger]
|
||||
type=logger
|
||||
host=10.0.0.10
|
||||
|
||||
[manager]
|
||||
type=manager
|
||||
host=10.0.0.10
|
||||
|
||||
[proxy-1]
|
||||
type=proxy
|
||||
host=10.0.0.10
|
||||
|
||||
[worker-1]
|
||||
type=worker
|
||||
host=10.0.0.11
|
||||
interface=eth0
|
||||
|
||||
[worker-2]
|
||||
type=worker
|
||||
host=10.0.0.12
|
||||
interface=eth0
|
||||
|
||||
For a complete reference of all options that are allowed in the ``node.cfg``
|
||||
file, see the `ZeekControl documentation`_.
|
||||
|
||||
- Edit the network configuration file ``<prefix>/etc/networks.cfg``. This
|
||||
file lists all of the networks which the cluster should consider as local
|
||||
to the monitored environment.
|
||||
|
||||
- Install Zeek on all machines in the cluster using ZeekControl::
|
||||
|
||||
> zeekctl install
|
||||
|
||||
- See the `ZeekControl documentation`_
|
||||
for information on setting up a cron job on the manager host that can
|
||||
monitor the cluster.
|
||||
|
||||
AF_PACKET Cluster Configuration
|
||||
-------------------------------
|
||||
|
||||
Since version 5.2, Zeek includes AF_PACKET as a native packet source. This
|
||||
provides an easy and efficient capture mechanism for Linux users.
|
||||
|
||||
Adapt the worker section in ZeekControl's ``node.cfg`` file with the
|
||||
following entries, assuming four worker processes listening on ``eth0``::
|
||||
|
||||
[worker-1]
|
||||
type=worker
|
||||
host=10.0.0.11
|
||||
interface=eth0
|
||||
lb_method=af_packet
|
||||
lb_procs=4
|
||||
|
||||
The specific options are ``lb_method=af_packet`` and ``lb_procs=4``.
|
||||
If listening on two or more interfaces on the same host is a requirement,
|
||||
remember to set a unique ``fanout_id`` using the node option ``af_packet_fanout_id``::
|
||||
|
||||
[worker-1-eth0]
|
||||
type=worker
|
||||
host=10.0.0.11
|
||||
interface=eth0
|
||||
lb_method=af_packet
|
||||
lb_procs=4
|
||||
af_packet_fanout_id=20
|
||||
|
||||
[worker-1-eth1]
|
||||
type=worker
|
||||
host=10.0.0.11
|
||||
interface=eth1
|
||||
lb_method=af_packet
|
||||
lb_procs=4
|
||||
af_packet_fanout_id=21
|
||||
|
||||
Pinning the worker processes to individual CPU cores can improve performance.
|
||||
Use the node's option ``pin_cpus=4,5,6,7``, listing as many CPU numbers as
|
||||
processes at appropriate offsets.
|
||||
|
||||
.. _pf-ring-config:
|
||||
|
||||
PF_RING Cluster Configuration
|
||||
-----------------------------
|
||||
|
||||
`PF_RING <http://www.ntop.org/products/pf_ring/>`_ allows speeding up the
|
||||
packet capture process by installing a new type of socket in Linux systems.
|
||||
It supports 10Gbit hardware packet filtering using standard network adapters,
|
||||
and user-space DNA (Direct NIC Access) for fast packet capture/transmission.
|
||||
|
||||
.. note::
|
||||
|
||||
Unless you have evaluated to specifically require PF_RING, consider using
|
||||
AF_PACKET first and test if it fulfills your requirements. AF_PACKET has
|
||||
been integrated into Zeek since version 5.2. It's a bit easier to get
|
||||
started with as it does not require an out of tree Linux kernel module.
|
||||
|
||||
Head over to :ref:`cluster-pf-ring` for more details.
|
||||
|
||||
.. toctree::
|
||||
:hidden:
|
||||
|
||||
cluster/pf_ring
|
||||
|
||||
|
||||
.. [#] Some Linux kernel versions between 3.10 and 4.7 might exhibit
|
||||
a bug that prevents the required symmetric hashing. The script available
|
||||
in the GitHub project `can-i-use-afpacket-fanout <https://github.com/JustinAzoff/can-i-use-afpacket-fanout>`_
|
||||
can be used to verify whether ``PACKET_FANOUT`` works as expected.
|
||||
|
||||
This issue has been fixed in all stable kernels for at least 5 years.
|
||||
You're unlikely to be affected.
|
141
doc/cluster/pf_ring.rst
Normal file
141
doc/cluster/pf_ring.rst
Normal file
|
@ -0,0 +1,141 @@
|
|||
.. _cluster-pf-ring:
|
||||
|
||||
===================
|
||||
PF_RING Setup Guide
|
||||
===================
|
||||
|
||||
Installing PF_RING
|
||||
******************
|
||||
|
||||
1. Download and install PF_RING for your system following the instructions
|
||||
`here <http://www.ntop.org/get-started/download/#PF_RING>`_. The following
|
||||
commands will install the PF_RING libraries and kernel module (replace
|
||||
the version number 5.6.2 in this example with the version that you
|
||||
downloaded)::
|
||||
|
||||
cd /usr/src
|
||||
tar xvzf PF_RING-5.6.2.tar.gz
|
||||
cd PF_RING-5.6.2/userland/lib
|
||||
./configure --prefix=/opt/pfring
|
||||
make install
|
||||
|
||||
cd ../libpcap
|
||||
./configure --prefix=/opt/pfring
|
||||
make install
|
||||
|
||||
cd ../tcpdump-4.1.1
|
||||
./configure --prefix=/opt/pfring
|
||||
make install
|
||||
|
||||
cd ../../kernel
|
||||
make
|
||||
make install
|
||||
|
||||
modprobe pf_ring enable_tx_capture=0 min_num_slots=32768
|
||||
|
||||
Refer to the documentation for your Linux distribution on how to load the
|
||||
pf_ring module at boot time. You will need to install the PF_RING
|
||||
library files and kernel module on all of the workers in your cluster.
|
||||
|
||||
2. Download the Zeek source code.
|
||||
|
||||
3. Configure and install Zeek using the following commands::
|
||||
|
||||
./configure --with-pcap=/opt/pfring
|
||||
make
|
||||
make install
|
||||
|
||||
4. Make sure Zeek is correctly linked to the PF_RING libpcap libraries::
|
||||
|
||||
ldd /usr/local/zeek/bin/zeek | grep pcap
|
||||
libpcap.so.1 => /opt/pfring/lib/libpcap.so.1 (0x00007fa6d7d24000)
|
||||
|
||||
5. Configure ZeekControl to use PF_RING (explained below).
|
||||
|
||||
6. Run "zeekctl install" on the manager. This command will install Zeek and
|
||||
required scripts to all machines in your cluster.
|
||||
|
||||
Using PF_RING
|
||||
*************
|
||||
|
||||
In order to use PF_RING, you need to specify the correct configuration
|
||||
options for your worker nodes in ZeekControl's node configuration file.
|
||||
Edit the ``node.cfg`` file and specify ``lb_method=pf_ring`` for each of
|
||||
your worker nodes. Next, use the ``lb_procs`` node option to specify how
|
||||
many Zeek processes you'd like that worker node to run, and optionally pin
|
||||
those processes to certain CPU cores with the ``pin_cpus`` option (CPU
|
||||
numbering starts at zero). The correct ``pin_cpus`` setting to use is
|
||||
dependent on your CPU architecture (Intel and AMD systems enumerate
|
||||
processors in different ways). Using the wrong ``pin_cpus`` setting
|
||||
can cause poor performance. Here is what a worker node entry should
|
||||
look like when using PF_RING and CPU pinning::
|
||||
|
||||
[worker-1]
|
||||
type=worker
|
||||
host=10.0.0.50
|
||||
interface=eth0
|
||||
lb_method=pf_ring
|
||||
lb_procs=10
|
||||
pin_cpus=2,3,4,5,6,7,8,9,10,11
|
||||
|
||||
|
||||
Using PF_RING+DNA with symmetric RSS
|
||||
************************************
|
||||
|
||||
You must have a PF_RING+DNA license in order to do this. You can sniff
|
||||
each packet only once.
|
||||
|
||||
1. Load the DNA NIC driver (i.e. ixgbe) on each worker host.
|
||||
|
||||
2. Run "ethtool -L dna0 combined 10" (this will establish 10 RSS queues
|
||||
on your NIC) on each worker host. You must make sure that you set the
|
||||
number of RSS queues to the same as the number you specify for the
|
||||
lb_procs option in the node.cfg file.
|
||||
|
||||
3. On the manager, configure your worker(s) in node.cfg::
|
||||
|
||||
[worker-1]
|
||||
type=worker
|
||||
host=10.0.0.50
|
||||
interface=dna0
|
||||
lb_method=pf_ring
|
||||
lb_procs=10
|
||||
|
||||
|
||||
Using PF_RING+DNA with pfdnacluster_master
|
||||
******************************************
|
||||
|
||||
You must have a PF_RING+DNA license and a libzero license in order to do
|
||||
this. You can load balance between multiple applications and sniff the
|
||||
same packets multiple times with different tools.
|
||||
|
||||
1. Load the DNA NIC driver (i.e. ixgbe) on each worker host.
|
||||
|
||||
2. Run "ethtool -L dna0 1" (this will establish 1 RSS queue on your NIC)
|
||||
on each worker host.
|
||||
|
||||
3. Run the pfdnacluster_master command on each worker host. For example::
|
||||
|
||||
pfdnacluster_master -c 21 -i dna0 -n 10
|
||||
|
||||
Make sure that your cluster ID (21 in this example) matches the interface
|
||||
name you specify in the node.cfg file. Also make sure that the number
|
||||
of processes you're balancing across (10 in this example) matches
|
||||
the lb_procs option in the node.cfg file.
|
||||
|
||||
4. If you are load balancing to other processes, you can use the
|
||||
pfringfirstappinstance variable in zeekctl.cfg to set the first
|
||||
application instance that Zeek should use. For example, if you are running
|
||||
pfdnacluster_master with "-n 10,4" you would set
|
||||
pfringfirstappinstance=4. Unfortunately that's still a global setting
|
||||
in zeekctl.cfg at the moment but we may change that to something you can
|
||||
set in node.cfg eventually.
|
||||
|
||||
5. On the manager, configure your worker(s) in node.cfg::
|
||||
|
||||
[worker-1]
|
||||
type=worker
|
||||
host=10.0.0.50
|
||||
interface=dnacluster:21
|
||||
lb_method=pf_ring
|
||||
lb_procs=10
|
33
doc/components/index.rst
Normal file
33
doc/components/index.rst
Normal file
|
@ -0,0 +1,33 @@
|
|||
|
||||
=============
|
||||
Subcomponents
|
||||
=============
|
||||
|
||||
To find documentation for the various subcomponents of Zeek, see their
|
||||
respective GitHub repositories or documentation:
|
||||
|
||||
* `Spicy <https://docs.zeek.org/projects/spicy>`__
|
||||
- C++ parser generator for dissecting protocols & files.
|
||||
* `BinPAC <https://github.com/zeek/binpac>`__
|
||||
- A protocol parser generator
|
||||
* `ZeekControl <https://github.com/zeek/zeekctl>`__
|
||||
- Interactive Zeek management shell
|
||||
* `Zeek-Aux <https://github.com/zeek/zeek-aux>`__
|
||||
- Small auxiliary tools for Zeek
|
||||
* `BTest <https://github.com/zeek/btest>`__
|
||||
- A system testing framework
|
||||
* `Capstats <https://github.com/zeek/capstats>`__
|
||||
- Command-line packet statistic tool
|
||||
* `PySubnetTree <https://github.com/zeek/pysubnettree>`__
|
||||
- Python module for CIDR lookups
|
||||
* `trace-summary <https://github.com/zeek/trace-summary>`__
|
||||
- Script for generating break-downs of network traffic
|
||||
* `Broker <https://github.com/zeek/broker>`__
|
||||
- Zeek's Messaging Library
|
||||
- `(Docs) <https://docs.zeek.org/projects/broker>`__
|
||||
* `Package Manager <https://github.com/zeek/package-manager>`__
|
||||
- A package manager for Zeek
|
||||
- `(Docs) <https://docs.zeek.org/projects/package-manager>`__
|
||||
* `Paraglob <https://github.com/zeek/paraglob>`__
|
||||
- A pattern matching data structure for Zeek.
|
||||
- `(Docs) <https://github.com/zeek/paraglob/blob/master/README.md>`__
|
305
doc/conf.py
Normal file
305
doc/conf.py
Normal file
|
@ -0,0 +1,305 @@
|
|||
#
|
||||
# Zeek documentation build configuration file, created by sphinx-quickstart
|
||||
#
|
||||
# This file is execfile()d with the current directory set to its containing dir.
|
||||
#
|
||||
# Note that not all possible configuration values are present in this
|
||||
# autogenerated file.
|
||||
#
|
||||
# All configuration values have a default; values that are commented out
|
||||
# serve to show the default.
|
||||
|
||||
import os
|
||||
import sys
|
||||
|
||||
extensions = []
|
||||
|
||||
# If extensions (or modules to document with autodoc) are in another directory,
|
||||
# add these directories to sys.path here. If the directory is relative to the
|
||||
# documentation root, use os.path.abspath to make it absolute, like shown here.
|
||||
sys.path.insert(0, os.path.abspath("ext"))
|
||||
|
||||
# -- General configuration -----------------------------------------------------
|
||||
|
||||
# If your documentation needs a minimal Sphinx version, state it here.
|
||||
# needs_sphinx = '1.0'
|
||||
|
||||
# Add any Sphinx extension module names here, as strings. They can be extensions
|
||||
# coming with Sphinx (named 'sphinx.ext.*') or your custom ones.
|
||||
extensions += [
|
||||
"zeek",
|
||||
"sphinx.ext.todo",
|
||||
"zeek_pygments",
|
||||
"spicy-pygments",
|
||||
"literal-emph",
|
||||
"sphinx.ext.extlinks",
|
||||
]
|
||||
|
||||
# Add any paths that contain templates here, relative to this directory.
|
||||
templates_path = ["_templates"]
|
||||
|
||||
# The suffix of source filenames.
|
||||
source_suffix = ".rst"
|
||||
|
||||
# The encoding of source files.
|
||||
# source_encoding = 'utf-8-sig'
|
||||
|
||||
# The master toctree document.
|
||||
master_doc = "index"
|
||||
|
||||
# General information about the project.
|
||||
project = "Zeek"
|
||||
copyright = "by the Zeek Project"
|
||||
|
||||
# The version info for the project you're documenting, acts as replacement for
|
||||
# |version| and |release|, also used in various other places throughout the
|
||||
# built documents.
|
||||
#
|
||||
# The short X.Y version.
|
||||
#
|
||||
|
||||
version = "source"
|
||||
|
||||
try:
|
||||
# Use the actual Zeek version if available
|
||||
with open("../VERSION") as f:
|
||||
version = f.readline().strip()
|
||||
except:
|
||||
try:
|
||||
import re
|
||||
|
||||
import git
|
||||
|
||||
repo = git.Repo(os.path.abspath("."))
|
||||
version = "git/master"
|
||||
|
||||
version_tag_re = r"v\d+\.\d+(\.\d+)?"
|
||||
version_tags = [
|
||||
t
|
||||
for t in repo.tags
|
||||
if t.commit == repo.head.commit and re.match(version_tag_re, str(t))
|
||||
]
|
||||
# Note: sorting by tag date doesn't necessarily give correct
|
||||
# order in terms of version numbers, but doubtful that will ever be
|
||||
# a problem (if we ever do re-tag an old version number on a given
|
||||
# commit such that it is incorrectly found as the most recent version,
|
||||
# we can just re-tag all the other version numbers on that same commit)
|
||||
version_tags = sorted(version_tags, key=lambda t: t.tag.tagged_date)
|
||||
|
||||
if version_tags:
|
||||
version = str(version_tags[-1])
|
||||
|
||||
except:
|
||||
pass
|
||||
|
||||
# The full version, including alpha/beta/rc tags.
|
||||
release = version
|
||||
|
||||
# In terms of the actual hyperlink URL, a more ideal/stable way to reference
|
||||
# source code on GitHub would be by commit hash, but that can be tricky to
|
||||
# update in a way that produces stable Sphinx/reST configuration: don't want
|
||||
# to update the commit-hash for every Zeek commit unless it actually produces
|
||||
# new content, and also don't want to accidentally make it easy for people to
|
||||
# insert unreachable commits when manually running
|
||||
# `zeek/ci/update-zeekygen-docs.sh`.
|
||||
#
|
||||
# We only have a few versions of docs that actually matter: `master` and
|
||||
# `release/.*`, and the tip of those branches will always be in sync with
|
||||
# auto-generated content by simply having `zeek/ci/update-zeekygen-docs.sh`
|
||||
# change this to `release/.*` when needed.
|
||||
zeek_code_version = "master"
|
||||
zeek_code_url = f"https://github.com/zeek/zeek/blob/{zeek_code_version}"
|
||||
|
||||
# The language for content autogenerated by Sphinx. Refer to documentation
|
||||
# for a list of supported languages.
|
||||
# language = None
|
||||
|
||||
# There are two options for replacing |today|: either, you set today to some
|
||||
# non-false value, then it is used:
|
||||
# today = ''
|
||||
# Else, today_fmt is used as the format for a strftime call.
|
||||
today_fmt = "%B %d, %Y"
|
||||
|
||||
# List of patterns, relative to source directory, that match files and
|
||||
# directories to ignore when looking for source files.
|
||||
exclude_patterns = [".#*", "script-reference/autogenerated-*"]
|
||||
|
||||
# The reST default role (used for this markup: `text`) to use for all documents.
|
||||
# default_role = None
|
||||
|
||||
# If true, '()' will be appended to :func: etc. cross-reference text.
|
||||
# add_function_parentheses = True
|
||||
|
||||
# If true, the current module name will be prepended to all description
|
||||
# unit titles (such as .. function::).
|
||||
# add_module_names = True
|
||||
|
||||
# If true, sectionauthor and moduleauthor directives will be shown in the
|
||||
# output. They are ignored by default.
|
||||
show_authors = True
|
||||
|
||||
# The name of the Pygments (syntax highlighting) style to use.
|
||||
pygments_style = "sphinx"
|
||||
|
||||
highlight_language = "none"
|
||||
|
||||
# A list of ignored prefixes for module index sorting.
|
||||
# modindex_common_prefix = []
|
||||
|
||||
|
||||
# -- Options for HTML output ---------------------------------------------------
|
||||
|
||||
html_theme = "sphinx_rtd_theme"
|
||||
|
||||
# Set canonical URL from the Read the Docs Domain
|
||||
html_baseurl = os.environ.get("READTHEDOCS_CANONICAL_URL", "")
|
||||
|
||||
# Tell Jinja2 templates the build is running on Read the Docs
|
||||
if os.environ.get("READTHEDOCS", "") == "True":
|
||||
if "html_context" not in globals():
|
||||
html_context = {}
|
||||
html_context["READTHEDOCS"] = True
|
||||
|
||||
html_last_updated_fmt = "%B %d, %Y"
|
||||
|
||||
# Theme options are theme-specific and customize the look and feel of a theme
|
||||
# further. For a list of options available for each theme, see the
|
||||
# documentation.
|
||||
html_theme_options = {
|
||||
"analytics_id": "UA-144186885-1",
|
||||
"collapse_navigation": False,
|
||||
"style_external_links": True,
|
||||
}
|
||||
|
||||
# Add any paths that contain custom themes here, relative to this directory.
|
||||
# html_theme_path = []
|
||||
|
||||
# The name for this set of Sphinx documents. If None, it defaults to
|
||||
# "<project> v<release> Documentation".
|
||||
html_title = f"Book of Zeek ({release})"
|
||||
|
||||
# A shorter title for the navigation bar. Default is the same as html_title.
|
||||
# html_short_title = None
|
||||
|
||||
# The name of an image file (relative to this directory) to place at the top
|
||||
# of the sidebar.
|
||||
html_logo = "images/zeek-logo-sidebar.png"
|
||||
|
||||
# The name of an image file (within the static path) to use as favicon of the
|
||||
# docs. This file should be a Windows icon file (.ico) being 16x16 or 32x32
|
||||
# pixels large.
|
||||
html_favicon = "images/zeek-favicon.ico"
|
||||
|
||||
# Add any paths that contain custom static files (such as style sheets) here,
|
||||
# relative to this directory. They are copied after the builtin static files,
|
||||
# so a file named "default.css" will overwrite the builtin "default.css".
|
||||
html_static_path = ["_static"]
|
||||
|
||||
|
||||
def setup(app):
|
||||
app.add_css_file("theme_overrides.css")
|
||||
from sphinx.highlighting import lexers
|
||||
from zeek_pygments import ZeekLexer
|
||||
|
||||
lexers["zeek"] = ZeekLexer()
|
||||
app.add_config_value("zeek-code-url", zeek_code_url, "env")
|
||||
|
||||
|
||||
# If not '', a 'Last updated on:' timestamp is inserted at every page bottom,
|
||||
# using the given strftime format.
|
||||
# html_last_updated_fmt = '%b %d, %Y'
|
||||
|
||||
# If true, SmartyPants will be used to convert quotes and dashes to
|
||||
# typographically correct entities.
|
||||
# html_use_smartypants = True
|
||||
|
||||
# Custom sidebar templates, maps document names to template names.
|
||||
# html_sidebars = {
|
||||
#'**': ['localtoc.html', 'sourcelink.html', 'searchbox.html'],
|
||||
# }
|
||||
|
||||
# Additional templates that should be rendered to pages, maps page names to
|
||||
# template names.
|
||||
# html_additional_pages = {}
|
||||
|
||||
# If false, no module index is generated.
|
||||
# html_domain_indices = True
|
||||
|
||||
# If false, no index is generated.
|
||||
# html_use_index = True
|
||||
|
||||
# If true, the index is split into individual pages for each letter.
|
||||
# html_split_index = False
|
||||
|
||||
# If true, links to the reST sources are added to the pages.
|
||||
# html_show_sourcelink = True
|
||||
|
||||
# If true, "Created using Sphinx" is shown in the HTML footer. Default is True.
|
||||
# html_show_sphinx = True
|
||||
|
||||
# If true, "(C) Copyright ..." is shown in the HTML footer. Default is True.
|
||||
# html_show_copyright = True
|
||||
|
||||
# If true, an OpenSearch description file will be output, and all pages will
|
||||
# contain a <link> tag referring to it. The value of this option must be the
|
||||
# base URL from which the finished HTML is served.
|
||||
# html_use_opensearch = ''
|
||||
|
||||
# This is the file name suffix for HTML files (e.g. ".xhtml").
|
||||
# html_file_suffix = None
|
||||
|
||||
# Output file base name for HTML help builder.
|
||||
htmlhelp_basename = "zeek-docs"
|
||||
|
||||
# -- Options for LaTeX output --------------------------------------------------
|
||||
|
||||
# The paper size ('letter' or 'a4').
|
||||
# latex_paper_size = 'letter'
|
||||
|
||||
# The font size ('10pt', '11pt' or '12pt').
|
||||
# latex_font_size = '10pt'
|
||||
|
||||
# Grouping the document tree into LaTeX files. List of tuples
|
||||
# (source start file, target name, title, author, documentclass [howto/manual]).
|
||||
latex_documents = [
|
||||
("index", "Zeek.tex", "Zeek Documentation", "The Zeek Project", "manual"),
|
||||
]
|
||||
|
||||
# The name of an image file (relative to this directory) to place at the top of
|
||||
# the title page.
|
||||
# latex_logo = None
|
||||
|
||||
# For "manual" documents, if this is true, then toplevel headings are parts,
|
||||
# not chapters.
|
||||
# latex_use_parts = False
|
||||
|
||||
# If true, show page references after internal links.
|
||||
# latex_show_pagerefs = False
|
||||
|
||||
# If true, show URL addresses after external links.
|
||||
# latex_show_urls = False
|
||||
|
||||
# Additional stuff for the LaTeX preamble.
|
||||
# latex_preamble = ''
|
||||
|
||||
# Documents to append as an appendix to all manuals.
|
||||
# latex_appendices = []
|
||||
|
||||
# If false, no module index is generated.
|
||||
# latex_domain_indices = True
|
||||
|
||||
# -- Options for manual page output --------------------------------------------
|
||||
|
||||
# One entry per manual page. List of tuples
|
||||
# (source start file, name, description, authors, manual section).
|
||||
man_pages = [("index", "zeek", "Zeek Documentation", ["The Zeek Project"], 1)]
|
||||
|
||||
# -- Options for todo plugin --------------------------------------------
|
||||
todo_include_todos = True
|
||||
|
||||
extlinks = {
|
||||
"slacklink": ("https://zeek.org/slack%s", None),
|
||||
"discourselink": ("https://community.zeek.org/%s", None),
|
||||
"spicylink": ("https://docs.zeek.org/projects/spicy/en/latest/%s", None),
|
||||
}
|
||||
extlinks_detect_hardcoded_links = True
|
318
doc/customizations.rst
Normal file
318
doc/customizations.rst
Normal file
|
@ -0,0 +1,318 @@
|
|||
.. _popular-customizations:
|
||||
|
||||
======================
|
||||
Popular Customizations
|
||||
======================
|
||||
|
||||
This page outlines customizations and additions that are popular
|
||||
among Zeek users.
|
||||
|
||||
.. note::
|
||||
|
||||
This page lists externally-maintained Zeek packages. The Zeek team does not
|
||||
provide support or maintenance for these packages. If you find bugs or have
|
||||
feature requests, please reach out to the respective package maintainers directly.
|
||||
|
||||
You may also post in the :slacklink:`Zeek Slack <>` #packages
|
||||
channel or :discourselink:`forum <>` to get help from the broader
|
||||
Zeek community.
|
||||
|
||||
|
||||
Log Enrichment
|
||||
==============
|
||||
|
||||
Community ID
|
||||
------------
|
||||
|
||||
.. versionadded:: 6.0
|
||||
|
||||
Zeek includes native `Community ID Flow Hashing`_ support. This functionality
|
||||
has previously been provided through the `zeek-community-id`_ package.
|
||||
|
||||
.. note::
|
||||
|
||||
At this point, the external `zeek-community-id`_ package is still
|
||||
available to support Zeek deployments running older versions. However,
|
||||
the scripts provided by the package cause conflicts with those provided in
|
||||
Zeek 6.0 - do not load both.
|
||||
|
||||
Loading the
|
||||
:doc:`/scripts/policy/protocols/conn/community-id-logging.zeek`
|
||||
and
|
||||
:doc:`/scripts/policy/frameworks/notice/community-id.zeek`
|
||||
scripts adds an additional ``community_id`` field to the
|
||||
:zeek:see:`Conn::Info` and :zeek:see:`Notice::Info` record.
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
$ zeek -r ./traces/get.trace protocols/conn/community-id-logging LogAscii::use_json=T
|
||||
$ jq < conn.log
|
||||
{
|
||||
"ts": 1362692526.869344,
|
||||
"uid": "CoqLmg1Ds5TE61szq1",
|
||||
"id.orig_h": "141.142.228.5",
|
||||
"id.orig_p": 59856,
|
||||
"id.resp_h": "192.150.187.43",
|
||||
"id.resp_p": 80,
|
||||
"proto": "tcp",
|
||||
...
|
||||
"community_id": "1:yvyB8h+3dnggTZW0UEITWCst97w="
|
||||
}
|
||||
|
||||
|
||||
The Community ID Flow Hash of a :zeek:see:`conn_id` instance can be computed
|
||||
with the :zeek:see:`community_id_v1` builtin function directly on the command-line
|
||||
or used in custom scripts.
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
$ zeek -e 'print community_id_v1([$orig_h=141.142.228.5, $orig_p=59856/tcp, $resp_h=192.150.187.43, $resp_p=80/tcp])'
|
||||
1:yvyB8h+3dnggTZW0UEITWCst97w=
|
||||
|
||||
.. _Community ID Flow Hashing: https://github.com/corelight/community-id-spec
|
||||
.. _zeek-community-id: https://github.com/corelight/zeek-community-id/
|
||||
|
||||
.. _geolocation:
|
||||
|
||||
Address geolocation and AS lookups
|
||||
----------------------------------
|
||||
|
||||
.. _libmaxminddb: https://github.com/maxmind/libmaxminddb
|
||||
|
||||
Zeek supports IP address geolocation as well as AS (autonomous system)
|
||||
lookups. This requires two things:
|
||||
|
||||
* Compilation of Zeek with the `libmaxminddb`_ library and development
|
||||
headers. If you're using our :ref:`Docker images <docker-images>` or
|
||||
:ref:`binary packages <binary-packages>`, there's nothing to do: they ship
|
||||
with GeoIP support.
|
||||
* Installation of corresponding MaxMind database files on your
|
||||
system.
|
||||
|
||||
To check whether your Zeek supports geolocation, run ``zeek-config --have-geoip``
|
||||
(available since Zeek 6.2) or simply try an address lookup. The following
|
||||
indicates that your Zeek lacks support:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
$ zeek -e 'lookup_location(1.2.3.4)'
|
||||
error in <command line>, line 1: Zeek was not configured for GeoIP support (lookup_location(1.2.3.4))
|
||||
|
||||
Read on for more details about building Zeek with GeoIP support, and how to
|
||||
configure access to the database files.
|
||||
|
||||
Building Zeek with libmaxminddb
|
||||
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
If you build Zeek yourself, you need to install libmaxminddb prior to
|
||||
configuring your build.
|
||||
|
||||
* RPM/RedHat-based Linux:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo yum install libmaxminddb-devel
|
||||
|
||||
* DEB/Debian-based Linux:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo apt-get install libmaxminddb-dev
|
||||
|
||||
* FreeBSD:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
sudo pkg install libmaxminddb
|
||||
|
||||
* Mac OS X:
|
||||
|
||||
You need to install from your preferred package management system
|
||||
(e.g. Homebrew, MacPorts, or Fink). For Homebrew, the name of the package
|
||||
that you need is libmaxminddb.
|
||||
|
||||
The ``configure`` script's output indicates whether it successfully located
|
||||
libmaxminddb. If your system's MaxMind library resides in a non-standard path,
|
||||
you may need to specify it via ``./configure --with-geoip=<path>``.
|
||||
|
||||
Installing and configuring GeoIP databases
|
||||
^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
MaxMind's databases ship as individual files that you can `download
|
||||
<https://www.maxmind.com/en/accounts/current/geoip/downloads>`_ from their
|
||||
website after `signing up <https://www.maxmind.com/en/geolite2/signup>`_ for an
|
||||
account. Some Linux distributions also offer free databases in their package
|
||||
managers.
|
||||
|
||||
There are three types of databases: city-level geolocation, country-level
|
||||
geolocation, and mapping of IP addresses to autonomous systems (AS number and
|
||||
organization). Download these and decide on a place to put them on your
|
||||
file system. If you use automated tooling or system packages for the
|
||||
installation, that path may be chosen for you, such as ``/usr/share/GeoIP``.
|
||||
|
||||
Zeek provides three ways to configure access to the databases:
|
||||
|
||||
* Specifying the path and filenames via script variables. Use the
|
||||
:zeek:see:`mmdb_dir` variable, unset by default, to point to the directory
|
||||
containing the database(s). By default Zeek looks for databases called
|
||||
``GeoLite2-City.mmdb``, ``GeoLite2-Country.mmdb``, and
|
||||
``GeoLite2-ASN.mmdb``. Starting with Zeek 6.2 you can adjust these names by
|
||||
redefining the :zeek:see:`mmdb_city_db`, :zeek:see:`mmdb_country_db`, and
|
||||
:zeek:see:`mmdb_asn_db` variables.
|
||||
* Relying on Zeek's pre-configured search paths and filenames. The
|
||||
:zeek:see:`mmdb_dir_fallbacks` variable contains default
|
||||
search paths that Zeek will try in turn when :zeek:see:`mmdb_dir` is not
|
||||
set. Prior to Zeek 6.2 these paths were hardcoded; they're now redefinable.
|
||||
For geolocation, Zeek first attempts the city-level databases due to their
|
||||
greater precision, and falls back to the country-level one. You can adjust the
|
||||
database filenames via :zeek:see:`mmdb_city_db` and related variables, as
|
||||
covered above.
|
||||
* Opening databases explicitly via scripting. The
|
||||
:zeek:see:`mmdb_open_location_db` and :zeek:see:`mmdb_open_asn_db`
|
||||
functions take full paths to database files. Zeek only ever uses one
|
||||
geolocation and one ASN database, and these loads override any databases
|
||||
previously loaded. These loads can occur at any point.
|
||||
|
||||
Querying the databases
|
||||
^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
Two built-in functions provide GeoIP functionality:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
function lookup_location(a:addr): geo_location
|
||||
function lookup_autonomous_system(a:addr): geo_autonomous_system
|
||||
|
||||
:zeek:see:`lookup_location` returns a :zeek:see:`geo_location` record with
|
||||
country/region/etc fields, while :zeek:see:`lookup_autonomous_system` returns a
|
||||
:zeek:see:`geo_autonomous_system` record indicating the AS number and
|
||||
organization. Depending on the queried IP address some fields may be
|
||||
uninitialized, so you should guard access with an ``a?$b`` :ref:`existence test
|
||||
<record-field-operators>`.
|
||||
|
||||
Zeek tests the database files for staleness. If it detects that a database has
|
||||
been updated, it will automatically reload it. Zeek does not automatically add
|
||||
GeoIP intelligence to its logs, but several add-on scripts and packages provide
|
||||
such functionality. These include:
|
||||
|
||||
* The :ref:`notice framework <notice-framework>` lets you configure notice types
|
||||
that you'd like to augment with location information. See
|
||||
:zeek:see:`Notice::lookup_location_types` and
|
||||
:zeek:see:`Notice::ACTION_ADD_GEODATA` for details.
|
||||
* The :doc:`/scripts/policy/protocols/smtp/detect-suspicious-orig.zeek` and
|
||||
:doc:`/scripts/policy/protocols/ssh/geo-data.zeek` policy scripts.
|
||||
* Several `Zeek packages <https://packages.zeek.org>`_.
|
||||
|
||||
Testing
|
||||
^^^^^^^
|
||||
|
||||
Before using the GeoIP functionality it is a good idea to verify that
|
||||
everything is setup correctly. You can quickly check if the GeoIP
|
||||
functionality works by running commands like these:
|
||||
|
||||
.. code-block:: console
|
||||
|
||||
zeek -e "print lookup_location(8.8.8.8);"
|
||||
|
||||
If you see an error message similar to "Failed to open GeoIP location database",
|
||||
then your database configuration is broken. You may need to rename or move your
|
||||
GeoIP database files.
|
||||
|
||||
Example
|
||||
^^^^^^^
|
||||
|
||||
The following shows every FTP connection from hosts in Ohio, US:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event ftp_reply(c: connection, code: count, msg: string, cont_resp: bool)
|
||||
{
|
||||
local client = c$id$orig_h;
|
||||
local loc = lookup_location(client);
|
||||
|
||||
if (loc?$region && loc$region == "OH" && loc?$country_code && loc$country_code == "US")
|
||||
{
|
||||
local city = loc?$city ? loc$city : "<unknown>";
|
||||
|
||||
print fmt("FTP Connection from:%s (%s,%s,%s)", client, city,
|
||||
loc$region, loc$country_code);
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
Log Writers
|
||||
===========
|
||||
|
||||
Kafka
|
||||
-----
|
||||
|
||||
For exporting logs to `Apache Kafka`_ in a streaming fashion, the externally-maintained
|
||||
`zeek-kafka`_ package is a popular choice and easy to configure. It relies on `librdkafka`_.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
redef Log::default_writer = Log::WRITER_KAFKAWRITER;
|
||||
|
||||
redef Kafka::kafka_conf += {
|
||||
["metadata.broker.list"] = "192.168.0.1:9092"
|
||||
};
|
||||
|
||||
.. _Apache Kafka: https://kafka.apache.org/
|
||||
.. _zeek-kafka: https://github.com/SeisoLLC/zeek-kafka/
|
||||
.. _librdkafka: https://github.com/confluentinc/librdkafka
|
||||
|
||||
|
||||
Logging
|
||||
=======
|
||||
|
||||
JSON Streaming Logs
|
||||
-------------------
|
||||
|
||||
The externally-maintained `json-streaming-logs`_ package tailors Zeek
|
||||
for use with log shippers like `Filebeat`_ or `fluentd`_. It configures
|
||||
additional log files prefixed with ``json_streaming_``, adds ``_path``
|
||||
and ``_write_ts`` fields to log records and configures log rotation
|
||||
appropriately.
|
||||
|
||||
If you do not use a logging archive and want to stream all logs away
|
||||
from the system where Zeek is running without leveraging Kafka, this
|
||||
package helps you with that.
|
||||
|
||||
.. _json-streaming-logs: https://github.com/corelight/json-streaming-logs
|
||||
.. _Filebeat: https://www.elastic.co/beats/filebeat
|
||||
.. _fluentd: https://www.fluentd.org/
|
||||
|
||||
|
||||
Long Connections
|
||||
----------------
|
||||
|
||||
Zeek logs connection entries into the :file:`conn.log` only upon termination
|
||||
or due to expiration of inactivity timeouts. Depending on the protocol and
|
||||
chosen timeout values this can significantly delay the appearance of a log
|
||||
entry for a given connection. The delay may be up to an hour for lingering
|
||||
SSH connections or connections where the final FIN or RST packets were missed.
|
||||
|
||||
The `zeek-long-connections`_ package alleviates this by creating a :file:`conn_long.log`
|
||||
log with the same format as :file:`conn.log`, but containing entries for connections
|
||||
that have been existing for configurable intervals.
|
||||
By default, the first entry for a connection is logged after 10mins. Depending on
|
||||
the environment, this can be lowered as even a 10 minute delay may be significant
|
||||
for detection purposes in streaming setups.
|
||||
|
||||
.. _zeek-long-connections: https://github.com/corelight/zeek-long-connections
|
||||
|
||||
|
||||
Profiling and Debugging
|
||||
=======================
|
||||
|
||||
jemalloc profiling
|
||||
------------------
|
||||
|
||||
For investigation of memory leaks or state-growth issues within Zeek,
|
||||
jemalloc's profiling is invaluable. A package providing a bit of support
|
||||
for configuring jemalloc's profiling facilities is `zeek-jemalloc-profiling`_.
|
||||
|
||||
Some general information about memory profiling exists in the :ref:`Troubleshooting <troubleshooting>`
|
||||
section.
|
||||
|
||||
.. _zeek-jemalloc-profiling: https://github.com/JustinAzoff/zeek-jemalloc-profiling
|
120
doc/devel/cluster-backend-zeromq.rst
Normal file
120
doc/devel/cluster-backend-zeromq.rst
Normal file
|
@ -0,0 +1,120 @@
|
|||
.. _cluster_backend_zeromq:
|
||||
|
||||
======================
|
||||
ZeroMQ Cluster Backend
|
||||
======================
|
||||
|
||||
.. versionadded:: 7.1
|
||||
|
||||
*Experimental*
|
||||
|
||||
Quickstart
|
||||
==========
|
||||
|
||||
To switch a Zeek cluster with a static cluster layout over to use ZeroMQ
|
||||
as cluster backend, add the following snippet to ``local.zeek``:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
@load frameworks/cluster/backend/zeromq/connect
|
||||
|
||||
|
||||
Note that the function :zeek:see:`Broker::publish` will be non-functional
|
||||
and a warning emitted when used - use :zeek:see:`Cluster::publish` instead.
|
||||
|
||||
By default, a configuration based on hard-coded endpoints and cluster layout
|
||||
information is created. For more customization, refer to the module documentation
|
||||
at :doc:`cluster/backend/zeromq/main.zeek </scripts/policy/frameworks/cluster/backend/zeromq/main.zeek>`.
|
||||
|
||||
|
||||
Architecture
|
||||
============
|
||||
|
||||
Publish-Subscribe of Zeek Events
|
||||
--------------------------------
|
||||
|
||||
The `ZeroMQ <https://zeromq.org/>`_ based cluster backend uses a central
|
||||
XPUB/XSUB broker for publish-subscribe functionality. Zeek events published
|
||||
via :zeek:see:`Cluster::publish` are distributed by this central broker to
|
||||
interested nodes.
|
||||
|
||||
.. figure:: /images/cluster/zeromq-pubsub.png
|
||||
|
||||
|
||||
As depicted in the figure above, each cluster node connects to the central
|
||||
broker twice, once via its XPUB socket and once via its XSUB socket. This
|
||||
results in two TCP connections from every cluster node to the central broker.
|
||||
This setup allows every node in the cluster to see messages from all other
|
||||
nodes, avoiding the need for cluster topology awareness.
|
||||
|
||||
.. note::
|
||||
|
||||
Scalability of the central broker may be a concern in large production setups,
|
||||
but for small clusters on a single node it may well be fast enough.
|
||||
|
||||
On a cluster node, the XPUB socket provides notifications about subscriptions
|
||||
created by other nodes: For every subscription created by any node in
|
||||
the cluster, the :zeek:see:`Cluster::Backend::ZeroMQ::subscription` event is
|
||||
raised locally on every other node (unless another node had created the same
|
||||
subscription previously).
|
||||
|
||||
This mechanism is used to discover the existence of other cluster nodes by
|
||||
matching the topics with the prefix for node specific subscriptions as produced
|
||||
by :zeek:see:`Cluster::nodeid_topic`.
|
||||
|
||||
As of now, the implementation of the central broker calls ZeroMQ's
|
||||
``zmq::proxy()`` function to forward messages between the XPUB and
|
||||
XSUB socket.
|
||||
|
||||
While the diagram above indicates the central broker being deployed separately
|
||||
from Zeek cluster nodes, by default the manager node will start and run this
|
||||
broker using a separate thread. There's nothing that would prevent running
|
||||
a long running central broker independently from the Zeek cluster nodes, however.
|
||||
|
||||
The serialization of Zeek events is done by the selected
|
||||
:zeek:see:`Cluster::event_serializer` and is independent of ZeroMQ.
|
||||
The central broker needs no knowledge about the chosen format, it is
|
||||
only shuffling messages between nodes.
|
||||
|
||||
|
||||
Logging
|
||||
-------
|
||||
|
||||
While remote events always pass through the central broker, nodes connect and
|
||||
send log writes directly to logger nodes in a cluster. The ZeroMQ cluster backend
|
||||
leverages ZeroMQ's pipeline pattern for this functionality. That is, logger nodes
|
||||
(including the manager if configured using :zeek:see:`Cluster::manager_is_logger`)
|
||||
open a ZeroMQ PULL socket to receive log writes. All other nodes connect their
|
||||
PUSH socket to all available PULL sockets. These connections are separate from
|
||||
the publish-subscribe setup outlined above.
|
||||
|
||||
When sending log-writes over a PUSH socket, load balancing is done by ZeroMQ.
|
||||
Individual cluster nodes do not have control over the decision which logger
|
||||
node receives log writes at any given time.
|
||||
|
||||
.. figure:: /images/cluster/zeromq-logging.png
|
||||
|
||||
While the previous paragraph used "log writes", a single message to a logger
|
||||
node actually contains a batch of log writes. The options :zeek:see:`Log::flush_interval`
|
||||
and :zeek:see:`Log::write_buffer_size` control the frequency and maximum size
|
||||
of these batches.
|
||||
|
||||
The serialization format used to encode such batches is controlled by the
|
||||
selected :zeek:see:`Cluster::log_serializer` and is independent of ZeroMQ.
|
||||
|
||||
With the default serializer (:zeek:see:`Cluster::LOG_SERIALIZER_ZEEK_BIN_V1`),
|
||||
every log batch on the wire has a header prepended that describes it. This allows
|
||||
interpretation of log writes even by non-Zeek processes. This opens the possibility
|
||||
to implement non-Zeek logger processes as long as the chosen serializer format
|
||||
is understood by the receiving process. In the future, a JSON lines serialization
|
||||
may be provided, allowing easier interpretation than a proprietary binary format.
|
||||
|
||||
|
||||
Summary
|
||||
-------
|
||||
|
||||
Combining the diagrams above, the connections between the different socket
|
||||
types in a Zeek cluster looks something like the following.
|
||||
|
||||
.. figure:: /images/cluster/zeromq-cluster.png
|
||||
|
111
doc/devel/contributors.rst
Normal file
111
doc/devel/contributors.rst
Normal file
|
@ -0,0 +1,111 @@
|
|||
|
||||
===================
|
||||
Contributor's Guide
|
||||
===================
|
||||
|
||||
See below for selection of some of the more common contribution guidelines
|
||||
maintained directly in `Zeek wiki
|
||||
<https://github.com/zeek/zeek/wiki#contributors>`_.
|
||||
|
||||
General Contribution Process
|
||||
============================
|
||||
|
||||
See https://github.com/zeek/zeek/wiki/Contribution-Guide
|
||||
|
||||
Coding Style and Conventions
|
||||
============================
|
||||
|
||||
See https://github.com/zeek/zeek/wiki/Coding-Style-and-Conventions
|
||||
|
||||
General Documentation Structure/Process
|
||||
=======================================
|
||||
|
||||
See the :doc:`README </README>` file of https://github.com/zeek/zeek-docs
|
||||
|
||||
Documentation Style and Conventions
|
||||
===================================
|
||||
|
||||
See https://github.com/zeek/zeek/wiki/Documentation-Style-and-Conventions
|
||||
|
||||
Checking for Memory Errors and Leaks
|
||||
====================================
|
||||
|
||||
See https://github.com/zeek/zeek/wiki/Checking-for-Memory-Errors-and-Leaks
|
||||
|
||||
Maintaining long-lived forks of Zeek
|
||||
====================================
|
||||
|
||||
Consistent formatting of the Zeek codebase is enforced automatically by
|
||||
configurations tracked in the repository. Upstream updates to these
|
||||
configurations can lead to formatting changes which could cause merge conflicts
|
||||
for long-lived forks.
|
||||
|
||||
Currently the following configuration files in the root directory are used:
|
||||
|
||||
- ``.pre-commit-config.yaml``: Configuration for `pre-commit <https://pre-commit.com/>`_.
|
||||
We use pre-commit to manage and orchestrate formatters and linters.
|
||||
- ``.clang-format``: Configuration for `clang-format
|
||||
<https://clang.llvm.org/docs/ClangFormat.html>`_ for formatting C++ files.
|
||||
- ``.style.yapf``: Configuration for `YAPF <https://github.com/google/yapf>`_
|
||||
for formatting Python files.
|
||||
- ``.cmake-format.json``: Configuration for `cmake-format
|
||||
<https://github.com/cheshirekow/cmake_format>`_ for formatting CMake files.
|
||||
|
||||
With these configuration files present ``pre-commit run --all-files`` will
|
||||
install all needed formatters and reformat all files in the repository
|
||||
according to the current configuration.
|
||||
|
||||
.. rubric:: Workflow: Zeek ``master`` branch regularly merged into fork
|
||||
|
||||
If Zeek's master branch is regularly merged into the fork, merge conflicts can
|
||||
be resolved once and their resolution is tracked in the repository. Similarly,
|
||||
we can explicitly reformat the fork once and then merge the upstream branch.
|
||||
|
||||
.. code-block:: sh
|
||||
|
||||
## Get and stage latest versions of configuration files from master.
|
||||
git checkout master -- .pre-commit-config.yaml .clang-format .style.yapf .cmake-format.json
|
||||
|
||||
## Reformat fork according to new configuration.
|
||||
pre-commit run -a
|
||||
|
||||
## Record reformatted state of fork.
|
||||
git add -u && git commit -m 'Reformat'
|
||||
|
||||
# Merge in master, resolve merge conflicts as usual.
|
||||
git merge master
|
||||
|
||||
.. rubric:: Workflow: Fork regularly rebased onto Zeek ``master`` branch
|
||||
|
||||
If the target for a rebase has been reformatted individual diff hunks might not
|
||||
apply cleanly anymore. There are different approaches to work around that. The
|
||||
approach with the least conflicts is likely to first reformat the fork
|
||||
according to upstream style without pulling in changes, and only after that
|
||||
rebase on upstream and resolve potential semantic conflicts.
|
||||
|
||||
.. code-block:: sh
|
||||
|
||||
# Create a commit updating the configuration files.
|
||||
git checkout master -- .pre-commit-config.yaml .clang-format .style.yapf .cmake-format.json
|
||||
git commit -m 'Bump formatter configurations'
|
||||
|
||||
# With a fork branched from upstream at commit FORK_COMMIT, rebase the
|
||||
# config update commit 'Bump formatter configurations' to the start of the
|
||||
# fork, but do not yet rebase on master (interactively move the last patch
|
||||
# to the start of the list of patches).
|
||||
git rebase -i FORK_COMMIT
|
||||
|
||||
# Reformat all commits according to configs at the base. We use the '--exec'
|
||||
# flag of 'git rebase' to execute pre-commit after applying each patch. If
|
||||
# 'git rebase' detects uncommitted changes it stops automatic progress so
|
||||
# one can inspect and apply the changes.
|
||||
git rebase -i FORK_COMMIT --exec 'pre-commit run --all-files'
|
||||
# When this stops, inspect changes and stage them.
|
||||
git add -u
|
||||
# Continue rebasing. This prompts for a commit message and amends the last
|
||||
# patch.
|
||||
git rebase --continue
|
||||
|
||||
# The fork is now formatted according to upstream style. Rebase on master,
|
||||
# and drop the 'Bump formatter configurations' patch from the list of patches.
|
||||
git rebase -i master
|
21
doc/devel/index.rst
Normal file
21
doc/devel/index.rst
Normal file
|
@ -0,0 +1,21 @@
|
|||
|
||||
================
|
||||
Developer Guides
|
||||
================
|
||||
|
||||
In addition to documentation found or mentioned below, some developer-oriented
|
||||
content is maintained directly in the `Zeek wiki
|
||||
<https://github.com/zeek/zeek/wiki#development-guides>`_ due to the nature of
|
||||
the content (e.g. the author finds it to be more dynamic, informal, meta,
|
||||
transient, etc. compared to other documentation).
|
||||
|
||||
.. toctree::
|
||||
:maxdepth: 2
|
||||
|
||||
plugins
|
||||
spicy/index
|
||||
websocket-api
|
||||
Documentation Guide </README.rst>
|
||||
contributors
|
||||
maintainers
|
||||
cluster-backend-zeromq
|
13
doc/devel/maintainers.rst
Normal file
13
doc/devel/maintainers.rst
Normal file
|
@ -0,0 +1,13 @@
|
|||
|
||||
==================
|
||||
Maintainer's Guide
|
||||
==================
|
||||
|
||||
Some notable guidelines for maintainers are linked below for convenience, but
|
||||
they are generally maintained directly in the `Zeek wiki
|
||||
<https://github.com/zeek/zeek/wiki#maintainers>`_.
|
||||
|
||||
Release Process
|
||||
===============
|
||||
|
||||
See https://github.com/zeek/zeek/wiki/Release-Process
|
505
doc/devel/plugins.rst
Normal file
505
doc/devel/plugins.rst
Normal file
|
@ -0,0 +1,505 @@
|
|||
.. _zkg package manager: https://docs.zeek.org/projects/package-manager/en/stable/
|
||||
|
||||
.. _writing-plugins:
|
||||
|
||||
===============
|
||||
Writing Plugins
|
||||
===============
|
||||
|
||||
Zeek provides a plugin API that enables extending
|
||||
the system dynamically, without modifying the core code base. That way,
|
||||
custom code remains self-contained and can be maintained, compiled,
|
||||
and installed independently. Currently, plugins can add the following
|
||||
functionality to Zeek:
|
||||
|
||||
- Zeek scripts.
|
||||
|
||||
- Builtin functions/events/types for the scripting language.
|
||||
|
||||
- Protocol analyzers.
|
||||
|
||||
- File analyzers.
|
||||
|
||||
- Packet sources and packet dumpers.
|
||||
|
||||
- Logging framework backends.
|
||||
|
||||
- Input framework readers.
|
||||
|
||||
A plugin's functionality is available to the user just as if Zeek had
|
||||
the corresponding code built-in. Indeed, internally many of Zeek's
|
||||
pieces are structured as plugins as well; they are just statically
|
||||
compiled into the binary rather than loaded dynamically at runtime.
|
||||
|
||||
.. note::
|
||||
|
||||
Plugins and Zeek packages are related but separate concepts. Both extend
|
||||
Zeek's functionality without modifying Zeek's source code. A plugin achieves
|
||||
this via compiled, native code that Zeek links into its core at runtime. A Zeek
|
||||
package, on the other hand, is a modular addition to Zeek, managed via the
|
||||
`zkg package manager`_, that may or may not include a plugin. More commonly,
|
||||
packages consist of script-layer additions to Zeek's functionality. Packages
|
||||
also feature more elaborate metadata, enabling dependencies on other packages,
|
||||
Zeek versions, etc.
|
||||
|
||||
Quick Start
|
||||
===========
|
||||
|
||||
Writing a basic plugin is quite straightforward as long as one
|
||||
follows a few conventions. In the following, we create a simple example
|
||||
plugin that adds a new Built-In Function (BIF) to Zeek: we'll add
|
||||
``rot13(s: string) : string``, a function that rotates every letter
|
||||
in a string by 13 places.
|
||||
|
||||
Generally, a plugin comes in the form of a directory following a
|
||||
certain structure. To get started, Zeek's distribution provides a
|
||||
helper script ``auxil/zeek-aux/plugin-support/init-plugin`` that creates
|
||||
a skeleton plugin that can then be customized. Let's use that::
|
||||
|
||||
# init-plugin ./rot13-plugin Demo Rot13
|
||||
|
||||
As you can see, the script takes three arguments. The first is a
|
||||
directory inside which the plugin skeleton will be created. The second
|
||||
is the namespace the plugin will live in, and the third is a descriptive
|
||||
name for the plugin itself relative to the namespace. Zeek uses the
|
||||
combination of namespace and name to identify a plugin. The namespace
|
||||
serves to avoid naming conflicts between plugins written by independent
|
||||
developers; pick, e.g., the name of your organisation. The namespaces
|
||||
``Bro`` (legacy) and ``Zeek`` are reserved for functionality distributed
|
||||
by the Zeek Project. In
|
||||
our example, the plugin will be called ``Demo::Rot13``.
|
||||
|
||||
The ``init-plugin`` script puts a number of files in place. The full
|
||||
layout is described later. For now, all we need is
|
||||
``src/rot13.bif``. It's initially empty, but we'll add our new BIF
|
||||
there as follows::
|
||||
|
||||
# cat src/rot13.bif
|
||||
%%{
|
||||
#include <cstring>
|
||||
#include <cctype>
|
||||
#include "zeek/util.h"
|
||||
#include "zeek/ZeekString.h"
|
||||
#include "zeek/Val.h"
|
||||
%%}
|
||||
|
||||
module Demo;
|
||||
|
||||
function rot13%(s: string%) : string
|
||||
%{
|
||||
char* rot13 = util::copy_string(s->CheckString());
|
||||
|
||||
for ( char* p = rot13; *p; p++ )
|
||||
{
|
||||
char b = islower(*p) ? 'a' : 'A';
|
||||
char d = *p - b + 13;
|
||||
|
||||
if ( d >= 13 && d <= 38 )
|
||||
*p = d % 26 + b;
|
||||
}
|
||||
|
||||
zeek::String* zs = new zeek::String(1, reinterpret_cast<byte_vec>(rot13),
|
||||
strlen(rot13));
|
||||
return make_intrusive<StringVal>(zs);
|
||||
%}
|
||||
|
||||
The syntax of this file is just like any other ``*.bif`` file; we
|
||||
won't go into it here.
|
||||
|
||||
Now we are ready to compile our plugin. The configure script will just
|
||||
need to be able to find the location of either a Zeek installation-tree or
|
||||
a Zeek source-tree.
|
||||
|
||||
When building a plugin against a Zeek installation-tree, simply have the
|
||||
installation's associated ``zeek-config`` in your :envvar:`PATH` and the
|
||||
configure script will detect it and use it to obtain all the information
|
||||
it needs::
|
||||
|
||||
# which zeek-config
|
||||
/usr/local/zeek/bin/zeek-config
|
||||
# cd rot13-plugin
|
||||
# ./configure && make
|
||||
[... cmake output ...]
|
||||
|
||||
When building a plugin against a Zeek source-tree (which itself needs
|
||||
to have first been built), the configure script has to explicitly be
|
||||
told its location::
|
||||
|
||||
# cd rot13-plugin
|
||||
# ./configure --zeek-dist=/path/to/zeek/dist && make
|
||||
[... cmake output ...]
|
||||
|
||||
This builds the plugin in a subdirectory ``build/``. In fact, that
|
||||
subdirectory *becomes* the plugin: when ``make`` finishes, ``build/``
|
||||
has everything it needs for Zeek to recognize it as a dynamic plugin.
|
||||
|
||||
Let's try that. Once we point Zeek to the ``build/`` directory, it will
|
||||
pull in our new plugin automatically, as we can check with the ``-N``
|
||||
option::
|
||||
|
||||
# export ZEEK_PLUGIN_PATH=/path/to/rot13-plugin/build
|
||||
# zeek -N
|
||||
[...]
|
||||
Demo::Rot13 - <Insert description> (dynamic, version 0.1.0)
|
||||
[...]
|
||||
|
||||
That looks quite good, except for the dummy description that we should
|
||||
replace with something nicer so that users will know what our plugin
|
||||
is about. We do this by editing the ``config.description`` line in
|
||||
``src/Plugin.cc``, like this::
|
||||
|
||||
[...]
|
||||
plugin::Configuration Plugin::Configure()
|
||||
{
|
||||
plugin::Configuration config;
|
||||
config.name = "Demo::Rot13";
|
||||
config.description = "Caesar cipher rotating a string's letters by 13 places.";
|
||||
config.version.major = 0;
|
||||
config.version.minor = 1;
|
||||
config.version.patch = 0;
|
||||
return config;
|
||||
}
|
||||
[...]
|
||||
|
||||
Now rebuild and verify that the description is visible::
|
||||
|
||||
# make
|
||||
[...]
|
||||
# zeek -N | grep Rot13
|
||||
Demo::Rot13 - Caesar cipher rotating a string's letters by 13 places. (dynamic, version 0.1.0)
|
||||
|
||||
Zeek can also show us what exactly the plugin provides with the
|
||||
more verbose option ``-NN``::
|
||||
|
||||
# zeek -NN
|
||||
[...]
|
||||
Demo::Rot13 - Caesar cipher rotating a string's letters by 13 places. (dynamic, version 0.1.0)
|
||||
[Function] Demo::rot13
|
||||
[...]
|
||||
|
||||
There's our function. Now let's use it::
|
||||
|
||||
# zeek -e 'print Demo::rot13("Hello")'
|
||||
Uryyb
|
||||
|
||||
It works. We next install the plugin along with Zeek itself, so that it
|
||||
will find it directly without needing the ``ZEEK_PLUGIN_PATH``
|
||||
environment variable. If we first unset the variable, the function
|
||||
will no longer be available::
|
||||
|
||||
# unset ZEEK_PLUGIN_PATH
|
||||
# zeek -e 'print Demo::rot13("Hello")'
|
||||
error in <command line>, line 1: unknown identifier Demo::rot13, at or near "Demo::rot13"
|
||||
|
||||
Once we install it, it works again::
|
||||
|
||||
# make install
|
||||
# zeek -e 'print Demo::rot13("Hello")'
|
||||
Uryyb
|
||||
|
||||
The installed version went into
|
||||
``<zeek-install-prefix>/lib/zeek/plugins/Demo_Rot13``.
|
||||
|
||||
One can distribute the plugin independently of Zeek for others to use.
|
||||
To distribute in source form, just remove the ``build/`` directory
|
||||
(``make distclean`` does that) and then tar up the whole ``rot13-plugin/``
|
||||
directory. Others then follow the same process as above after
|
||||
unpacking.
|
||||
|
||||
To distribute the plugin in binary form, the build process
|
||||
conveniently creates a corresponding tarball in ``build/dist/``. In
|
||||
this case, it's called ``Demo_Rot13-0.1.0.tar.gz``, with the version
|
||||
number coming out of the ``VERSION`` file that ``init-plugin`` put
|
||||
into place. The binary tarball has everything needed to run the
|
||||
plugin, but no further source files. Optionally, one can include
|
||||
further files by specifying them in the plugin's ``CMakeLists.txt``
|
||||
through the ``zeek_plugin_dist_files`` macro; the skeleton does that
|
||||
for ``README``, ``VERSION``, ``CHANGES``, and ``COPYING``. To use the
|
||||
plugin through the binary tarball, just unpack it into
|
||||
``<zeek-install-prefix>/lib/zeek/plugins/``. Alternatively, if you unpack
|
||||
it in another location, then you need to point ``ZEEK_PLUGIN_PATH`` there.
|
||||
|
||||
Before distributing your plugin, you should edit some of the meta
|
||||
files that ``init-plugin`` puts in place. Edit ``README`` and
|
||||
``VERSION``, and update ``CHANGES`` when you make changes. Also put a
|
||||
license file in place as ``COPYING``; if BSD is fine, you will find a
|
||||
template in ``COPYING.edit-me``.
|
||||
|
||||
Plugin Directory Layout
|
||||
=======================
|
||||
|
||||
A plugin's directory needs to follow a set of conventions so that Zeek
|
||||
(1) recognizes it as a plugin, and (2) knows what to load. While
|
||||
``init-plugin`` takes care of most of this, the following is the full
|
||||
story. We'll use ``<base>`` to represent a plugin's top-level
|
||||
directory. With the skeleton, ``<base>`` corresponds to ``build/``.
|
||||
|
||||
``<base>/__zeek_plugin__``
|
||||
A file that marks a directory as containing a Zeek plugin. The file
|
||||
must exist, and its content must consist of a single line with the
|
||||
qualified name of the plugin (e.g., "Demo::Rot13").
|
||||
|
||||
``<base>/lib/<plugin-name>.<os>-<arch>.so``
|
||||
The shared library containing the plugin's compiled code. Zeek will
|
||||
load this in dynamically at run-time if OS and architecture match
|
||||
the current platform.
|
||||
|
||||
``scripts/``
|
||||
A directory with the plugin's custom Zeek scripts. When the plugin
|
||||
gets activated, this directory will be automatically added to
|
||||
``ZEEKPATH``, so that any scripts/modules inside can be
|
||||
"@load"ed.
|
||||
|
||||
``scripts/__load__.zeek``
|
||||
A Zeek script that will be loaded when the plugin gets activated.
|
||||
When this script executes, any BIF elements that the plugin
|
||||
defines will already be available. See below for more information
|
||||
on activating plugins.
|
||||
|
||||
``scripts/__preload__.zeek``
|
||||
A Zeek script that will be loaded when the plugin gets activated,
|
||||
but before any BIF elements become available. See below for more
|
||||
information on activating plugins.
|
||||
|
||||
``lib/bif/``
|
||||
Directory with auto-generated Zeek scripts that declare the plugin's
|
||||
BIF elements. The files here are produced by ``bifcl``.
|
||||
|
||||
Any other files in ``<base>`` are ignored by Zeek.
|
||||
|
||||
By convention, a plugin should put its custom scripts into subfolders
|
||||
of ``scripts/``, i.e., ``scripts/<plugin-namespace>/<plugin-name>/<script>.zeek``
|
||||
to avoid conflicts. As usual, you can then put a ``__load__.zeek`` in
|
||||
there as well so that, e.g., ``@load Demo/Rot13`` could load a whole
|
||||
module in the form of multiple individual scripts.
|
||||
|
||||
Note that in addition to the paths above, the ``init-plugin`` helper
|
||||
puts some more files and directories in place that help with
|
||||
development and installation (e.g., ``CMakeLists.txt``, ``Makefile``,
|
||||
and source code in ``src/``). However, all these do not have a special
|
||||
meaning for Zeek at runtime and aren't necessary for a plugin to
|
||||
function.
|
||||
|
||||
``init-plugin``
|
||||
===============
|
||||
|
||||
``init-plugin`` puts a basic plugin structure in place that follows
|
||||
the above layout and augments it with a CMake build and installation
|
||||
system. Plugins with this structure can be used both directly out of
|
||||
their source directory (after ``make`` and setting Zeek's
|
||||
``ZEEK_PLUGIN_PATH``), and when installed alongside Zeek (after ``make
|
||||
install``).
|
||||
|
||||
Upon completion, ``init-plugin`` initializes a git repository and stages its
|
||||
produced files for committing, but does not yet commit the files. This allows
|
||||
you to tweak the new plugin as needed prior to the initial commit.
|
||||
|
||||
``make install`` copies over the ``lib`` and ``scripts`` directories,
|
||||
as well as the ``__zeek_plugin__`` magic file and any further
|
||||
distribution files specified in ``CMakeLists.txt`` (e.g., README,
|
||||
VERSION). You can find a full list of files installed in
|
||||
``build/MANIFEST``. Behind the scenes, ``make install`` really just
|
||||
unpacks the binary tarball from ``build/dist`` into the destination
|
||||
directory.
|
||||
|
||||
``init-plugin`` will never overwrite existing files. If its target
|
||||
directory already exists, it will by default decline to do anything.
|
||||
You can run it with ``-u`` instead to update an existing plugin,
|
||||
however it will never overwrite any existing files; it will only put
|
||||
in place files it doesn't find yet. To revert a file back to what
|
||||
``init-plugin`` created originally, delete it first and then rerun
|
||||
with ``-u``.
|
||||
|
||||
``init-plugin`` puts a ``configure`` script in place that wraps
|
||||
``cmake`` with a more familiar configure-style configuration. By
|
||||
default, the script provides two options for specifying paths to the
|
||||
Zeek source (``--zeek-dist``) and to the plugin's installation directory
|
||||
(``--install-root``). To extend ``configure`` with plugin-specific
|
||||
options (such as search paths for its dependencies) don't edit the
|
||||
script directly but instead extend ``configure.plugin``, which
|
||||
``configure`` includes. That way you will be able to more easily
|
||||
update ``configure`` in the future when the distribution version
|
||||
changes. In ``configure.plugin`` you can use the predefined shell
|
||||
function ``append_cache_entry`` to seed values into the CMake cache;
|
||||
see the installed skeleton version and existing plugins for examples.
|
||||
|
||||
.. note::
|
||||
|
||||
In the past ``init-plugin`` also generated a ``zkg.meta`` file, automatically
|
||||
creating a Zeek package containing a plugin. ``init-plugin`` now focuses
|
||||
purely on plugins, as its name suggests. To bootstrap new Zeek packages
|
||||
(possibly containing plugins), use the more featureful templating
|
||||
functionality provided by the ``zkg create`` command, explained `here
|
||||
<https://docs.zeek.org/projects/package-manager/en/stable/package.html>`_.
|
||||
|
||||
Activating a Plugin
|
||||
===================
|
||||
|
||||
A plugin needs to be *activated* to make it available to the user.
|
||||
Activating a plugin will:
|
||||
|
||||
1. Load the dynamic module
|
||||
2. Make any BIF items available
|
||||
3. Add the ``scripts/`` directory to ``ZEEKPATH``
|
||||
4. Load ``scripts/__preload__.zeek``
|
||||
5. Make BIF elements available to scripts.
|
||||
6. Load ``scripts/__load__.zeek``
|
||||
|
||||
By default, Zeek will automatically activate all dynamic plugins found
|
||||
in its search path ``ZEEK_PLUGIN_PATH``. However, in bare mode (``zeek
|
||||
-b``), no dynamic plugins will be activated by default; instead the
|
||||
user can selectively enable individual plugins in scriptland using the
|
||||
``@load-plugin <qualified-plugin-name>`` directive (e.g.,
|
||||
``@load-plugin Demo::Rot13``). Alternatively, one can activate a
|
||||
plugin from the command-line by specifying its full name
|
||||
(``Demo::Rot13``), or set the environment variable
|
||||
``ZEEK_PLUGIN_ACTIVATE`` to a list of comma-separated names of
|
||||
plugins to unconditionally activate, even in bare mode.
|
||||
|
||||
``zeek -N`` shows activated plugins separately from found but not yet
|
||||
activated plugins. Note that plugins compiled statically into Zeek are
|
||||
always activated, and hence show up as such even in bare mode.
|
||||
|
||||
Plugin Components
|
||||
=================
|
||||
|
||||
It's easy for a plugin to provide custom scripts: just put them into
|
||||
``scripts/``, as described above. The CMake infrastructure will automatically
|
||||
install them, as well include them into the source and binary plugin
|
||||
distributions.
|
||||
|
||||
Any number or combination of other components can be provided by a single
|
||||
plugin. For example a plugin can provide multiple different protocol
|
||||
analyzers, or both a log writer and input reader.
|
||||
|
||||
The best place to look for examples or templates for a specific type of plugin
|
||||
component are the source code of Zeek itself since every one of its components
|
||||
uses the same API as any external plugin.
|
||||
|
||||
Each component type also has a simple integration test, found
|
||||
in the Zeek source-tree's ``testing/btest/plugins/`` directory,
|
||||
that can serve useful for creating basic plugin skeletons.
|
||||
|
||||
Testing Plugins
|
||||
===============
|
||||
|
||||
A plugin should come with a test suite to exercise its functionality.
|
||||
The ``init-plugin`` script puts in place a basic
|
||||
`BTest <https://github.com/zeek/btest>`_ setup
|
||||
to start with. Initially, it comes with a single test that just checks
|
||||
that Zeek loads the plugin correctly::
|
||||
|
||||
# cd tests
|
||||
# btest -A
|
||||
[ 0%] rot13.show-plugin ... ok
|
||||
all 1 tests successful
|
||||
|
||||
You can also run this via the Makefile::
|
||||
|
||||
# cd ..
|
||||
# make test
|
||||
make -C tests
|
||||
make[1]: Entering directory `tests'
|
||||
all 1 tests successful
|
||||
make[1]: Leaving directory `tests'
|
||||
|
||||
Now let's add a custom test that ensures that our BIF works correctly::
|
||||
|
||||
# cd tests
|
||||
# cat >rot13/bif-rot13.zeek
|
||||
|
||||
# @TEST-EXEC: zeek %INPUT >output
|
||||
# @TEST-EXEC: btest-diff output
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
print Demo::rot13("Hello");
|
||||
}
|
||||
|
||||
Check the output::
|
||||
|
||||
# btest -d rot13/bif-rot13.zeek
|
||||
[ 0%] rot13.bif-rot13 ... failed
|
||||
% 'btest-diff output' failed unexpectedly (exit code 100)
|
||||
% cat .diag
|
||||
== File ===============================
|
||||
Uryyb
|
||||
== Error ===============================
|
||||
test-diff: no baseline found.
|
||||
=======================================
|
||||
|
||||
% cat .stderr
|
||||
|
||||
1 of 1 test failed
|
||||
|
||||
Install the baseline::
|
||||
|
||||
# btest -U rot13/bif-rot13.zeek
|
||||
all 1 tests successful
|
||||
|
||||
Run the test-suite::
|
||||
|
||||
# btest
|
||||
all 2 tests successful
|
||||
|
||||
Debugging Plugins
|
||||
=================
|
||||
|
||||
If your plugin isn't loading as expected, Zeek's debugging facilities
|
||||
can help illuminate what's going on. To enable, recompile Zeek
|
||||
with debugging support (``./configure --enable-debug``), and
|
||||
afterwards rebuild your plugin as well. If you then run Zeek with ``-B
|
||||
plugins``, it will produce a file :file:`debug.log` that records details
|
||||
about the process for searching, loading, and activating plugins.
|
||||
|
||||
To generate your own debugging output from inside your plugin, you can
|
||||
add a custom debug stream by using the ``PLUGIN_DBG_LOG(<plugin>,
|
||||
<args>)`` macro (defined in ``DebugLogger.h``), where ``<plugin>`` is
|
||||
the ``Plugin`` instance and ``<args>`` are printf-style arguments,
|
||||
just as with Zeek's standard debugging macros (grep for ``DBG_LOG`` in
|
||||
Zeek's ``src/`` to see examples). At runtime, you can then activate
|
||||
your plugin's debugging output with ``-B plugin-<name>``, where
|
||||
``<name>`` is the name of the plugin as returned by its
|
||||
``Configure()`` method, yet with the namespace-separator ``::``
|
||||
replaced with a simple dash. Example: If the plugin is called
|
||||
``Demo::Rot13``, use ``-B plugin-Demo-Rot13``. As usual, the debugging
|
||||
output will be recorded to :file:`debug.log` if Zeek's compiled in debug
|
||||
mode.
|
||||
|
||||
.. _building-plugins-statically:
|
||||
|
||||
Building Plugins Statically into Zeek
|
||||
=====================================
|
||||
|
||||
Plugins can be built statically into a Zeek binary using the
|
||||
``--include-plugins`` option passed to Zeek's ``configure``. This argument
|
||||
takes a semicolon-separated list of absolute paths to plugin sources. Each
|
||||
path needs to contain a ``CMakeLists.txt`` file, as is commonly the case at the
|
||||
toplevel of plugin source trees, and usually also in Zeek packages. Building
|
||||
plugins in this manner includes them directly into the Zeek binary
|
||||
and installation. They are loaded automatically by Zeek at startup
|
||||
without needing to install them separately.
|
||||
|
||||
Building plugins into Zeek is a handy way to build them consistently with
|
||||
sanitizers, as you can use Zeek's existing ``./configure --sanitizers=...``
|
||||
infrastructure to apply transparently to built-in plugins.
|
||||
|
||||
The configure run lists built-in plugins at the end, so you can verify
|
||||
successful inclusion of your plugin there. Your plugin should also
|
||||
show up in the resulting build's ``zeek -NN`` output.
|
||||
|
||||
Headers for built-in plugins are installed into a subdirectory of
|
||||
``<zeek-install-prefix>/include/zeek/builtin-plugins`` specific to
|
||||
each plugin. Scripts are installed into a subdirectory of
|
||||
``<zeek-install-prefix>/share/zeek/builtin-plugins`` specific to
|
||||
each plugin. The scripts directory is also automatically added to
|
||||
the default ``ZEEKPATH``.
|
||||
|
||||
Plugin Tutorials
|
||||
================
|
||||
|
||||
.. toctree::
|
||||
:maxdepth: 1
|
||||
|
||||
plugins/connkey-plugin
|
||||
plugins/event-metadata-plugin
|
205
doc/devel/plugins/connkey-plugin.rst
Normal file
205
doc/devel/plugins/connkey-plugin.rst
Normal file
|
@ -0,0 +1,205 @@
|
|||
.. _connkey-plugin:
|
||||
|
||||
===============================
|
||||
Writing a Connection Key Plugin
|
||||
===============================
|
||||
|
||||
.. versionadded:: 8.0
|
||||
|
||||
By default, Zeek looks up internal connection state using the classic five-tuple
|
||||
of originator and responder IP addresses, ports, and the numeric protocol
|
||||
identifier (for TCP, UDP, etc). Zeek's data structure driving this is called a
|
||||
connection key, or ``ConnKey``.
|
||||
|
||||
In certain environments the classic five-tuple does not sufficiently distinguish
|
||||
connections. Consider traffic mirrored from multiple VLANs with overlapping IP
|
||||
address ranges. Concretely, a connection between 10.0.0.1 and 10.0.0.2 in one
|
||||
VLAN is distinct from a connection between the same IPs in another VLAN. Here,
|
||||
Zeek should include the VLAN identifier into the connection key, and you can
|
||||
instruct Zeek to do so by loading the
|
||||
:doc:`/scripts/policy/frameworks/conn_key/vlan_fivetuple.zeek` policy script.
|
||||
|
||||
Zeek's plugin API allows adding support for additional custom connection keys.
|
||||
This section provides a tutorial on how to do so, using the example of VXLAN-enabled
|
||||
flow tuples. If you're not familiar with plugin development, head over to the
|
||||
:ref:`Writing Plugins <writing-plugins>` section.
|
||||
|
||||
Our goal is to implement a custom connection key to scope connections
|
||||
transported within a `VXLAN <https://datatracker.ietf.org/doc/html/rfc7348>`_
|
||||
tunnel by the VXLAN Network Identifier (VNI).
|
||||
|
||||
As a test case, we have encapsulated the `HTTP GET trace <https://github.com/zeek/zeek/raw/refs/heads/master/testing/btest/Traces/http/get.trace>`_
|
||||
from the Zeek repository twice with VXLAN using VNIs 4711 and 4242, respectively,
|
||||
and merged the resulting two PCAP files with the original PCAP.
|
||||
The :download:`resulting PCAP <connkey-vxlan-fivetuple-plugin-src/Traces/vxlan-overlapping-http-get.pcap>`
|
||||
contains three HTTP connections, two of which are VXLAN-encapsulated.
|
||||
|
||||
By default, Zeek will create the same connection key for the original and
|
||||
encapsulated HTTP connections, since they have identical inner five-tuples.
|
||||
Therefore, Zeek creates only a single ``http.log`` entry, and two entries
|
||||
in ``conn.log``.
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ zeek -C -r Traces/vxlan-overlapping-http-get.pcap
|
||||
$ zeek-cut -m uid method host uri < http.log
|
||||
uid method host uri
|
||||
CpWF5etn1l2rpaLu3 GET bro.org /download/CHANGES.bro-aux.txt
|
||||
|
||||
$ zeek-cut -m uid service history orig_pkts resp_pkts < conn.log
|
||||
uid service history orig_pkts resp_pkts
|
||||
Cq2CY245oGGbibJ8k9 http ShADTadtFf 21 21
|
||||
CMleDu4xANIMzePYd7 vxlan D 28 0
|
||||
|
||||
Note that just two of the HTTP connections are encapsulated.
|
||||
That is why the VXLAN connection shows only 28 packets.
|
||||
Each HTTP connection has 14 packets total, 7 in each direction. Zeek aggregates
|
||||
all packets into the single HTTP connection, but only 28 of them were
|
||||
transported within the VXLAN tunnel connection. Note also the ``t`` and ``T``
|
||||
flags in the :zeek:field:`Conn::Info$history` field. These stand for retransmissions,
|
||||
caused by Zeek not discriminating between the different HTTP connections.
|
||||
|
||||
The plugin we'll develop below adds the VXLAN VNI to the connection key.
|
||||
As a result, Zeek will correctly report three HTTP connections, tracked
|
||||
and logged separately. We'll add the VNI as
|
||||
:zeek:field:`vxlan_vni` to the :zeek:see:`conn_id_ctx` record, making it available
|
||||
in ``http.log`` and ``conn.log`` via the ``id.ctx.vxlan_vni`` column.
|
||||
|
||||
After activating the plugin Zeek tracks each HTTP connection individually and
|
||||
the logs will look as follows:
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ zeek-cut -m uid method host uri id.ctx.vxlan_vni < http.log
|
||||
uid method host uri id.ctx.vxlan_vni
|
||||
CBifsS2vqGEg8Fa5ac GET bro.org /download/CHANGES.bro-aux.txt 4711
|
||||
CEllEz13txeSrbGqBe GET bro.org /download/CHANGES.bro-aux.txt 4242
|
||||
CRfbJw1kBBvHDQQBta GET bro.org /download/CHANGES.bro-aux.txt -
|
||||
|
||||
$ zeek-cut -m uid service history orig_pkts resp_pkts id.ctx.vxlan_vni < conn.log
|
||||
uid service history orig_pkts resp_pkts id.ctx.vxlan_vni
|
||||
CRfbJw1kBBvHDQQBta http ShADadFf 7 7 -
|
||||
CEllEz13txeSrbGqBe http ShADadFf 7 7 4242
|
||||
CBifsS2vqGEg8Fa5ac http ShADadFf 7 7 4711
|
||||
CC6Ald2LejCS1qcDy4 vxlan D 28 0 -
|
||||
|
||||
|
||||
Implementation
|
||||
==============
|
||||
|
||||
Adding alternative connection keys involves implementing two classes.
|
||||
First, a factory class producing ``zeek::ConnKey`` instances. This
|
||||
is the class created through the added ``zeek::conn_key::Component``.
|
||||
Second, a custom connection key class derived from ``zeek::ConnKey``.
|
||||
Instances of this class are created by the factory. This is a typical
|
||||
abstract factory pattern.
|
||||
|
||||
Our plugin's ``Configure()`` method follows the standard pattern of setting up
|
||||
basic information about the plugin and registering our own ``ConnKey`` component.
|
||||
|
||||
.. literalinclude:: connkey-vxlan-fivetuple-plugin-src/src/Plugin.cc
|
||||
:caption: Plugin.cc
|
||||
:language: cpp
|
||||
:lines: 16-
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
|
||||
Next, in the ``Factory.cc`` file, we're implementing a custom ``zeek::ConnKey`` class.
|
||||
This class is named ``VxlanVniConnKey`` and inherits from ``zeek::IPBasedConnKey``.
|
||||
While ``zeek::ConnKey`` is technically the base class, in this tutorial we'll
|
||||
derive from ``zeek::IPBasedConnKey``.
|
||||
Currently, Zeek only supports IP-based connection tracking via the
|
||||
``IPBasedAnalyzer`` analyzer. This analyzer requires ``zeek::IPBasedConnKey``
|
||||
instances.
|
||||
|
||||
.. literalinclude:: connkey-vxlan-fivetuple-plugin-src/src/Factory.cc
|
||||
:caption: VxlanVniConnKey class in Factory.cc
|
||||
:language: cpp
|
||||
:linenos:
|
||||
:lines: 18-78
|
||||
:tab-width: 4
|
||||
|
||||
The current pattern for custom connection keys is to embed the bytes used for
|
||||
the ``zeek::session::detail::Key`` as a packed struct within a ``ConnKey`` instance.
|
||||
We override ``DoPopulateConnIdVal()`` to set the :zeek:field:`vxlan_vni` field
|
||||
of the :zeek:see:`conn_id_ctx` record value to the extracted VXLAN VNI. A small trick
|
||||
employed is that we default the most significant byte of ``key.vxlan_vni`` to 0xFF.
|
||||
As a VNI has only 24 bits, this allows us to determine if a VNI was actually
|
||||
extracted, or whether it remained unset.
|
||||
|
||||
The ``DoInit()`` implementation is the actual place for connection key customization.
|
||||
This is where we extract the VXLAN VNI from packet data. To do so, we're using the relatively
|
||||
new ``GetAnalyzerData()`` API of the packet analysis manager.
|
||||
This API allows generic access to the raw data layers analyzed by a given packet analyzer.
|
||||
For our use-case, we take the most outer VXLAN layer, if any, and extract the VNI
|
||||
into ``key.vxlan_vni``.
|
||||
|
||||
There's no requirement to use the ``GetAnalyzerData()`` API. If the ``zeek::Packet``
|
||||
instance passed to ``DoInit()`` contains the needed information, e.g. VLAN identifiers
|
||||
or information from the packet's raw bytes, you can use them directly.
|
||||
Specifically, ``GetAnalyzerData()`` may introduce additional overhead into the
|
||||
packet path that you can avoid if the information is readily available
|
||||
elsewhere.
|
||||
Using other Zeek APIs to determine connection key information is of course
|
||||
also possible.
|
||||
|
||||
The next part shown concerns the ``Factory`` class itself. The
|
||||
``DoConnKeyFromVal()`` method contains logic to produce a ``VxlanVniConnKey``
|
||||
instance from an existing :zeek:see:`conn_id` record.
|
||||
This is needed in order for the :zeek:see:`lookup_connection` builtin function to work properly.
|
||||
The implementation re-uses the ``DoConnKeyFromVal()`` implementation of the
|
||||
default ``fivetuple::Factory`` that our factory inherits from to extract the
|
||||
classic five-tuple information.
|
||||
|
||||
.. literalinclude:: connkey-vxlan-fivetuple-plugin-src/src/Factory.cc
|
||||
:caption: Factory class in Factory.cc
|
||||
:language: cpp
|
||||
:linenos:
|
||||
:lines: 80-103
|
||||
:tab-width: 4
|
||||
|
||||
Calling the ``fivetuple::Factory::DoConnKeyFromVal()`` in turn calls our
|
||||
own factory's ``DoNewConnKey()`` method through virtual dispatch. Since our
|
||||
factory overrides this method to always return a ``VxlanVniConnKey`` instance,
|
||||
the static cast later is safe.
|
||||
|
||||
Last, the plugin's ``__load__.zeek`` file is shown. It includes the extension
|
||||
of the :zeek:see:`conn_id_ctx` identifier by the :zeek:field:`vxlan_vni` field.
|
||||
|
||||
.. literalinclude:: connkey-vxlan-fivetuple-plugin-src/scripts/__load__.zeek
|
||||
:caption: The conn_id redefinition in __load__.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
|
||||
Using the custom Connection Key
|
||||
===============================
|
||||
|
||||
After installing the plugin, the new connection key implementation can be
|
||||
selected by redefining the script-level :zeek:see:`ConnKey::factory` variable.
|
||||
This can either be done in a separate script, but we do it directly on the
|
||||
command-line for simplicity. The ``ConnKey::CONNKEY_VXLAN_VNI_FIVETUPLE`` is
|
||||
registered in Zeek during the plugin's ``AddComponent()`` call during
|
||||
``Configure()``, where the component has the name ``VXLAN_VNI_FIVETUPLE``.
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ zeek -C -r Traces/vxlan-overlapping-http-get.pcap ConnKey::factory=ConnKey::CONNKEY_VXLAN_VNI_FIVETUPLE
|
||||
|
||||
|
||||
Viewing the ``conn.log`` now shows three separate HTTP connections,
|
||||
two of which have a ``vxlan_vni`` value set in their logs.
|
||||
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ zeek-cut -m uid service history orig_pkts resp_pkts id.ctx.vxlan_vni < conn.log
|
||||
uid service history orig_pkts resp_pkts id.ctx.vxlan_vni
|
||||
CRfbJw1kBBvHDQQBta http ShADadFf 7 7 -
|
||||
CEllEz13txeSrbGqBe http ShADadFf 7 7 4242
|
||||
CBifsS2vqGEg8Fa5ac http ShADadFf 7 7 4711
|
||||
CC6Ald2LejCS1qcDy4 vxlan D 28 0 -
|
||||
|
||||
Pretty cool, isn't it?
|
|
@ -0,0 +1,9 @@
|
|||
cmake_minimum_required(VERSION 3.15 FATAL_ERROR)
|
||||
|
||||
project(ZeekPluginConnKeyVxlanVniFivetuple)
|
||||
|
||||
include(ZeekPlugin)
|
||||
|
||||
zeek_add_plugin(
|
||||
Zeek ConnKey_Vxlan_Vni_Fivetuple
|
||||
SOURCES src/Factory.cc src/Plugin.cc SCRIPT_FILES scripts/__load__.zeek)
|
26
doc/devel/plugins/connkey-vxlan-fivetuple-plugin-src/COPYING
Normal file
26
doc/devel/plugins/connkey-vxlan-fivetuple-plugin-src/COPYING
Normal file
|
@ -0,0 +1,26 @@
|
|||
Copyright (c) 2025 by the Zeek Project. All rights reserved.
|
||||
|
||||
Redistribution and use in source and binary forms, with or without modification,
|
||||
are permitted provided that the following conditions are met:
|
||||
|
||||
1. Redistributions of source code must retain the above copyright notice, this
|
||||
list of conditions and the following disclaimer.
|
||||
|
||||
2. Redistributions in binary form must reproduce the above copyright notice,
|
||||
this list of conditions and the following disclaimer in the documentation
|
||||
and/or other materials provided with the distribution.
|
||||
|
||||
3. Neither the name of the copyright holder nor the names of its contributors
|
||||
may be used to endorse or promote products derived from this software
|
||||
without specific prior written permission.
|
||||
|
||||
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
||||
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
||||
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||||
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
|
||||
ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
||||
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
||||
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
|
||||
ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
||||
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
@ -0,0 +1,23 @@
|
|||
#
|
||||
# Convenience Makefile providing a few common top-level targets.
|
||||
#
|
||||
|
||||
cmake_build_dir=build
|
||||
arch=`uname -s | tr A-Z a-z`-`uname -m`
|
||||
|
||||
all: build-it
|
||||
|
||||
build-it:
|
||||
( cd $(cmake_build_dir) && make )
|
||||
|
||||
install:
|
||||
( cd $(cmake_build_dir) && make install )
|
||||
|
||||
clean:
|
||||
( cd $(cmake_build_dir) && make clean )
|
||||
|
||||
distclean:
|
||||
rm -rf $(cmake_build_dir)
|
||||
|
||||
test:
|
||||
make -C tests
|
Binary file not shown.
|
@ -0,0 +1 @@
|
|||
0.1.0
|
193
doc/devel/plugins/connkey-vxlan-fivetuple-plugin-src/configure
vendored
Executable file
193
doc/devel/plugins/connkey-vxlan-fivetuple-plugin-src/configure
vendored
Executable file
|
@ -0,0 +1,193 @@
|
|||
#!/bin/sh
|
||||
#
|
||||
# Wrapper for viewing/setting options that the plugin's CMake
|
||||
# scripts will recognize.
|
||||
#
|
||||
# Don't edit this. Edit configure.plugin to add plugin-specific options.
|
||||
#
|
||||
|
||||
set -e
|
||||
command="$0 $*"
|
||||
|
||||
if [ -e $(dirname $0)/configure.plugin ]; then
|
||||
# Include custom additions.
|
||||
. $(dirname $0)/configure.plugin
|
||||
fi
|
||||
|
||||
usage() {
|
||||
|
||||
cat 1>&2 <<EOF
|
||||
Usage: $0 [OPTIONS]
|
||||
|
||||
Plugin Options:
|
||||
--cmake=PATH Path to CMake binary
|
||||
--zeek-dist=DIR Path to Zeek source tree
|
||||
--install-root=DIR Path where to install plugin into
|
||||
--with-binpac=DIR Path to BinPAC installation root
|
||||
--with-broker=DIR Path to Broker installation root
|
||||
--with-bifcl=PATH Path to bifcl executable
|
||||
--enable-debug Compile in debugging mode
|
||||
--disable-cpp-tests Don't build C++ unit tests
|
||||
EOF
|
||||
|
||||
if type plugin_usage >/dev/null 2>&1; then
|
||||
plugin_usage 1>&2
|
||||
fi
|
||||
|
||||
echo
|
||||
|
||||
exit 1
|
||||
}
|
||||
|
||||
# Function to append a CMake cache entry definition to the
|
||||
# CMakeCacheEntries variable
|
||||
# $1 is the cache entry variable name
|
||||
# $2 is the cache entry variable type
|
||||
# $3 is the cache entry variable value
|
||||
append_cache_entry() {
|
||||
CMakeCacheEntries="$CMakeCacheEntries -D $1:$2=$3"
|
||||
}
|
||||
|
||||
# set defaults
|
||||
builddir=build
|
||||
zeekdist=""
|
||||
installroot="default"
|
||||
zeek_plugin_begin_opts=""
|
||||
CMakeCacheEntries=""
|
||||
|
||||
while [ $# -ne 0 ]; do
|
||||
case "$1" in
|
||||
-*=*) optarg=$(echo "$1" | sed 's/[-_a-zA-Z0-9]*=//') ;;
|
||||
*) optarg= ;;
|
||||
esac
|
||||
|
||||
case "$1" in
|
||||
--help | -h)
|
||||
usage
|
||||
;;
|
||||
|
||||
--cmake=*)
|
||||
CMakeCommand=$optarg
|
||||
;;
|
||||
|
||||
--zeek-dist=*)
|
||||
zeekdist=$(cd $optarg && pwd)
|
||||
;;
|
||||
|
||||
--install-root=*)
|
||||
installroot=$optarg
|
||||
;;
|
||||
|
||||
--with-binpac=*)
|
||||
append_cache_entry BinPAC_ROOT_DIR PATH $optarg
|
||||
binpac_root=$optarg
|
||||
;;
|
||||
|
||||
--with-broker=*)
|
||||
append_cache_entry BROKER_ROOT_DIR PATH $optarg
|
||||
broker_root=$optarg
|
||||
;;
|
||||
|
||||
--with-bifcl=*)
|
||||
append_cache_entry BifCl_EXE PATH $optarg
|
||||
;;
|
||||
|
||||
--enable-debug)
|
||||
append_cache_entry BRO_PLUGIN_ENABLE_DEBUG BOOL true
|
||||
;;
|
||||
|
||||
--disable-cpp-tests)
|
||||
zeek_plugin_begin_opts="DISABLE_CPP_TESTS;$zeek_plugin_begin_opts"
|
||||
;;
|
||||
|
||||
*)
|
||||
if type plugin_option >/dev/null 2>&1; then
|
||||
plugin_option $1 && shift && continue
|
||||
fi
|
||||
|
||||
echo "Invalid option '$1'. Try $0 --help to see available options."
|
||||
exit 1
|
||||
;;
|
||||
esac
|
||||
shift
|
||||
done
|
||||
|
||||
if [ -z "$CMakeCommand" ]; then
|
||||
# prefer cmake3 over "regular" cmake (cmake == cmake2 on RHEL)
|
||||
if command -v cmake3 >/dev/null 2>&1; then
|
||||
CMakeCommand="cmake3"
|
||||
elif command -v cmake >/dev/null 2>&1; then
|
||||
CMakeCommand="cmake"
|
||||
else
|
||||
echo "This plugin requires CMake, please install it first."
|
||||
echo "Then you may use this script to configure the CMake build."
|
||||
echo "Note: pass --cmake=PATH to use cmake in non-standard locations."
|
||||
exit 1
|
||||
fi
|
||||
fi
|
||||
|
||||
if [ -z "$zeekdist" ]; then
|
||||
if type zeek-config >/dev/null 2>&1; then
|
||||
zeek_config="zeek-config"
|
||||
else
|
||||
echo "Either 'zeek-config' must be in PATH or '--zeek-dist=<path>' used"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
append_cache_entry BRO_CONFIG_PREFIX PATH $(${zeek_config} --prefix)
|
||||
append_cache_entry BRO_CONFIG_INCLUDE_DIR PATH $(${zeek_config} --include_dir)
|
||||
append_cache_entry BRO_CONFIG_PLUGIN_DIR PATH $(${zeek_config} --plugin_dir)
|
||||
append_cache_entry BRO_CONFIG_LIB_DIR PATH $(${zeek_config} --lib_dir)
|
||||
append_cache_entry BRO_CONFIG_CMAKE_DIR PATH $(${zeek_config} --cmake_dir)
|
||||
append_cache_entry CMAKE_MODULE_PATH PATH $(${zeek_config} --cmake_dir)
|
||||
|
||||
build_type=$(${zeek_config} --build_type)
|
||||
|
||||
if [ "$build_type" = "debug" ]; then
|
||||
append_cache_entry BRO_PLUGIN_ENABLE_DEBUG BOOL true
|
||||
fi
|
||||
|
||||
if [ -z "$binpac_root" ]; then
|
||||
append_cache_entry BinPAC_ROOT_DIR PATH $(${zeek_config} --binpac_root)
|
||||
fi
|
||||
|
||||
if [ -z "$broker_root" ]; then
|
||||
append_cache_entry BROKER_ROOT_DIR PATH $(${zeek_config} --broker_root)
|
||||
fi
|
||||
else
|
||||
if [ ! -e "$zeekdist/zeek-path-dev.in" ]; then
|
||||
echo "$zeekdist does not appear to be a valid Zeek source tree."
|
||||
exit 1
|
||||
fi
|
||||
|
||||
# BRO_DIST is the canonical/historical name used by plugin CMake scripts
|
||||
# ZEEK_DIST doesn't serve a function at the moment, but set/provided anyway
|
||||
append_cache_entry BRO_DIST PATH $zeekdist
|
||||
append_cache_entry ZEEK_DIST PATH $zeekdist
|
||||
append_cache_entry CMAKE_MODULE_PATH PATH $zeekdist/cmake
|
||||
fi
|
||||
|
||||
if [ "$installroot" != "default" ]; then
|
||||
mkdir -p $installroot
|
||||
append_cache_entry BRO_PLUGIN_INSTALL_ROOT PATH $installroot
|
||||
fi
|
||||
|
||||
if [ -n "$zeek_plugin_begin_opts" ]; then
|
||||
append_cache_entry ZEEK_PLUGIN_BEGIN_OPTS STRING "$zeek_plugin_begin_opts"
|
||||
fi
|
||||
|
||||
if type plugin_addl >/dev/null 2>&1; then
|
||||
plugin_addl
|
||||
fi
|
||||
|
||||
echo "Build Directory : $builddir"
|
||||
echo "Zeek Source Directory : $zeekdist"
|
||||
|
||||
mkdir -p $builddir
|
||||
cd $builddir
|
||||
|
||||
"$CMakeCommand" $CMakeCacheEntries ..
|
||||
|
||||
echo "# This is the command used to configure this build" >config.status
|
||||
echo $command >>config.status
|
||||
chmod u+x config.status
|
|
@ -0,0 +1,3 @@
|
|||
redef record conn_id_ctx += {
|
||||
vxlan_vni: count &log &optional;
|
||||
};
|
|
@ -0,0 +1 @@
|
|||
# Empty
|
|
@ -0,0 +1,105 @@
|
|||
// See the file "COPYING" in the main distribution directory for copyright.
|
||||
|
||||
#include "Factory.h"
|
||||
|
||||
#include <memory>
|
||||
|
||||
#include "zeek/ID.h"
|
||||
#include "zeek/Val.h"
|
||||
#include "zeek/iosource/Packet.h"
|
||||
#include "zeek/packet_analysis/Analyzer.h"
|
||||
#include "zeek/packet_analysis/Manager.h"
|
||||
#include "zeek/packet_analysis/protocol/ip/conn_key/IPBasedConnKey.h"
|
||||
#include "zeek/packet_analysis/protocol/ip/conn_key/fivetuple/Factory.h"
|
||||
#include "zeek/util-types.h"
|
||||
|
||||
namespace zeek::conn_key::vxlan_vni_fivetuple {
|
||||
|
||||
class VxlanVniConnKey : public zeek::IPBasedConnKey {
|
||||
public:
|
||||
VxlanVniConnKey() {
|
||||
// Ensure padding holes in the key struct are filled with zeroes.
|
||||
memset(static_cast<void*>(&key), 0, sizeof(key));
|
||||
}
|
||||
|
||||
detail::PackedConnTuple& PackedTuple() override { return key.tuple; }
|
||||
|
||||
const detail::PackedConnTuple& PackedTuple() const override { return key.tuple; }
|
||||
|
||||
protected:
|
||||
zeek::session::detail::Key DoSessionKey() const override {
|
||||
return {reinterpret_cast<const void*>(&key), sizeof(key), session::detail::Key::CONNECTION_KEY_TYPE};
|
||||
}
|
||||
|
||||
void DoPopulateConnIdVal(zeek::RecordVal& conn_id, zeek::RecordVal& ctx) override {
|
||||
// Base class populates conn_id fields (orig_h, orig_p, resp_h, resp_p)
|
||||
zeek::IPBasedConnKey::DoPopulateConnIdVal(conn_id, ctx);
|
||||
|
||||
if ( conn_id.GetType() != id::conn_id )
|
||||
return;
|
||||
|
||||
if ( (key.vxlan_vni & 0xFF000000) == 0 ) // High-bits unset: Have VNI
|
||||
ctx.Assign(GetVxlanVniOffset(), static_cast<zeek_uint_t>(key.vxlan_vni));
|
||||
else
|
||||
ctx.Remove(GetVxlanVniOffset());
|
||||
}
|
||||
|
||||
// Extract VNI from most outer VXLAN layer.
|
||||
void DoInit(const Packet& pkt) override {
|
||||
static const auto& analyzer = zeek::packet_mgr->GetAnalyzer("VXLAN");
|
||||
|
||||
// Set the high-bits: This is needed because keys can get reused.
|
||||
key.vxlan_vni = 0xFF000000;
|
||||
|
||||
if ( ! analyzer || ! analyzer->IsEnabled() )
|
||||
return;
|
||||
|
||||
auto spans = zeek::packet_mgr->GetAnalyzerData(analyzer);
|
||||
|
||||
if ( spans.empty() || spans[0].size() < 8 )
|
||||
return;
|
||||
|
||||
key.vxlan_vni = spans[0][4] << 16 | spans[0][5] << 8 | spans[0][6];
|
||||
}
|
||||
|
||||
static int GetVxlanVniOffset() {
|
||||
static const auto& conn_id_ctx = zeek::id::find_type<zeek::RecordType>("conn_id_ctx");
|
||||
static int vxlan_vni_offset = conn_id_ctx->FieldOffset("vxlan_vni");
|
||||
return vxlan_vni_offset;
|
||||
}
|
||||
|
||||
private:
|
||||
friend class Factory;
|
||||
|
||||
struct {
|
||||
struct detail::PackedConnTuple tuple;
|
||||
uint32_t vxlan_vni;
|
||||
} __attribute__((packed, aligned)) key; // packed and aligned due to usage for hashing
|
||||
};
|
||||
|
||||
zeek::ConnKeyPtr Factory::DoNewConnKey() const { return std::make_unique<VxlanVniConnKey>(); }
|
||||
|
||||
zeek::expected<zeek::ConnKeyPtr, std::string> Factory::DoConnKeyFromVal(const zeek::Val& v) const {
|
||||
if ( v.GetType() != id::conn_id )
|
||||
return zeek::unexpected<std::string>{"unexpected value type"};
|
||||
|
||||
auto ck = zeek::conn_key::fivetuple::Factory::DoConnKeyFromVal(v);
|
||||
if ( ! ck.has_value() )
|
||||
return ck;
|
||||
|
||||
int vxlan_vni_offset = VxlanVniConnKey::GetVxlanVniOffset();
|
||||
static int ctx_offset = id::conn_id->FieldOffset("ctx");
|
||||
|
||||
auto* k = static_cast<VxlanVniConnKey*>(ck.value().get());
|
||||
auto* ctx = v.AsRecordVal()->GetFieldAs<zeek::RecordVal>(ctx_offset);
|
||||
|
||||
if ( vxlan_vni_offset < 0 )
|
||||
return zeek::unexpected<std::string>{"missing vlxan_vni field"};
|
||||
|
||||
if ( ctx->HasField(vxlan_vni_offset) )
|
||||
k->key.vxlan_vni = ctx->GetFieldAs<zeek::CountVal>(vxlan_vni_offset);
|
||||
|
||||
return ck;
|
||||
}
|
||||
|
||||
} // namespace zeek::conn_key::vxlan_vni_fivetuple
|
|
@ -0,0 +1,18 @@
|
|||
#pragma once
|
||||
|
||||
#include "zeek/ConnKey.h"
|
||||
#include "zeek/packet_analysis/protocol/ip/conn_key/fivetuple/Factory.h"
|
||||
|
||||
namespace zeek::conn_key::vxlan_vni_fivetuple {
|
||||
|
||||
class Factory : public zeek::conn_key::fivetuple::Factory {
|
||||
public:
|
||||
static zeek::conn_key::FactoryPtr Instantiate() { return std::make_unique<Factory>(); }
|
||||
|
||||
private:
|
||||
// Returns a VxlanVniConnKey instance.
|
||||
zeek::ConnKeyPtr DoNewConnKey() const override;
|
||||
zeek::expected<zeek::ConnKeyPtr, std::string> DoConnKeyFromVal(const zeek::Val& v) const override;
|
||||
};
|
||||
|
||||
} // namespace zeek::conn_key::vxlan_vni_fivetuple
|
|
@ -0,0 +1,26 @@
|
|||
|
||||
#include "Plugin.h"
|
||||
|
||||
#include <zeek/conn_key/Component.h>
|
||||
|
||||
#include "Factory.h"
|
||||
|
||||
namespace plugin {
|
||||
namespace Zeek_ConnKey_Vxlan_Vni_Fivetuple {
|
||||
Plugin plugin;
|
||||
}
|
||||
} // namespace plugin
|
||||
|
||||
using namespace plugin::Zeek_ConnKey_Vxlan_Vni_Fivetuple;
|
||||
|
||||
zeek::plugin::Configuration Plugin::Configure() {
|
||||
zeek::plugin::Configuration config;
|
||||
config.name = "Zeek::ConnKey_Vxlan_Vni_Fivetuple";
|
||||
config.description = "ConnKey implementation using the most outer VXLAN VNI";
|
||||
config.version = {0, 1, 0};
|
||||
|
||||
AddComponent(new zeek::conn_key::Component("VXLAN_VNI_FIVETUPLE",
|
||||
zeek::conn_key::vxlan_vni_fivetuple::Factory::Instantiate));
|
||||
|
||||
return config;
|
||||
}
|
|
@ -0,0 +1,17 @@
|
|||
|
||||
#pragma once
|
||||
|
||||
#include <zeek/plugin/Plugin.h>
|
||||
|
||||
namespace plugin {
|
||||
namespace Zeek_ConnKey_Vxlan_Vni_Fivetuple {
|
||||
|
||||
class Plugin : public zeek::plugin::Plugin {
|
||||
protected:
|
||||
zeek::plugin::Configuration Configure() override;
|
||||
};
|
||||
|
||||
extern Plugin plugin;
|
||||
|
||||
} // namespace Zeek_ConnKey_Vxlan_Vni_Fivetuple
|
||||
} // namespace plugin
|
3
doc/devel/plugins/event-metadata-plugin-src/.gitignore
vendored
Normal file
3
doc/devel/plugins/event-metadata-plugin-src/.gitignore
vendored
Normal file
|
@ -0,0 +1,3 @@
|
|||
build
|
||||
*.log
|
||||
.state
|
|
@ -0,0 +1,9 @@
|
|||
cmake_minimum_required(VERSION 3.15 FATAL_ERROR)
|
||||
|
||||
project(ZeekPluginEventLatency)
|
||||
|
||||
include(ZeekPlugin)
|
||||
|
||||
zeek_add_plugin(
|
||||
Zeek EventLatency
|
||||
SOURCES src/Plugin.cc SCRIPT_FILES scripts/__load__.zeek)
|
26
doc/devel/plugins/event-metadata-plugin-src/COPYING
Normal file
26
doc/devel/plugins/event-metadata-plugin-src/COPYING
Normal file
|
@ -0,0 +1,26 @@
|
|||
Copyright (c) 2025 by the Zeek Project. All rights reserved.
|
||||
|
||||
Redistribution and use in source and binary forms, with or without modification,
|
||||
are permitted provided that the following conditions are met:
|
||||
|
||||
1. Redistributions of source code must retain the above copyright notice, this
|
||||
list of conditions and the following disclaimer.
|
||||
|
||||
2. Redistributions in binary form must reproduce the above copyright notice,
|
||||
this list of conditions and the following disclaimer in the documentation
|
||||
and/or other materials provided with the distribution.
|
||||
|
||||
3. Neither the name of the copyright holder nor the names of its contributors
|
||||
may be used to endorse or promote products derived from this software
|
||||
without specific prior written permission.
|
||||
|
||||
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
||||
ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
||||
WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||||
DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE FOR
|
||||
ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
|
||||
(INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
||||
LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON
|
||||
ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
||||
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
|
||||
SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
23
doc/devel/plugins/event-metadata-plugin-src/Makefile
Normal file
23
doc/devel/plugins/event-metadata-plugin-src/Makefile
Normal file
|
@ -0,0 +1,23 @@
|
|||
#
|
||||
# Convenience Makefile providing a few common top-level targets.
|
||||
#
|
||||
|
||||
cmake_build_dir=build
|
||||
arch=`uname -s | tr A-Z a-z`-`uname -m`
|
||||
|
||||
all: build-it
|
||||
|
||||
build-it:
|
||||
( cd $(cmake_build_dir) && make )
|
||||
|
||||
install:
|
||||
( cd $(cmake_build_dir) && make install )
|
||||
|
||||
clean:
|
||||
( cd $(cmake_build_dir) && make clean )
|
||||
|
||||
distclean:
|
||||
rm -rf $(cmake_build_dir)
|
||||
|
||||
test:
|
||||
make -C tests
|
0
doc/devel/plugins/event-metadata-plugin-src/README
Normal file
0
doc/devel/plugins/event-metadata-plugin-src/README
Normal file
1
doc/devel/plugins/event-metadata-plugin-src/VERSION
Normal file
1
doc/devel/plugins/event-metadata-plugin-src/VERSION
Normal file
|
@ -0,0 +1 @@
|
|||
0.1.0
|
193
doc/devel/plugins/event-metadata-plugin-src/configure
vendored
Executable file
193
doc/devel/plugins/event-metadata-plugin-src/configure
vendored
Executable file
|
@ -0,0 +1,193 @@
|
|||
#!/bin/sh
|
||||
#
|
||||
# Wrapper for viewing/setting options that the plugin's CMake
|
||||
# scripts will recognize.
|
||||
#
|
||||
# Don't edit this. Edit configure.plugin to add plugin-specific options.
|
||||
#
|
||||
|
||||
set -e
|
||||
command="$0 $*"
|
||||
|
||||
if [ -e $(dirname $0)/configure.plugin ]; then
|
||||
# Include custom additions.
|
||||
. $(dirname $0)/configure.plugin
|
||||
fi
|
||||
|
||||
usage() {
|
||||
|
||||
cat 1>&2 <<EOF
|
||||
Usage: $0 [OPTIONS]
|
||||
|
||||
Plugin Options:
|
||||
--cmake=PATH Path to CMake binary
|
||||
--zeek-dist=DIR Path to Zeek source tree
|
||||
--install-root=DIR Path where to install plugin into
|
||||
--with-binpac=DIR Path to BinPAC installation root
|
||||
--with-broker=DIR Path to Broker installation root
|
||||
--with-bifcl=PATH Path to bifcl executable
|
||||
--enable-debug Compile in debugging mode
|
||||
--disable-cpp-tests Don't build C++ unit tests
|
||||
EOF
|
||||
|
||||
if type plugin_usage >/dev/null 2>&1; then
|
||||
plugin_usage 1>&2
|
||||
fi
|
||||
|
||||
echo
|
||||
|
||||
exit 1
|
||||
}
|
||||
|
||||
# Function to append a CMake cache entry definition to the
|
||||
# CMakeCacheEntries variable
|
||||
# $1 is the cache entry variable name
|
||||
# $2 is the cache entry variable type
|
||||
# $3 is the cache entry variable value
|
||||
append_cache_entry() {
|
||||
CMakeCacheEntries="$CMakeCacheEntries -D $1:$2=$3"
|
||||
}
|
||||
|
||||
# set defaults
|
||||
builddir=build
|
||||
zeekdist=""
|
||||
installroot="default"
|
||||
zeek_plugin_begin_opts=""
|
||||
CMakeCacheEntries=""
|
||||
|
||||
while [ $# -ne 0 ]; do
|
||||
case "$1" in
|
||||
-*=*) optarg=$(echo "$1" | sed 's/[-_a-zA-Z0-9]*=//') ;;
|
||||
*) optarg= ;;
|
||||
esac
|
||||
|
||||
case "$1" in
|
||||
--help | -h)
|
||||
usage
|
||||
;;
|
||||
|
||||
--cmake=*)
|
||||
CMakeCommand=$optarg
|
||||
;;
|
||||
|
||||
--zeek-dist=*)
|
||||
zeekdist=$(cd $optarg && pwd)
|
||||
;;
|
||||
|
||||
--install-root=*)
|
||||
installroot=$optarg
|
||||
;;
|
||||
|
||||
--with-binpac=*)
|
||||
append_cache_entry BinPAC_ROOT_DIR PATH $optarg
|
||||
binpac_root=$optarg
|
||||
;;
|
||||
|
||||
--with-broker=*)
|
||||
append_cache_entry BROKER_ROOT_DIR PATH $optarg
|
||||
broker_root=$optarg
|
||||
;;
|
||||
|
||||
--with-bifcl=*)
|
||||
append_cache_entry BifCl_EXE PATH $optarg
|
||||
;;
|
||||
|
||||
--enable-debug)
|
||||
append_cache_entry BRO_PLUGIN_ENABLE_DEBUG BOOL true
|
||||
;;
|
||||
|
||||
--disable-cpp-tests)
|
||||
zeek_plugin_begin_opts="DISABLE_CPP_TESTS;$zeek_plugin_begin_opts"
|
||||
;;
|
||||
|
||||
*)
|
||||
if type plugin_option >/dev/null 2>&1; then
|
||||
plugin_option $1 && shift && continue
|
||||
fi
|
||||
|
||||
echo "Invalid option '$1'. Try $0 --help to see available options."
|
||||
exit 1
|
||||
;;
|
||||
esac
|
||||
shift
|
||||
done
|
||||
|
||||
if [ -z "$CMakeCommand" ]; then
|
||||
# prefer cmake3 over "regular" cmake (cmake == cmake2 on RHEL)
|
||||
if command -v cmake3 >/dev/null 2>&1; then
|
||||
CMakeCommand="cmake3"
|
||||
elif command -v cmake >/dev/null 2>&1; then
|
||||
CMakeCommand="cmake"
|
||||
else
|
||||
echo "This plugin requires CMake, please install it first."
|
||||
echo "Then you may use this script to configure the CMake build."
|
||||
echo "Note: pass --cmake=PATH to use cmake in non-standard locations."
|
||||
exit 1
|
||||
fi
|
||||
fi
|
||||
|
||||
if [ -z "$zeekdist" ]; then
|
||||
if type zeek-config >/dev/null 2>&1; then
|
||||
zeek_config="zeek-config"
|
||||
else
|
||||
echo "Either 'zeek-config' must be in PATH or '--zeek-dist=<path>' used"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
append_cache_entry BRO_CONFIG_PREFIX PATH $(${zeek_config} --prefix)
|
||||
append_cache_entry BRO_CONFIG_INCLUDE_DIR PATH $(${zeek_config} --include_dir)
|
||||
append_cache_entry BRO_CONFIG_PLUGIN_DIR PATH $(${zeek_config} --plugin_dir)
|
||||
append_cache_entry BRO_CONFIG_LIB_DIR PATH $(${zeek_config} --lib_dir)
|
||||
append_cache_entry BRO_CONFIG_CMAKE_DIR PATH $(${zeek_config} --cmake_dir)
|
||||
append_cache_entry CMAKE_MODULE_PATH PATH $(${zeek_config} --cmake_dir)
|
||||
|
||||
build_type=$(${zeek_config} --build_type)
|
||||
|
||||
if [ "$build_type" = "debug" ]; then
|
||||
append_cache_entry BRO_PLUGIN_ENABLE_DEBUG BOOL true
|
||||
fi
|
||||
|
||||
if [ -z "$binpac_root" ]; then
|
||||
append_cache_entry BinPAC_ROOT_DIR PATH $(${zeek_config} --binpac_root)
|
||||
fi
|
||||
|
||||
if [ -z "$broker_root" ]; then
|
||||
append_cache_entry BROKER_ROOT_DIR PATH $(${zeek_config} --broker_root)
|
||||
fi
|
||||
else
|
||||
if [ ! -e "$zeekdist/zeek-path-dev.in" ]; then
|
||||
echo "$zeekdist does not appear to be a valid Zeek source tree."
|
||||
exit 1
|
||||
fi
|
||||
|
||||
# BRO_DIST is the canonical/historical name used by plugin CMake scripts
|
||||
# ZEEK_DIST doesn't serve a function at the moment, but set/provided anyway
|
||||
append_cache_entry BRO_DIST PATH $zeekdist
|
||||
append_cache_entry ZEEK_DIST PATH $zeekdist
|
||||
append_cache_entry CMAKE_MODULE_PATH PATH $zeekdist/cmake
|
||||
fi
|
||||
|
||||
if [ "$installroot" != "default" ]; then
|
||||
mkdir -p $installroot
|
||||
append_cache_entry BRO_PLUGIN_INSTALL_ROOT PATH $installroot
|
||||
fi
|
||||
|
||||
if [ -n "$zeek_plugin_begin_opts" ]; then
|
||||
append_cache_entry ZEEK_PLUGIN_BEGIN_OPTS STRING "$zeek_plugin_begin_opts"
|
||||
fi
|
||||
|
||||
if type plugin_addl >/dev/null 2>&1; then
|
||||
plugin_addl
|
||||
fi
|
||||
|
||||
echo "Build Directory : $builddir"
|
||||
echo "Zeek Source Directory : $zeekdist"
|
||||
|
||||
mkdir -p $builddir
|
||||
cd $builddir
|
||||
|
||||
"$CMakeCommand" $CMakeCacheEntries ..
|
||||
|
||||
echo "# This is the command used to configure this build" >config.status
|
||||
echo $command >>config.status
|
||||
chmod u+x config.status
|
|
@ -0,0 +1,11 @@
|
|||
module EventLatency;
|
||||
|
||||
redef enum EventMetadata::ID += {
|
||||
## Identifier for the absolute time at which Zeek published this event.
|
||||
WALLCLOCK_TIMESTAMP = 10001000,
|
||||
};
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
assert EventMetadata::register(WALLCLOCK_TIMESTAMP, time);
|
||||
}
|
|
@ -0,0 +1 @@
|
|||
# Empty
|
65
doc/devel/plugins/event-metadata-plugin-src/src/Plugin.cc
Normal file
65
doc/devel/plugins/event-metadata-plugin-src/src/Plugin.cc
Normal file
|
@ -0,0 +1,65 @@
|
|||
|
||||
#include "Plugin.h"
|
||||
|
||||
#include <zeek/Event.h>
|
||||
#include <zeek/Val.h>
|
||||
#include <zeek/cluster/Backend.h>
|
||||
#include <zeek/plugin/Plugin.h>
|
||||
#include <zeek/telemetry/Manager.h>
|
||||
|
||||
namespace plugin {
|
||||
namespace Zeek_EventLatency {
|
||||
Plugin plugin;
|
||||
}
|
||||
} // namespace plugin
|
||||
|
||||
using namespace plugin::Zeek_EventLatency;
|
||||
|
||||
zeek::plugin::Configuration Plugin::Configure() {
|
||||
zeek::plugin::Configuration config;
|
||||
config.name = "Zeek::EventLatency";
|
||||
config.description = "Track remote event latencies";
|
||||
config.version = {0, 1, 0};
|
||||
EnableHook(zeek::plugin::HOOK_PUBLISH_EVENT);
|
||||
EnableHook(zeek::plugin::HOOK_QUEUE_EVENT);
|
||||
return config;
|
||||
}
|
||||
|
||||
void Plugin::InitPostScript() {
|
||||
double bounds[] = {0.0002, 0.0004, 0.0006, 0.0008, 0.0010, 0.0012, 0.0014, 0.0016, 0.0018, 0.0020};
|
||||
histogram =
|
||||
zeek::telemetry_mgr->HistogramInstance("zeek", "cluster_event_latency_seconds", {}, bounds, "event latency");
|
||||
}
|
||||
|
||||
bool Plugin::HookPublishEvent(zeek::cluster::Backend& backend, const std::string& topic,
|
||||
zeek::cluster::detail::Event& event) {
|
||||
static const auto& wallclock_id = zeek::id::find_val<zeek::EnumVal>("EventLatency::WALLCLOCK_TIMESTAMP");
|
||||
|
||||
auto now_val = zeek::make_intrusive<zeek::TimeVal>(zeek::util::current_time(/*real=*/true));
|
||||
|
||||
if ( ! event.AddMetadata(wallclock_id, now_val) )
|
||||
zeek::reporter->FatalError("failed to add wallclock timestamp metadata");
|
||||
|
||||
return true;
|
||||
}
|
||||
|
||||
bool Plugin::HookQueueEvent(zeek::Event* event) {
|
||||
static const auto& wallclock_id = zeek::id::find_val<zeek::EnumVal>("EventLatency::WALLCLOCK_TIMESTAMP");
|
||||
|
||||
if ( event->Source() == zeek::util::detail::SOURCE_LOCAL )
|
||||
return false;
|
||||
|
||||
auto timestamps = event->MetadataValues(wallclock_id);
|
||||
|
||||
if ( timestamps->Size() > 0 ) {
|
||||
double remote_ts = timestamps->ValAt(0)->AsTime();
|
||||
auto now = zeek::util::current_time(/*real=*/true);
|
||||
auto latency = std::max(0.0, now - remote_ts);
|
||||
|
||||
histogram->Observe(latency);
|
||||
}
|
||||
else
|
||||
zeek::reporter->Warning("missing wallclock timestamp metadata");
|
||||
|
||||
return false;
|
||||
}
|
29
doc/devel/plugins/event-metadata-plugin-src/src/Plugin.h
Normal file
29
doc/devel/plugins/event-metadata-plugin-src/src/Plugin.h
Normal file
|
@ -0,0 +1,29 @@
|
|||
|
||||
#pragma once
|
||||
|
||||
#include <zeek/plugin/Plugin.h>
|
||||
#include <zeek/telemetry/Histogram.h>
|
||||
|
||||
namespace plugin {
|
||||
namespace Zeek_EventLatency {
|
||||
|
||||
class Plugin : public zeek::plugin::Plugin {
|
||||
protected:
|
||||
// Overridden from zeek::plugin::Plugin.
|
||||
zeek::plugin::Configuration Configure() override;
|
||||
|
||||
void InitPostScript() override;
|
||||
|
||||
bool HookPublishEvent(zeek::cluster::Backend& backend, const std::string& topic,
|
||||
zeek::cluster::detail::Event& event) override;
|
||||
|
||||
bool HookQueueEvent(zeek::Event* event) override;
|
||||
|
||||
private:
|
||||
zeek::telemetry::HistogramPtr histogram;
|
||||
};
|
||||
|
||||
extern Plugin plugin;
|
||||
|
||||
} // namespace Zeek_EventLatency
|
||||
} // namespace plugin
|
103
doc/devel/plugins/event-metadata-plugin.rst
Normal file
103
doc/devel/plugins/event-metadata-plugin.rst
Normal file
|
@ -0,0 +1,103 @@
|
|||
.. _event-metadata-plugin:
|
||||
|
||||
=====================
|
||||
Event Metadata Plugin
|
||||
=====================
|
||||
|
||||
.. versionadded:: 8.0
|
||||
|
||||
|
||||
Zeek's plugin API allows adding metadata to Zeek events. In the Zeek-script
|
||||
layer, the :zeek:see:`EventMetadata::current` and :zeek:see:`EventMetadata::current_all`
|
||||
functions can be used to introspect metadata attached to events. In a Zeek cluster,
|
||||
metadata is transported via remote events for consumption by other Zeek nodes.
|
||||
This section describes the functionality in form of a tutorial. We'll
|
||||
be using custom event metadata to track the latency of Zeek events in a
|
||||
cluster and expose them as a Prometheus histogram.
|
||||
|
||||
If you're unfamiliar with plugin development, head over to the
|
||||
:ref:`Writing Plugins <writing-plugins>` section. For more information
|
||||
about telemetry and Prometheus, see also the :ref:`Telemetry framework's <framework-telemetry>`
|
||||
documentation.
|
||||
|
||||
|
||||
Registering Metadata
|
||||
====================
|
||||
|
||||
Initially, we make Zeek's core aware of the metadata to attach to events. This
|
||||
requires two steps.
|
||||
First, redefining the :zeek:see:`EventMetadata::ID` enumeration with our
|
||||
custom enumeration value ``WALLCLOCK_TIMESTAMP``. This is our metadata identifier.
|
||||
Its value represents the Unix timestamps when an event was published.
|
||||
Second, registering the metadata identifier with Zeek's :zeek:see:`time` type
|
||||
by calling :zeek:see:`EventMetadata::register` in a :zeek:see:`zeek_init` handler.
|
||||
This instructs Zeek to convert metadata items in received remote events with
|
||||
identifier ``10001000`` to a :zeek:see:`time` value.
|
||||
|
||||
For simplicity, the second step is done in the plugin's ``scripts/__load__.zeek`` file
|
||||
that's loaded automatically when Zeek loads the plugin.
|
||||
|
||||
.. literalinclude:: event-metadata-plugin-src/scripts/__load__.zeek
|
||||
:caption: __load__.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
The ``10001000`` represents the metadata identifier for serialization purposes. It
|
||||
needs to be unique and have a defined meaning and consistent type for a given Zeek
|
||||
deployment. Metadata identifiers below ``200`` are reserved for Zeek's internal use.
|
||||
Users are free to choose any other value. Zeek will fail to start or fail to
|
||||
register the type in the case of conflicting identifiers in third-party packages.
|
||||
|
||||
|
||||
Implementing the Plugin
|
||||
=======================
|
||||
|
||||
Next, we implement the ``InitPostScript()``, ``HookPublishEvent()`` and
|
||||
``HookQueueEvent()`` methods in our plugin.
|
||||
In the ``InitPostScript()`` method, a histogram instance is initialized using
|
||||
Zeek's telemetry manager with hard-coded bounds. These define buckets for latency
|
||||
monitoring.
|
||||
The ``HookPublishEvent()`` method adds ``WALLCLOCK_TIMESTAMP`` metadata with
|
||||
the current time to the event, while the ``HookQueueEvent()`` method extracts
|
||||
the sender's timestamp and computes the latency based on its own local time.
|
||||
Finally, the latency is recorded with the histogram by calling ``Observe()``.
|
||||
|
||||
|
||||
.. literalinclude:: event-metadata-plugin-src/src/Plugin.cc
|
||||
:caption: src/Plugin.cc
|
||||
:language: c++
|
||||
:linenos:
|
||||
:lines: 28-
|
||||
:tab-width: 4
|
||||
|
||||
|
||||
Resulting Prometheus Metrics
|
||||
============================
|
||||
|
||||
Deploying the plugin outlined above in a cluster and querying the manager's
|
||||
metrics endpoint presents the following result::
|
||||
|
||||
$ curl -s localhost:10001/metrics | grep '^zeek_cluster_event_latency'
|
||||
zeek_cluster_event_latency_seconds_count{endpoint="manager"} 11281
|
||||
zeek_cluster_event_latency_seconds_sum{endpoint="manager"} 7.960928916931152
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0002"} 37
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0004"} 583
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0005999999999999999"} 3858
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0008"} 7960
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.001"} 10185
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0012"} 10957
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0014"} 11239
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0016"} 11269
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.0018"} 11279
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="0.002"} 11281
|
||||
zeek_cluster_event_latency_seconds_bucket{endpoint="manager",le="+Inf"} 11281
|
||||
|
||||
|
||||
This example indicates that there were a total of 11281 latencies observed,
|
||||
the summed-up latency was around 8 seconds, 37 events had a latency less than or equal
|
||||
to 0.2 milliseconds, 583 had a latency less than or equal to 0.4 milliseconds, and none
|
||||
that took more than 2 milliseconds.
|
||||
|
||||
This sort of data is usually scraped and ingested by a `Prometheus server <https://prometheus.io/>`_ and
|
||||
then visualized using `Grafana <https://grafana.com/>`_.
|
46
doc/devel/spicy/autogen-spicy-docs
Executable file
46
doc/devel/spicy/autogen-spicy-docs
Executable file
|
@ -0,0 +1,46 @@
|
|||
#!/bin/bash
|
||||
#
|
||||
# Copyright (c) 2020-2023 by the Zeek Project. See LICENSE for details.
|
||||
#
|
||||
# Tool to update autogenerated docs that require external files. Must be
|
||||
# run manually and requires access to the Spicy TFTP analyzer.
|
||||
|
||||
set -e
|
||||
|
||||
if [ $# != 1 ]; then
|
||||
echo "usage: $(basename "$0") <spicy-tftp-repo>"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
TFTP=$1
|
||||
|
||||
if [ ! -d "${TFTP}"/analyzer ]; then
|
||||
echo "${TFTP} does not seem to point to a spicy-tftp repository."
|
||||
exit 1
|
||||
fi
|
||||
|
||||
set -o errexit
|
||||
set -o nounset
|
||||
|
||||
ZEEK="$(cd "$(dirname "${BASH_SOURCE[0]}")" >/dev/null 2>&1 && pwd)/../../.."
|
||||
DOC="${ZEEK}/doc"
|
||||
SPICY="${ZEEK}/auxil/spicy"
|
||||
SPICYDOC="${ZEEK}/build/auxil/spicy/bin/spicy-doc"
|
||||
AUTOGEN_FINAL="${ZEEK}/doc/devel/spicy/autogen"
|
||||
|
||||
if [ ! -x "${SPICYDOC}" ]; then
|
||||
>&2 echo "Warning: Could not find spicy-doc in build directory, aborting"
|
||||
exit 0
|
||||
fi
|
||||
|
||||
"${SPICY}/doc/scripts/autogen-spicy-lib" functions zeek <"${ZEEK}/scripts/spicy/zeek.spicy" >"${AUTOGEN_FINAL}/zeek-functions.spicy" || exit 1
|
||||
|
||||
# Copy some static files over.
|
||||
cp "${TFTP}"/scripts/main.zeek "${AUTOGEN_FINAL}"/tftp.zeek || exit 1
|
||||
cp "${TFTP}"/analyzer/tftp.spicy "${AUTOGEN_FINAL}"/tftp.spicy || exit 1
|
||||
cp "${TFTP}"/analyzer/tftp.evt "${AUTOGEN_FINAL}"/tftp.evt || exit 1
|
||||
|
||||
# Copy some files from the Zeek source tree so that zeek-docs remains standalone for CI.
|
||||
cp "${ZEEK}/scripts/base/frameworks/spicy/init-bare.zeek" "${AUTOGEN_FINAL}/"
|
||||
cp "${ZEEK}/scripts/base/frameworks/spicy/init-framework.zeek" "${AUTOGEN_FINAL}/"
|
||||
cp "${ZEEK}/auxil/spicy/doc/scripts/spicy-pygments.py" "${DOC}/ext"
|
38
doc/devel/spicy/autogen/init-bare.zeek
Normal file
38
doc/devel/spicy/autogen/init-bare.zeek
Normal file
|
@ -0,0 +1,38 @@
|
|||
|
||||
module Spicy;
|
||||
|
||||
export {
|
||||
# doc-options-start
|
||||
## Constant for testing if Spicy is available.
|
||||
const available = T;
|
||||
|
||||
## Show output of Spicy print statements.
|
||||
const enable_print = F &redef;
|
||||
|
||||
## Record and display profiling information, if compiled into analyzer.
|
||||
const enable_profiling = F &redef;
|
||||
|
||||
## abort() instead of throwing HILTI exceptions.
|
||||
const abort_on_exceptions = F &redef;
|
||||
|
||||
## Include backtraces when reporting unhandled exceptions.
|
||||
const show_backtraces = F &redef;
|
||||
|
||||
## Maximum depth of recursive file analysis (Spicy analyzers only)
|
||||
const max_file_depth: count = 5 &redef;
|
||||
# doc-options-end
|
||||
|
||||
# doc-types-start
|
||||
## Result type for :zeek:see:`Spicy::resource_usage`. The values reflect resource
|
||||
## usage as reported by the Spicy runtime system.
|
||||
type ResourceUsage: record {
|
||||
user_time : interval; ##< user CPU time of the Zeek process
|
||||
system_time :interval; ##< system CPU time of the Zeek process
|
||||
memory_heap : count; ##< memory allocated on the heap by the Zeek process
|
||||
num_fibers : count; ##< number of fibers currently in use
|
||||
max_fibers: count; ##< maximum number of fibers ever in use
|
||||
max_fiber_stack_size: count; ##< maximum fiber stack size ever in use
|
||||
cached_fibers: count; ##< number of fibers currently cached
|
||||
};
|
||||
# doc-types-end
|
||||
}
|
85
doc/devel/spicy/autogen/init-framework.zeek
Normal file
85
doc/devel/spicy/autogen/init-framework.zeek
Normal file
|
@ -0,0 +1,85 @@
|
|||
# doc-common-start
|
||||
module Spicy;
|
||||
|
||||
export {
|
||||
# doc-functions-start
|
||||
## Enable a specific Spicy protocol analyzer if not already active. If this
|
||||
## analyzer replaces a standard analyzer, that one will automatically be
|
||||
## disabled.
|
||||
##
|
||||
## tag: analyzer to toggle
|
||||
##
|
||||
## Returns: true if the operation succeeded
|
||||
global enable_protocol_analyzer: function(tag: Analyzer::Tag) : bool;
|
||||
|
||||
## Disable a specific Spicy protocol analyzer if not already inactive. If
|
||||
## this analyzer replaces a standard analyzer, that one will automatically
|
||||
## be re-enabled.
|
||||
##
|
||||
## tag: analyzer to toggle
|
||||
##
|
||||
## Returns: true if the operation succeeded
|
||||
global disable_protocol_analyzer: function(tag: Analyzer::Tag) : bool;
|
||||
|
||||
|
||||
## Enable a specific Spicy file analyzer if not already active. If this
|
||||
## analyzer replaces a standard analyzer, that one will automatically be
|
||||
## disabled.
|
||||
##
|
||||
## tag: analyzer to toggle
|
||||
##
|
||||
## Returns: true if the operation succeeded
|
||||
global enable_file_analyzer: function(tag: Files::Tag) : bool;
|
||||
|
||||
## Disable a specific Spicy file analyzer if not already inactive. If
|
||||
## this analyzer replaces a standard analyzer, that one will automatically
|
||||
## be re-enabled.
|
||||
##
|
||||
## tag: analyzer to toggle
|
||||
##
|
||||
## Returns: true if the operation succeeded
|
||||
global disable_file_analyzer: function(tag: Files::Tag) : bool;
|
||||
|
||||
## Returns current resource usage as reported by the Spicy runtime system.
|
||||
global resource_usage: function() : ResourceUsage;
|
||||
# doc-functions-end
|
||||
}
|
||||
|
||||
# Marked with &is_used to suppress complaints when there aren't any
|
||||
# Spicy file analyzers loaded, and hence this event can't be generated.
|
||||
event spicy_analyzer_for_mime_type(a: Files::Tag, mt: string) &is_used
|
||||
{
|
||||
Files::register_for_mime_type(a, mt);
|
||||
}
|
||||
|
||||
# Marked with &is_used to suppress complaints when there aren't any
|
||||
# Spicy protocol analyzers loaded, and hence this event can't be generated.
|
||||
event spicy_analyzer_for_port(a: Analyzer::Tag, p: port) &is_used
|
||||
{
|
||||
Analyzer::register_for_port(a, p);
|
||||
}
|
||||
|
||||
function enable_protocol_analyzer(tag: Analyzer::Tag) : bool
|
||||
{
|
||||
return Spicy::__toggle_analyzer(tag, T);
|
||||
}
|
||||
|
||||
function disable_protocol_analyzer(tag: Analyzer::Tag) : bool
|
||||
{
|
||||
return Spicy::__toggle_analyzer(tag, F);
|
||||
}
|
||||
|
||||
function enable_file_analyzer(tag: Files::Tag) : bool
|
||||
{
|
||||
return Spicy::__toggle_analyzer(tag, T);
|
||||
}
|
||||
|
||||
function disable_file_analyzer(tag: Files::Tag) : bool
|
||||
{
|
||||
return Spicy::__toggle_analyzer(tag, F);
|
||||
}
|
||||
|
||||
function resource_usage() : ResourceUsage
|
||||
{
|
||||
return Spicy::__resource_usage();
|
||||
}
|
16
doc/devel/spicy/autogen/tftp.evt
Normal file
16
doc/devel/spicy/autogen/tftp.evt
Normal file
|
@ -0,0 +1,16 @@
|
|||
# Copyright (c) 2021 by the Zeek Project. See LICENSE for details.
|
||||
#
|
||||
# Note: When line numbers change in this file, update the documentation that pulls it in.
|
||||
|
||||
protocol analyzer spicy::TFTP over UDP:
|
||||
parse with TFTP::Packet,
|
||||
port 69/udp;
|
||||
|
||||
import TFTP;
|
||||
|
||||
on TFTP::Request if ( is_read ) -> event tftp::read_request($conn, $is_orig, self.filename, self.mode);
|
||||
on TFTP::Request if ( ! is_read ) -> event tftp::write_request($conn, $is_orig, self.filename, self.mode);
|
||||
|
||||
on TFTP::Data -> event tftp::data($conn, $is_orig, self.num, self.data);
|
||||
on TFTP::Acknowledgement -> event tftp::ack($conn, $is_orig, self.num);
|
||||
on TFTP::Error -> event tftp::error($conn, $is_orig, self.code, self.msg);
|
95
doc/devel/spicy/autogen/tftp.spicy
Normal file
95
doc/devel/spicy/autogen/tftp.spicy
Normal file
|
@ -0,0 +1,95 @@
|
|||
# Copyright (c) 2021 by the Zeek Project. See LICENSE for details.
|
||||
#
|
||||
# Trivial File Transfer Protocol
|
||||
#
|
||||
# Specs from https://tools.ietf.org/html/rfc1350
|
||||
|
||||
module TFTP;
|
||||
|
||||
import spicy;
|
||||
|
||||
# Common header for all messages:
|
||||
#
|
||||
# 2 bytes
|
||||
# ---------------
|
||||
# | TFTP Opcode |
|
||||
# ---------------
|
||||
|
||||
public type Packet = unit {
|
||||
# public top-level entry point for parsing
|
||||
op: uint16 &convert=Opcode($$);
|
||||
switch (self.op) {
|
||||
Opcode::RRQ -> rrq: Request(True);
|
||||
Opcode::WRQ -> wrq: Request(False);
|
||||
Opcode::DATA -> data: Data;
|
||||
Opcode::ACK -> ack: Acknowledgement;
|
||||
Opcode::ERROR -> error: Error;
|
||||
};
|
||||
};
|
||||
|
||||
# TFTP supports five types of packets [...]:
|
||||
#
|
||||
# opcode operation
|
||||
# 1 Read request (RRQ)
|
||||
# 2 Write request (WRQ)
|
||||
# 3 Data (DATA)
|
||||
# 4 Acknowledgment (ACK)
|
||||
# 5 Error (ERROR)
|
||||
type Opcode = enum {
|
||||
RRQ = 0x01,
|
||||
WRQ = 0x02,
|
||||
DATA = 0x03,
|
||||
ACK = 0x04,
|
||||
ERROR = 0x05,
|
||||
};
|
||||
|
||||
# Figure 5-1: RRQ/WRQ packet
|
||||
#
|
||||
# 2 bytes string 1 byte string 1 byte
|
||||
# ------------------------------------------------
|
||||
# | Opcode | Filename | 0 | Mode | 0 |
|
||||
# ------------------------------------------------
|
||||
|
||||
type Request = unit(is_read: bool) {
|
||||
filename: bytes &until=b"\x00";
|
||||
mode: bytes &until=b"\x00";
|
||||
|
||||
on %done {
|
||||
spicy::accept_input();
|
||||
}
|
||||
};
|
||||
|
||||
# Figure 5-2: DATA packet
|
||||
#
|
||||
# 2 bytes 2 bytes n bytes
|
||||
# ----------------------------------
|
||||
# | Opcode | Block # | Data |
|
||||
# ----------------------------------
|
||||
|
||||
type Data = unit {
|
||||
num: uint16;
|
||||
data: bytes &eod;
|
||||
};
|
||||
|
||||
# Figure 5-3: ACK packet
|
||||
#
|
||||
# 2 bytes 2 bytes
|
||||
# ---------------------
|
||||
# | Opcode | Block # |
|
||||
# ---------------------
|
||||
|
||||
type Acknowledgement = unit {
|
||||
num: uint16;
|
||||
};
|
||||
|
||||
# Figure 5-4: ERROR packet
|
||||
#
|
||||
# 2 bytes 2 bytes string 1 byte
|
||||
# -----------------------------------------
|
||||
# | Opcode | ErrorCode | ErrMsg | 0 |
|
||||
# -----------------------------------------
|
||||
|
||||
type Error = unit {
|
||||
code: uint16;
|
||||
msg: bytes &until=b"\x00";
|
||||
};
|
162
doc/devel/spicy/autogen/tftp.zeek
Normal file
162
doc/devel/spicy/autogen/tftp.zeek
Normal file
|
@ -0,0 +1,162 @@
|
|||
# Copyright (c) 2021 by the Zeek Project. See LICENSE for details.
|
||||
|
||||
module TFTP;
|
||||
|
||||
export {
|
||||
redef enum Log::ID += { LOG };
|
||||
|
||||
type Info: record {
|
||||
## Timestamp for when the request happened.
|
||||
ts: time &log;
|
||||
## Unique ID for the connection.
|
||||
uid: string &log;
|
||||
## The connection's 4-tuple of endpoint addresses/ports.
|
||||
id: conn_id &log;
|
||||
## True for write requests, False for read request.
|
||||
wrq: bool &log;
|
||||
## File name of request.
|
||||
fname: string &log;
|
||||
## Mode of request.
|
||||
mode: string &log;
|
||||
## UID of data connection
|
||||
uid_data: string &optional &log;
|
||||
## Number of bytes sent.
|
||||
size: count &default=0 &log;
|
||||
## Highest block number sent.
|
||||
block_sent: count &default=0 &log;
|
||||
## Highest block number acknowledged.
|
||||
block_acked: count &default=0 &log;
|
||||
## Any error code encountered.
|
||||
error_code: count &optional &log;
|
||||
## Any error message encountered.
|
||||
error_msg: string &optional &log;
|
||||
|
||||
# Set to block number of final piece of data once received.
|
||||
final_block: count &optional;
|
||||
|
||||
# Set to true once logged.
|
||||
done: bool &default=F;
|
||||
};
|
||||
|
||||
## Event that can be handled to access the TFTP logging record.
|
||||
global log_tftp: event(rec: Info);
|
||||
}
|
||||
|
||||
# Maps a partial data connection ID to the request's Info record.
|
||||
global expected_data_conns: table[addr, port, addr] of Info;
|
||||
|
||||
redef record connection += {
|
||||
tftp: Info &optional;
|
||||
};
|
||||
|
||||
event zeek_init() &priority=5
|
||||
{
|
||||
Log::create_stream(TFTP::LOG, [$columns = Info, $ev = log_tftp, $path="tftp"]);
|
||||
}
|
||||
|
||||
function log_pending(c: connection)
|
||||
{
|
||||
if ( ! c?$tftp || c$tftp$done )
|
||||
return;
|
||||
|
||||
Log::write(TFTP::LOG, c$tftp);
|
||||
c$tftp$done = T;
|
||||
}
|
||||
|
||||
function init_request(c: connection, is_orig: bool, fname: string, mode: string, is_read: bool)
|
||||
{
|
||||
log_pending(c);
|
||||
|
||||
local info: Info;
|
||||
info$ts = network_time();
|
||||
info$uid = c$uid;
|
||||
info$id = c$id;
|
||||
info$fname = fname;
|
||||
info$mode = mode;
|
||||
info$wrq = (! is_read);
|
||||
c$tftp = info;
|
||||
|
||||
# The data will come in from a different source port.
|
||||
Analyzer::schedule_analyzer(c$id$resp_h, c$id$orig_h, c$id$orig_p, Analyzer::ANALYZER_SPICY_TFTP, 1min);
|
||||
expected_data_conns[c$id$resp_h, c$id$orig_p, c$id$orig_h] = info;
|
||||
}
|
||||
|
||||
event scheduled_analyzer_applied(c: connection, a: Analyzer::Tag) &priority=10
|
||||
{
|
||||
local id = c$id;
|
||||
if ( [c$id$orig_h, c$id$resp_p, c$id$resp_h] in expected_data_conns )
|
||||
{
|
||||
c$tftp = expected_data_conns[c$id$orig_h, c$id$resp_p, c$id$resp_h];
|
||||
c$tftp$uid_data = c$uid;
|
||||
add c$service["spicy_tftp_data"];
|
||||
}
|
||||
}
|
||||
|
||||
event tftp::read_request(c: connection, is_orig: bool, fname: string, mode: string)
|
||||
{
|
||||
init_request(c, is_orig, fname, mode, T);
|
||||
}
|
||||
|
||||
event tftp::write_request(c: connection, is_orig: bool, fname: string, mode: string)
|
||||
{
|
||||
init_request(c, is_orig, fname, mode, F);
|
||||
}
|
||||
|
||||
event tftp::data(c: connection, is_orig: bool, block_num: count, data: string)
|
||||
{
|
||||
if ( ! c?$tftp || c$tftp$done )
|
||||
return;
|
||||
|
||||
local info = c$tftp;
|
||||
|
||||
if ( block_num <= info$block_sent )
|
||||
# Duplicate (or previous gap; we don't track that)
|
||||
return;
|
||||
|
||||
info$size += |data|;
|
||||
info$block_sent = block_num;
|
||||
|
||||
if ( |data| < 512 )
|
||||
# Last block, per spec.
|
||||
info$final_block = block_num;
|
||||
}
|
||||
|
||||
# Handles a TFTP ACK. Tracks the highest acknowledged block and, once the
# final data block (per tftp::data's short-block detection) is acknowledged,
# writes out the log entry for this transfer.
#
# c: the data connection carrying the transfer
# is_orig: direction flag as reported by the analyzer (unused here)
# block_num: block number being acknowledged
event tftp::ack(c: connection, is_orig: bool, block_num: count)
	{
	if ( ! c?$tftp || c$tftp$done )
		return;

	local info = c$tftp;

	# Ignore duplicates (or previous gaps; we don't track those). The check
	# must happen *before* updating block_acked, otherwise it always fires.
	if ( block_num <= info$block_acked )
		return;

	info$block_acked = block_num;

	# If it's an ack for the last block, we're done.
	if ( info?$final_block && info$final_block == block_num )
		log_pending(c);
	}
|
||||
|
||||
event tftp::error(c: connection, is_orig: bool, code: count, msg: string)
|
||||
{
|
||||
if ( ! c?$tftp || c$tftp$done )
|
||||
return;
|
||||
|
||||
local info = c$tftp;
|
||||
|
||||
info$error_code = code;
|
||||
info$error_msg = msg;
|
||||
log_pending(c);
|
||||
}
|
||||
|
||||
event connection_state_remove(c: connection)
|
||||
{
|
||||
if ( ! c?$tftp || c$tftp$done )
|
||||
return;
|
||||
|
||||
log_pending(c);
|
||||
}
|
736
doc/devel/spicy/autogen/zeek-functions.spicy
Normal file
736
doc/devel/spicy/autogen/zeek-functions.spicy
Normal file
|
@ -0,0 +1,736 @@
|
|||
.. _spicy_confirm_protocol:
|
||||
|
||||
.. rubric:: ``function zeek::confirm_protocol()``
|
||||
|
||||
[Deprecated] Triggers a DPD protocol confirmation for the current connection.
|
||||
|
||||
This function has been deprecated and will be removed. Use ``spicy::accept_input``
|
||||
instead, which will have the same effect with Zeek.
|
||||
|
||||
.. _spicy_reject_protocol:
|
||||
|
||||
.. rubric:: ``function zeek::reject_protocol(reason: string)``
|
||||
|
||||
[Deprecated] Triggers a DPD protocol violation for the current connection.
|
||||
|
||||
This function has been deprecated and will be removed. Use ``spicy::decline_input``
|
||||
instead, which will have the same effect with Zeek.
|
||||
|
||||
.. _spicy_weird:
|
||||
|
||||
.. rubric:: ``function zeek::weird(id: string, addl: string = "") : &cxxname="zeek::spicy::rt::weird";``
|
||||
|
||||
Reports a "weird" to Zeek. This should be used with similar semantics as in
|
||||
Zeek: something quite unexpected happening at the protocol level, which however
|
||||
does not prevent us from continuing to process the connection.
|
||||
|
||||
id: the name of the weird, which (just like in Zeek) should be a *static*
|
||||
string identifying the situation reported (e.g., ``unexpected_command``).
|
||||
|
||||
addl: additional information to record along with the weird
|
||||
|
||||
.. _spicy_is_orig:
|
||||
|
||||
.. rubric:: ``function zeek::is_orig() : bool``
|
||||
|
||||
Returns true if we're currently parsing the originator side of a connection.
|
||||
|
||||
.. _spicy_uid:
|
||||
|
||||
.. rubric:: ``function zeek::uid() : string``
|
||||
|
||||
Returns the current connection's UID.
|
||||
|
||||
.. _spicy_conn_id:
|
||||
|
||||
.. rubric:: ``function zeek::conn_id() : tuple<orig_h: addr, orig_p: port, resp_h: addr, resp_p: port>``
|
||||
|
||||
Returns the current connection's 4-tuple ID to make IP address and port information available.
|
||||
|
||||
.. _spicy_flip_roles:
|
||||
|
||||
.. rubric:: ``function zeek::flip_roles()``
|
||||
|
||||
Instructs Zeek to flip the directionality of the current connection.
|
||||
|
||||
.. _spicy_number_packets:
|
||||
|
||||
.. rubric:: ``function zeek::number_packets() : uint64``
|
||||
|
||||
Returns the number of packets seen so far on the current side of the current connection.
|
||||
|
||||
.. _spicy_has_analyzer:
|
||||
|
||||
.. rubric:: ``function zeek::has_analyzer(analyzer: string, if_enabled: bool = True) : bool``
|
||||
|
||||
Checks if there is a Zeek analyzer of a given name.
|
||||
|
||||
analyzer: the Zeek-side name of the analyzer to check for
|
||||
if_enabled: if true, only checks for analyzers that are enabled
|
||||
|
||||
Returns: true if an analyzer of that name exists (and, when ``if_enabled`` is set, is enabled).
|
||||
|
||||
.. _spicy_analyzer_type:
|
||||
|
||||
.. rubric:: ``function zeek::analyzer_type(analyzer: string, if_enabled: bool = True) : AnalyzerType``
|
||||
|
||||
Returns the type of a Zeek analyzer of a given name.
|
||||
|
||||
analyzer: the Zeek-side name of the analyzer to check
|
||||
if_enabled: if true, only checks for analyzers that are enabled
|
||||
|
||||
Returns the type of the analyzer if it exists, or ``Undef`` if it does not.
|
||||
|
||||
.. _spicy_protocol_begin:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_begin(analyzer: optional<string>, protocol: spicy::Protocol = spicy::Protocol::TCP)``
|
||||
|
||||
Adds a Zeek-side child protocol analyzer to the current connection.
|
||||
|
||||
If the same analyzer was added previously with `protocol_handle_get_or_create` or
|
||||
`protocol_begin` with same argument, and not closed with `protocol_handle_close`
|
||||
or `protocol_end`, no new analyzer will be added.
|
||||
|
||||
See `protocol_handle_get_or_create` for lifetime and error semantics.
|
||||
|
||||
analyzer: type of analyzer to instantiate, specified through its Zeek-side
|
||||
name (similar to what Zeek's signature action `enable` takes)
|
||||
|
||||
protocol: the transport-layer protocol that the analyzer uses; only TCP is
|
||||
currently supported here
|
||||
|
||||
Note: For backwards compatibility, the analyzer argument can be left unset to add
|
||||
a DPD analyzer. This use is deprecated, though; use the single-argument version of
|
||||
`protocol_begin` for that instead.
|
||||
|
||||
.. _spicy_protocol_begin_2:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_begin(protocol: spicy::Protocol = spicy::Protocol::TCP)``
|
||||
|
||||
Adds a Zeek-side DPD child protocol analyzer performing dynamic protocol detection
|
||||
on subsequently provided data.
|
||||
|
||||
If the same DPD analyzer was added previously with `protocol_handle_get_or_create` or
|
||||
`protocol_begin` with same argument, and not closed with `protocol_handle_close`
|
||||
or `protocol_end`, no new analyzer will be added.
|
||||
|
||||
See `protocol_handle_get_or_create` for lifetime and error semantics.
|
||||
|
||||
protocol: the transport-layer protocol on which to perform protocol detection;
|
||||
only TCP is currently supported here
|
||||
|
||||
.. _spicy_protocol_handle_get_or_create:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_handle_get_or_create(analyzer: string, protocol: spicy::Protocol = spicy::Protocol::TCP) : ProtocolHandle``
|
||||
|
||||
Gets a handle to a Zeek-side child protocol analyzer for the current connection.
|
||||
|
||||
If no such child exists yet it will be added; otherwise a handle to the
|
||||
existing child protocol analyzer will be returned.
|
||||
|
||||
This function will return an error if:
|
||||
|
||||
- not called from a protocol analyzer, or
|
||||
- the requested child protocol analyzer is of unknown type or not supported by the requested transport protocol, or
|
||||
- creation of a child analyzer of the requested type was prevented by a
|
||||
previous call of `disable_analyzer` with `prevent=T`
|
||||
|
||||
By default, any newly created child protocol analyzer will remain alive
|
||||
until Zeek expires the current connection's state. Alternatively, one
|
||||
can call `protocol_handle_close` or `protocol_end` to delete the analyzer
|
||||
earlier.
|
||||
|
||||
analyzer: type of analyzer to get or instantiate, specified through its Zeek-side
|
||||
name (similar to what Zeek's signature action `enable` takes).
|
||||
|
||||
protocol: the transport-layer protocol that the analyser uses; only TCP is
|
||||
currently supported here
|
||||
|
||||
|
||||
.. _spicy_protocol_data_in:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_data_in(is_orig: bool, data: bytes, protocol: spicy::Protocol = spicy::Protocol::TCP)``
|
||||
|
||||
Forwards protocol data to all previously instantiated Zeek-side child protocol analyzers of a given transport-layer.
|
||||
|
||||
is_orig: true to feed the data to the child's originator side, false for the responder
|
||||
|
||||
data: chunk of data to forward to child analyzer
|
||||
|
||||
protocol: the transport-layer protocol of the children to forward to; only TCP is currently supported here
|
||||
|
||||
.. _spicy_protocol_data_in_2:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_data_in(is_orig: bool, data: bytes, h: ProtocolHandle)``
|
||||
|
||||
Forwards protocol data to a specific previously instantiated Zeek-side child analyzer.
|
||||
|
||||
is_orig: true to feed the data to the child's originator side, false for the responder
|
||||
|
||||
data: chunk of data to forward to child analyzer
|
||||
|
||||
h: handle to the child analyzer to forward data into
|
||||
|
||||
.. _spicy_protocol_gap:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_gap(is_orig: bool, offset: uint64, len: uint64, h: optional<ProtocolHandle> = Null)``
|
||||
|
||||
Signals a gap in input data to all previously instantiated Zeek-side child protocol analyzers.
|
||||
|
||||
is_orig: true to signal gap to the child's originator side, false for the responder
|
||||
|
||||
offset: start offset of gap in input stream
|
||||
|
||||
len: size of gap
|
||||
|
||||
h: optional handle to the child analyzer to signal a gap to, else signal to all child analyzers
|
||||
|
||||
.. _spicy_protocol_end:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_end()``
|
||||
|
||||
Signals end-of-data to all previously instantiated Zeek-side child protocol
|
||||
analyzers and removes them.
|
||||
|
||||
.. _spicy_protocol_handle_close:
|
||||
|
||||
.. rubric:: ``function zeek::protocol_handle_close(handle: ProtocolHandle)``
|
||||
|
||||
Signals end-of-data to the given child analyzer and removes it.
|
||||
|
||||
The given handle must be live, i.e., it must not have been used in a
|
||||
previous protocol_handle_close call, and must not have been live when
|
||||
protocol_end was called. If the handle is not live a runtime error will
|
||||
be triggered.
|
||||
|
||||
handle: handle to the child analyzer to remove
|
||||
|
||||
.. _spicy_file_begin:
|
||||
|
||||
.. rubric:: ``function zeek::file_begin(mime_type: optional<string> = Null, fuid: optional<string> = Null) : string``
|
||||
|
||||
Signals the beginning of a file to Zeek's file analysis, associating it with the current connection.
|
||||
Optionally, a mime type can be provided. It will be passed on to Zeek's file analysis framework.
|
||||
Optionally, a file ID can be provided. It will be passed on to Zeek's file analysis framework.
|
||||
Returns the Zeek-side file ID of the new file.
|
||||
|
||||
This function creates a new Zeek file analyzer that will remain alive until
|
||||
either `file_end` gets called, or Zeek eventually expires the analyzer
|
||||
through a timeout. (As Zeek does not tie a file analyzer's lifetime to any
|
||||
connection, it may survive the termination of the current connection.)
|
||||
|
||||
.. _spicy_fuid:
|
||||
|
||||
.. rubric:: ``function zeek::fuid() : string``
|
||||
|
||||
Returns the current file's FUID.
|
||||
|
||||
.. _spicy_terminate_session:
|
||||
|
||||
.. rubric:: ``function zeek::terminate_session()``
|
||||
|
||||
Terminates the currently active Zeek-side session, flushing all state. Any
|
||||
subsequent activity will start a new session from scratch. This can only be
|
||||
called from inside a protocol analyzer.
|
||||
|
||||
.. _spicy_skip_input:
|
||||
|
||||
.. rubric:: ``function zeek::skip_input()``
|
||||
|
||||
Tells Zeek to skip sending any further input data to the current analyzer.
|
||||
This is supported for protocol and file analyzers.
|
||||
|
||||
.. _spicy_file_set_size:
|
||||
|
||||
.. rubric:: ``function zeek::file_set_size(size: uint64, fid: optional<string> = Null)``
|
||||
|
||||
Signals the expected size of a file to Zeek's file analysis.
|
||||
|
||||
size: expected size of file
|
||||
fid: Zeek-side ID of the file to operate on; if not given, the file started by the most recent file_begin() will be used
|
||||
|
||||
.. _spicy_file_data_in:
|
||||
|
||||
.. rubric:: ``function zeek::file_data_in(data: bytes, fid: optional<string> = Null)``
|
||||
|
||||
Passes file content on to Zeek's file analysis.
|
||||
|
||||
data: chunk of raw data to pass into analysis
|
||||
fid: Zeek-side ID of the file to operate on; if not given, the file started by the most recent file_begin() will be used
|
||||
|
||||
.. _spicy_file_data_in_at_offset:
|
||||
|
||||
.. rubric:: ``function zeek::file_data_in_at_offset(data: bytes, offset: uint64, fid: optional<string> = Null)``
|
||||
|
||||
Passes file content at a specific offset on to Zeek's file analysis.
|
||||
|
||||
data: chunk of raw data to pass into analysis
|
||||
offset: position in file where data starts
|
||||
fid: Zeek-side ID of the file to operate on; if not given, the file started by the most recent file_begin() will be used
|
||||
|
||||
.. _spicy_file_gap:
|
||||
|
||||
.. rubric:: ``function zeek::file_gap(offset: uint64, len: uint64, fid: optional<string> = Null)``
|
||||
|
||||
Signals a gap in a file to Zeek's file analysis.
|
||||
|
||||
offset: position in file where gap starts
|
||||
len: size of gap
|
||||
fid: Zeek-side ID of the file to operate on; if not given, the file started by the most recent file_begin() will be used
|
||||
|
||||
.. _spicy_file_end:
|
||||
|
||||
.. rubric:: ``function zeek::file_end(fid: optional<string> = Null)``
|
||||
|
||||
Signals the end of a file to Zeek's file analysis.
|
||||
|
||||
fid: Zeek-side ID of the file to operate on; if not given, the file started by the most recent file_begin() will be used
|
||||
|
||||
.. _spicy_forward_packet:
|
||||
|
||||
.. rubric:: ``function zeek::forward_packet(identifier: uint32)``
|
||||
|
||||
Inside a packet analyzer, forwards what data remains after parsing the top-level unit
|
||||
on to another analyzer. The index specifies the target, per the current dispatcher table.
|
||||
|
||||
.. _spicy_network_time:
|
||||
|
||||
.. rubric:: ``function zeek::network_time() : time``
|
||||
|
||||
Gets the network time from Zeek.
|
||||
|
||||
.. _spicy_get_address:
|
||||
|
||||
.. rubric:: ``function zeek::get_address(id: string) : addr``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``addr``.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_bool:
|
||||
|
||||
.. rubric:: ``function zeek::get_bool(id: string) : bool``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``bool``.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_count:
|
||||
|
||||
.. rubric:: ``function zeek::get_count(id: string) : uint64``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``count``.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_double:
|
||||
|
||||
.. rubric:: ``function zeek::get_double(id: string) : real``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``double``.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_enum:
|
||||
|
||||
.. rubric:: ``function zeek::get_enum(id: string) : string``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``enum``.
|
||||
The value is returned as a string containing the enum's label name, without
|
||||
any scope. Throws an exception if there's no such Zeek of that name, or if
|
||||
it's not of the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_int:
|
||||
|
||||
.. rubric:: ``function zeek::get_int(id: string) : int64``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``int``.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_interval:
|
||||
|
||||
.. rubric:: ``function zeek::get_interval(id: string) : interval``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type
|
||||
``interval``. Throws an exception if there's no such Zeek of that name, or
|
||||
if it's not of the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_port:
|
||||
|
||||
.. rubric:: ``function zeek::get_port(id: string) : port``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``port``.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_record:
|
||||
|
||||
.. rubric:: ``function zeek::get_record(id: string) : ZeekRecord``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``record``.
|
||||
The value is returned as an opaque handle to the record, which can be used
|
||||
with the ``zeek::record_*()`` functions to access the record's fields.
|
||||
Throws an exception if there's no such Zeek of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_set:
|
||||
|
||||
.. rubric:: ``function zeek::get_set(id: string) : ZeekSet``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``set``. The
|
||||
value is returned as an opaque handle to the set, which can be used with the
|
||||
``zeek::set_*()`` functions to access the set's content. Throws an exception
|
||||
if there's no such Zeek variable of that name, or if it's not of the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_string:
|
||||
|
||||
.. rubric:: ``function zeek::get_string(id: string) : bytes``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``string``.
|
||||
The string's value is returned as a Spicy ``bytes`` value. Throws an
|
||||
exception if there's no such Zeek variable of that name, or if it's not of the
|
||||
expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_subnet:
|
||||
|
||||
.. rubric:: ``function zeek::get_subnet(id: string) : network``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``subnet``.
|
||||
Throws an exception if there's no such Zeek variable of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_table:
|
||||
|
||||
.. rubric:: ``function zeek::get_table(id: string) : ZeekTable``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``table``.
|
||||
The value is returned as an opaque handle to the table, which can be used with
|
||||
the ``zeek::table_*()`` functions to access the table's content. Throws an
|
||||
exception if there's no such Zeek variable of that name, or if it's not of the
|
||||
expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_time:
|
||||
|
||||
.. rubric:: ``function zeek::get_time(id: string) : time``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``time``.
|
||||
Throws an exception if there's no such Zeek variable of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_vector:
|
||||
|
||||
.. rubric:: ``function zeek::get_vector(id: string) : ZeekVector``
|
||||
|
||||
Returns the value of a global Zeek script variable of Zeek type ``vector``.
|
||||
The value is returned as an opaque handle to the vector, which can be used
|
||||
with the ``zeek::vector_*()`` functions to access the vector's content.
|
||||
Throws an exception if there's no such Zeek variable of that name, or if it's not of
|
||||
the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek variable to retrieve
|
||||
|
||||
.. _spicy_get_value:
|
||||
|
||||
.. rubric:: ``function zeek::get_value(id: string) : ZeekVal``
|
||||
|
||||
Returns an opaque handle to a global Zeek script variable. The handle can be
|
||||
used with the ``zeek::as_*()`` functions to access the variable's value.
|
||||
Throws an exception if there's no Zeek variable of that name.
|
||||
|
||||
.. _spicy_as_address:
|
||||
|
||||
.. rubric:: ``function zeek::as_address(v: ZeekVal) : addr``
|
||||
|
||||
Returns a Zeek ``addr`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_bool:
|
||||
|
||||
.. rubric:: ``function zeek::as_bool(v: ZeekVal) : bool``
|
||||
|
||||
Returns a Zeek ``bool`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_count:
|
||||
|
||||
.. rubric:: ``function zeek::as_count(v: ZeekVal) : uint64``
|
||||
|
||||
Returns a Zeek ``count`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_double:
|
||||
|
||||
.. rubric:: ``function zeek::as_double(v: ZeekVal) : real``
|
||||
|
||||
Returns a Zeek ``double`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_enum:
|
||||
|
||||
.. rubric:: ``function zeek::as_enum(v: ZeekVal) : string``
|
||||
|
||||
Returns a Zeek ``enum`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_int:
|
||||
|
||||
.. rubric:: ``function zeek::as_int(v: ZeekVal) : int64``
|
||||
|
||||
Returns a Zeek ``int`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_interval:
|
||||
|
||||
.. rubric:: ``function zeek::as_interval(v: ZeekVal) : interval``
|
||||
|
||||
Returns a Zeek ``interval`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_port:
|
||||
|
||||
.. rubric:: ``function zeek::as_port(v: ZeekVal) : port``
|
||||
|
||||
Returns a Zeek ``port`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_record:
|
||||
|
||||
.. rubric:: ``function zeek::as_record(v: ZeekVal) : ZeekRecord``
|
||||
|
||||
Returns a Zeek ``record`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_set:
|
||||
|
||||
.. rubric:: ``function zeek::as_set(v: ZeekVal) : ZeekSet``
|
||||
|
||||
Returns a Zeek ``set`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_string:
|
||||
|
||||
.. rubric:: ``function zeek::as_string(v: ZeekVal) : bytes``
|
||||
|
||||
Returns a Zeek ``string`` value referenced by an opaque handle. The string's
|
||||
value is returned as a Spicy ``bytes`` value. Throws an exception if the
|
||||
referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_subnet:
|
||||
|
||||
.. rubric:: ``function zeek::as_subnet(v: ZeekVal) : network``
|
||||
|
||||
Returns a Zeek ``subnet`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_table:
|
||||
|
||||
.. rubric:: ``function zeek::as_table(v: ZeekVal) : ZeekTable``
|
||||
|
||||
Returns a Zeek ``table`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_time:
|
||||
|
||||
.. rubric:: ``function zeek::as_time(v: ZeekVal) : time``
|
||||
|
||||
Returns a Zeek ``time`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_as_vector:
|
||||
|
||||
.. rubric:: ``function zeek::as_vector(v: ZeekVal) : ZeekVector``
|
||||
|
||||
Returns a Zeek ``vector`` value referenced by an opaque handle. Throws an
|
||||
exception if the referenced value is not of the expected type.
|
||||
|
||||
.. _spicy_set_contains:
|
||||
|
||||
.. rubric:: ``function zeek::set_contains(id: string, v: any) : bool``
|
||||
|
||||
Returns true if a Zeek set contains a given value. Throws an exception if
|
||||
the given ID does not exist, or does not have the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek set to check
|
||||
v: value to check for, which must be of the Spicy-side equivalent of the set's key type
|
||||
|
||||
.. _spicy_set_contains_2:
|
||||
|
||||
.. rubric:: ``function zeek::set_contains(s: ZeekSet, v: any) : bool``
|
||||
|
||||
Returns true if a Zeek set contains a given value. Throws an exception if
|
||||
the set does not have the expected type.
|
||||
|
||||
s: opaque handle to the Zeek set, as returned by other functions
|
||||
v: value to check for, which must be of the Spicy-side equivalent of the set's key type
|
||||
|
||||
.. _spicy_table_contains:
|
||||
|
||||
.. rubric:: ``function zeek::table_contains(id: string, v: any) : bool``
|
||||
|
||||
Returns true if a Zeek table contains a given value. Throws an exception if
|
||||
the given ID does not exist, or does not have the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek table to check
|
||||
v: value to check for, which must be of the Spicy-side equivalent of the table's key type
|
||||
|
||||
.. _spicy_table_contains_2:
|
||||
|
||||
.. rubric:: ``function zeek::table_contains(t: ZeekTable, v: any) : bool``
|
||||
|
||||
Returns true if a Zeek table contains a given value. Throws an exception if
|
||||
the table does not have the expected type.
|
||||
|
||||
t: opaque handle to the Zeek table, as returned by other functions
|
||||
v: value to check for, which must be of the Spicy-side equivalent of the table's key type
|
||||
|
||||
.. _spicy_table_lookup:
|
||||
|
||||
.. rubric:: ``function zeek::table_lookup(id: string, v: any) : optional<ZeekVal>``
|
||||
|
||||
Returns the value associated with a key in a Zeek table. Returns an error
|
||||
result if the key does not exist in the table. Throws an exception if the
|
||||
given table ID does not exist, or does not have the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek table to check
|
||||
v: value to lookup, which must be of the Spicy-side equivalent of the table's key type
|
||||
|
||||
.. _spicy_table_lookup_2:
|
||||
|
||||
.. rubric:: ``function zeek::table_lookup(t: ZeekTable, v: any) : optional<ZeekVal>``
|
||||
|
||||
Returns the value associated with a key in a Zeek table. Returns an error
|
||||
result if the key does not exist in the table. Throws an exception if the
|
||||
given table does not have the expected type.
|
||||
|
||||
t: opaque handle to the Zeek table, as returned by other functions
|
||||
v: value to lookup, which must be of the Spicy-side equivalent of the table's key type
|
||||
|
||||
.. _spicy_record_has_value:
|
||||
|
||||
.. rubric:: ``function zeek::record_has_value(id: string, field: string) : bool``
|
||||
|
||||
Returns true if a Zeek record provides a value for a given field. This
|
||||
includes fields with `&default` values. Throws an exception if the given ID
|
||||
does not exist, or does not have the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek record to check
|
||||
field: name of the field to check
|
||||
|
||||
.. _spicy_record_has_value_2:
|
||||
|
||||
.. rubric:: ``function zeek::record_has_value(r: ZeekRecord, field: string) : bool``
|
||||
|
||||
Returns true if a Zeek record provides a value for a given field.
|
||||
This includes fields with `&default` values.
|
||||
|
||||
r: opaque handle to the Zeek record, as returned by other functions
|
||||
field: name of the field to check
|
||||
|
||||
.. _spicy_record_has_field:
|
||||
|
||||
.. rubric:: ``function zeek::record_has_field(id: string, field: string) : bool``
|
||||
|
||||
Returns true if the type of a Zeek record has a field of a given name.
|
||||
Throws an exception if the given ID does not exist, or does not have the
|
||||
expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek record to check
|
||||
field: name of the field to check
|
||||
|
||||
.. _spicy_record_has_field_2:
|
||||
|
||||
.. rubric:: ``function zeek::record_has_field(r: ZeekRecord, field: string) : bool``
|
||||
|
||||
Returns true if the type of a Zeek record has a field of a given name.
|
||||
|
||||
r: opaque handle to the Zeek record, as returned by other functions
|
||||
field: name of the field to check
|
||||
|
||||
.. _spicy_record_field:
|
||||
|
||||
.. rubric:: ``function zeek::record_field(id: string, field: string) : ZeekVal``
|
||||
|
||||
Returns a field's value from a Zeek record. Throws an exception if the given
|
||||
ID does not exist, or does not have the expected type; or if there's no such
|
||||
field in the record type, or if the field does not have a value.
|
||||
|
||||
id: fully-qualified name of the global Zeek record to check
|
||||
field: name of the field to retrieve
|
||||
|
||||
.. _spicy_record_field_2:
|
||||
|
||||
.. rubric:: ``function zeek::record_field(r: ZeekRecord, field: string) : ZeekVal``
|
||||
|
||||
Returns a field's value from a Zeek record. Throws an exception if the given
|
||||
record does not have such a field, or if the field does not have a value.
|
||||
|
||||
r: opaque handle to the Zeek record, as returned by other functions
|
||||
field: name of the field to retrieve
|
||||
|
||||
.. _spicy_vector_index:
|
||||
|
||||
.. rubric:: ``function zeek::vector_index(id: string, index: uint64) : ZeekVal``
|
||||
|
||||
Returns the value of an index in a Zeek vector. Throws an exception if the
|
||||
given ID does not exist, or does not have the expected type; or if the index
|
||||
is out of bounds.
|
||||
|
||||
id: fully-qualified name of the global Zeek vector to check
|
||||
index: index of the element to retrieve
|
||||
|
||||
.. _spicy_vector_index_2:
|
||||
|
||||
.. rubric:: ``function zeek::vector_index(v: ZeekVector, index: uint64) : ZeekVal``
|
||||
|
||||
Returns the value of an index in a Zeek vector. Throws an exception if the
|
||||
index is out of bounds.
|
||||
|
||||
v: opaque handle to the Zeek vector, as returned by other functions
|
||||
index: index of the element to retrieve
|
||||
|
||||
.. _spicy_vector_size:
|
||||
|
||||
.. rubric:: ``function zeek::vector_size(id: string) : uint64``
|
||||
|
||||
Returns the size of a Zeek vector. Throws an exception if the given ID does
|
||||
not exist, or does not have the expected type.
|
||||
|
||||
id: fully-qualified name of the global Zeek vector to check
|
||||
|
||||
.. _spicy_vector_size_2:
|
||||
|
||||
.. rubric:: ``function zeek::vector_size(v: ZeekVector) : uint64``
|
||||
|
||||
Returns the size of a Zeek vector.
|
||||
|
||||
v: opaque handle to the Zeek vector, as returned by other functions
|
||||
|
5
doc/devel/spicy/examples/my-http.evt
Normal file
5
doc/devel/spicy/examples/my-http.evt
Normal file
|
@ -0,0 +1,5 @@
|
|||
protocol analyzer spicy::MyHTTP over TCP:
|
||||
parse originator with MyHTTP::RequestLine,
|
||||
port 12345/tcp;
|
||||
|
||||
on MyHTTP::RequestLine -> event MyHTTP::request_line($conn, self.method, self.uri, self.version.number);
|
26
doc/devel/spicy/examples/my-http.spicy
Normal file
26
doc/devel/spicy/examples/my-http.spicy
Normal file
|
@ -0,0 +1,26 @@
|
|||
# @TEST-EXEC: echo "GET /index.html HTTP/1.0" | spicy-driver %INPUT >output
|
||||
# @TEST-EXEC: btest-diff output
|
||||
|
||||
module MyHTTP;
|
||||
|
||||
const Token = /[^ \t\r\n]+/;
|
||||
const WhiteSpace = /[ \t]+/;
|
||||
const NewLine = /\r?\n/;
|
||||
|
||||
type Version = unit {
|
||||
: /HTTP\//;
|
||||
number: /[0-9]+\.[0-9]+/;
|
||||
};
|
||||
|
||||
public type RequestLine = unit {
|
||||
method: Token;
|
||||
: WhiteSpace;
|
||||
uri: Token;
|
||||
: WhiteSpace;
|
||||
version: Version;
|
||||
: NewLine;
|
||||
|
||||
on %done {
|
||||
print self.method, self.uri, self.version.number;
|
||||
}
|
||||
};
|
4
doc/devel/spicy/examples/my-http.zeek
Normal file
4
doc/devel/spicy/examples/my-http.zeek
Normal file
|
@ -0,0 +1,4 @@
|
|||
event MyHTTP::request_line(c: connection, method: string, uri: string, version: string)
|
||||
{
|
||||
print fmt("Zeek saw from %s: %s %s %s", c$id$orig_h, method, uri, version);
|
||||
}
|
BIN
doc/devel/spicy/examples/request-line.pcap
Normal file
BIN
doc/devel/spicy/examples/request-line.pcap
Normal file
Binary file not shown.
37
doc/devel/spicy/examples/tftp-schedule-analyzer.zeek
Normal file
37
doc/devel/spicy/examples/tftp-schedule-analyzer.zeek
Normal file
|
@ -0,0 +1,37 @@
|
|||
|
||||
function schedule_tftp_analyzer(id: conn_id)
|
||||
{
|
||||
# Schedule the TFTP analyzer for the expected next packet coming in on different
|
||||
# ports. We know that it will be exchanged between same IPs and reuse the
|
||||
# originator's port. "Spicy_TFTP" is the Zeek-side name of the TFTP analyzer
|
||||
# (generated from "Spicy::TFTP" in tftp.evt).
|
||||
Analyzer::schedule_analyzer(id$resp_h, id$orig_h, id$orig_p, Analyzer::ANALYZER_SPICY_TFTP, 1min);
|
||||
}
|
||||
|
||||
event tftp::read_request(c: connection, is_orig: bool, filename: string, mode: string)
|
||||
{
|
||||
print "TFTP read request", c$id, filename, mode;
|
||||
schedule_tftp_analyzer(c$id);
|
||||
}
|
||||
|
||||
event tftp::write_request(c: connection, is_orig: bool, filename: string, mode: string)
|
||||
{
|
||||
print "TFTP write request", c$id, filename, mode;
|
||||
schedule_tftp_analyzer(c$id);
|
||||
}
|
||||
|
||||
# Add handlers for other packet types so that we see their events being generated.
|
||||
event tftp::data(c: connection, is_orig: bool, block_num: count, data: string)
|
||||
{
|
||||
print "TFTP data", block_num, data;
|
||||
}
|
||||
|
||||
event tftp::ack(c: connection, is_orig: bool, block_num: count)
|
||||
{
|
||||
print "TFTP ack", block_num;
|
||||
}
|
||||
|
||||
event tftp::error(c: connection, is_orig: bool, code: count, msg: string)
|
||||
{
|
||||
print "TFTP error", code, msg;
|
||||
}
|
|
@ -0,0 +1,7 @@
|
|||
protocol analyzer spicy::TFTP over UDP:
|
||||
parse with TFTP::Packet,
|
||||
port 69/udp;
|
||||
|
||||
import TFTP;
|
||||
|
||||
on TFTP::Request -> event tftp::request($conn, $is_orig, self.filename, self.mode);
|
|
@ -0,0 +1,4 @@
|
|||
event tftp::request(c: connection, is_orig: bool, filename: string, mode: string)
|
||||
{
|
||||
print "TFTP request", c$id, is_orig, filename, mode;
|
||||
}
|
7
doc/devel/spicy/examples/tftp-single-request.evt
Normal file
7
doc/devel/spicy/examples/tftp-single-request.evt
Normal file
|
@ -0,0 +1,7 @@
|
|||
protocol analyzer spicy::TFTP over UDP:
|
||||
parse with TFTP::Packet,
|
||||
port 69/udp;
|
||||
|
||||
import TFTP;
|
||||
|
||||
on TFTP::Request -> event tftp::request($conn);
|
4
doc/devel/spicy/examples/tftp-single-request.zeek
Normal file
4
doc/devel/spicy/examples/tftp-single-request.zeek
Normal file
|
@ -0,0 +1,4 @@
|
|||
event tftp::request(c: connection)
|
||||
{
|
||||
print "TFTP request", c$id;
|
||||
}
|
9
doc/devel/spicy/examples/tftp-two-requests.zeek
Normal file
9
doc/devel/spicy/examples/tftp-two-requests.zeek
Normal file
|
@ -0,0 +1,9 @@
|
|||
event tftp::read_request(c: connection, is_orig: bool, filename: string, mode: string)
|
||||
{
|
||||
print "TFTP read request", c$id, is_orig, filename, mode;
|
||||
}
|
||||
|
||||
event tftp::write_request(c: connection, is_orig: bool, filename: string, mode: string)
|
||||
{
|
||||
print "TFTP write request", c$id, is_orig, filename, mode;
|
||||
}
|
88
doc/devel/spicy/faq.rst
Normal file
88
doc/devel/spicy/faq.rst
Normal file
|
@ -0,0 +1,88 @@
|
|||
|
||||
===
|
||||
FAQ
|
||||
===
|
||||
|
||||
.. _faq_zeek_install_spicy_and_plugin_to_use_parsers:
|
||||
|
||||
.. rubric:: Do I need to install Spicy and/or a Zeek plugin to use Spicy parsers in Zeek?
|
||||
|
||||
If you're using Zeek >= 5.0 with a default build configuration,
|
||||
there's nothing else you need to install. After installing Zeek, the
|
||||
same folder containing the ``zeek`` binary will also have the relevant
|
||||
Spicy tools, such as ``spicyc`` (provided by Spicy) and ``spicyz``
|
||||
(provided by Zeek). To double check that the Spicy support is indeed
|
||||
available, look for ``Zeek::Spicy`` in the output of ``zeek -N``::
|
||||
|
||||
# zeek -N
|
||||
<...>
|
||||
Zeek::Spicy - Support for Spicy parsers (``*.spicy``, ``*.evt``, ``*.hlto``) (built-in)
|
||||
|
||||
Note that it remains possible to build Zeek against an external Spicy
|
||||
installation, or even without any Spicy support at all. Look at Zeek's
|
||||
``configure`` for corresponding options.
|
||||
|
||||
.. note::
|
||||
|
||||
For some historic background: Zeek 5.0 started bundling Spicy, as well
|
||||
as the former Zeek plugin for Spicy, so that now nothing else needs to
|
||||
be installed separately anymore to use Spicy parsers. Since Zeek 6.0,
|
||||
the code for that former plugin has further moved into Zeek itself,
|
||||
and is now maintained directly by the Zeek developers.
|
||||
|
||||
|
||||
.. _faq_zeek_spicy_dpd_support:
|
||||
|
||||
.. rubric:: Does Spicy support *Dynamic Protocol Detection (DPD)*?
|
||||
|
||||
Yes, see the :ref:`corresponding section <spicy_dpd>` on how to add it
|
||||
to your analyzers.
|
||||
|
||||
.. _faq_zeek_layer2_analyzer:
|
||||
|
||||
.. rubric:: Can I write a Layer 2 protocol analyzer with Spicy?
|
||||
|
||||
Yes, you can. In Zeek terminology a layer 2 protocol analyzer is a packet
|
||||
analyzer, see the :ref:`corresponding section <spicy_packet_analyzer>` on how
|
||||
to declare such an analyzer.
|
||||
|
||||
.. _faq_zeek_print_statements_no_effect:
|
||||
|
||||
.. rubric:: I have ``print`` statements in my Spicy grammar, why do I not see any output when running Zeek?
|
||||
|
||||
Zeek by default disables the output of Spicy-side ``print``
|
||||
statements. To enable them, add ``Spicy::enable_print=T`` to the Zeek
|
||||
command line (or ``redef Spicy::enable_print=T;`` to a Zeek script
|
||||
that you are loading).
|
||||
|
||||
.. _faq_zeek_tcp_analyzer_not_all_messages_recognized:
|
||||
|
||||
.. rubric:: My analyzer recognizes only one or two TCP packets even though there are more in the input.
|
||||
|
||||
In Zeek, a Spicy analyzer parses the sending and receiving sides of a TCP
|
||||
connection each according to the given Spicy grammar. This means that
|
||||
if more than one message can be sent per side the grammar needs to
|
||||
allow for that. For example, if the grammar parses messages of the
|
||||
protocol as ``Message``, the top-level parsing unit given in the EVT
|
||||
file needs to be able to parse a list of messages ``Message[]``.
|
||||
|
||||
One way to express this is to introduce a parser which wraps messages
|
||||
of the protocol in an :spicylink:`anonymous field
|
||||
<programming/parsing.html#anonymous-fields>`.
|
||||
|
||||
.. warning:: Since in general the number of messages exchanged over a TCP
|
||||
connection is unbounded, an anonymous field should be used. If a named field
|
||||
was used instead the parser would need to store all messages over the
|
||||
connection which would lead to unbounded memory growth.
|
||||
|
||||
.. code-block:: spicy
|
||||
|
||||
type Message = unit {
|
||||
# Fields for messages of the protocol.
|
||||
};
|
||||
|
||||
# Parser used e.g., in EVT file.
|
||||
public type Messages = unit {
|
||||
: Message[];
|
||||
};
|
||||
|
118
doc/devel/spicy/getting-started.rst
Normal file
118
doc/devel/spicy/getting-started.rst
Normal file
|
@ -0,0 +1,118 @@
|
|||
|
||||
===============
|
||||
Getting Started
|
||||
===============
|
||||
|
||||
Spicy's own :spicylink:`Getting Started <getting-started.html>` guide
|
||||
uses the following Spicy code to parse a simple HTTP request line:
|
||||
|
||||
.. literalinclude:: examples/my-http.spicy
|
||||
:lines: 4-
|
||||
:caption: my-http.spicy
|
||||
:language: spicy
|
||||
|
||||
While the Spicy documentation goes on to show :spicylink:`how to use
|
||||
this to parse corresponding data from the command line
|
||||
<getting-started.html#a-simple-parser>`, here we will instead leverage
|
||||
the ``RequestLine`` parser to build a proof-of-concept protocol
|
||||
analyzer for Zeek. While this all remains simplified here, the
|
||||
following, more in-depth :ref:`spicy_tutorial` demonstrates how
|
||||
to build a complete analyzer for a real protocol.
|
||||
|
||||
.. rubric:: Preparations
|
||||
|
||||
Because Zeek works from network packets, we first need a packet trace
|
||||
with the payload we want to parse. We can't just use a normal HTTP
|
||||
session as our simple parser wouldn't go further than just the first
|
||||
line of the protocol exchange and then bail out with an error. So
|
||||
instead, for our example we create a custom packet trace with a TCP
|
||||
connection that carries just a single HTTP request line as its
|
||||
payload::
|
||||
|
||||
# tcpdump -i lo0 -w request-line.pcap port 12345 &
|
||||
# nc -l 12345 &
|
||||
# echo "GET /index.html HTTP/1.0" | nc localhost 12345
|
||||
# killall tcpdump nc
|
||||
|
||||
This gets us :download:`this trace file <examples/request-line.pcap>`.
|
||||
|
||||
.. _example_spicy_my_http_adding_analyzer:
|
||||
|
||||
.. rubric:: Adding a Protocol Analyzer
|
||||
|
||||
Now we can go ahead and add a new protocol analyzer to Zeek. We
|
||||
already got the Spicy grammar to parse our connection's payload, it's
|
||||
in ``my-http.spicy``. In order to use this with Zeek, we have two
|
||||
additional things to do: (1) We need to let Zeek know about our new
|
||||
protocol analyzer, including when to use it; and (2) we need to define
|
||||
at least one Zeek event that we want our parser to generate, so that
|
||||
we can then write a Zeek script working with the information that it
|
||||
extracts.
|
||||
|
||||
We do both of these by creating an additional control file for Zeek:
|
||||
|
||||
.. literalinclude:: examples/my-http.evt
|
||||
:caption: my-http.evt
|
||||
:linenos:
|
||||
:language: spicy-evt
|
||||
|
||||
The first block (lines 1-3) tells Zeek that we have a new protocol
|
||||
analyzer to provide. The analyzer's Zeek-side name is
|
||||
``spicy::MyHTTP``, and it's meant to run on top of TCP connections
|
||||
(line 1). Lines 2-3 then provide Zeek with more specifics: The entry
|
||||
point for originator-side payload is the ``MyHTTP::RequestLine`` unit
|
||||
type that our Spicy grammar defines (line 2); and we want Zeek to
|
||||
activate our analyzer for all connections with a responder port of
|
||||
12345 (which, of course, matches the packet trace we created).
|
||||
|
||||
The second block (line 5) tells Zeek that we want to
|
||||
define one event. On the left-hand side of that line we give the unit
|
||||
that is to trigger the event. The right-hand side defines its name and
|
||||
arguments. What we are saying here is that every time a ``RequestLine``
|
||||
line has been fully parsed, we'd like a ``MyHTTP::request_line`` event
|
||||
to go to Zeek. Each event instance will come with four parameters:
|
||||
Three of them are the values of corresponding unit fields, accessed
|
||||
just through normal Spicy expressions (inside an event argument
|
||||
expression, ``self`` refers to the unit instance that has led to the
|
||||
generation of the current event). The first parameter, ``$conn``, is a
|
||||
"magic" keyword that passes the Zeek-side
|
||||
connection ID (``conn_id``) to the event.
|
||||
|
||||
Now we got everything in place that we need for our new protocol
|
||||
analyzer---except for a Zeek script actually doing something with the
|
||||
information we are parsing. Let's use this:
|
||||
|
||||
.. literalinclude:: examples/my-http.zeek
|
||||
:caption: my-http.zeek
|
||||
:language: zeek
|
||||
|
||||
You see a Zeek event handler for the event that we just defined,
|
||||
having the expected signature of four parameters matching the types of
|
||||
the parameter expressions that the ``*.evt`` file specifies. The
|
||||
handler's body then just prints out what it gets.
|
||||
|
||||
.. _example_spicy_my_http:
|
||||
|
||||
Finally we can put together our pieces by compiling the Spicy grammar and the
|
||||
EVT file into an HLTO file with ``spicyz``, and by pointing Zeek at the produced
|
||||
file and the analyzer-specific Zeek scripts::
|
||||
|
||||
# spicyz my-http.spicy my-http.evt -o my-http.hlto
|
||||
# zeek -Cr request-line.pcap my-http.hlto my-http.zeek
|
||||
Zeek saw from 127.0.0.1: GET /index.html 1.0
|
||||
|
||||
When Zeek starts up here the Spicy integration registers a protocol analyzer to
|
||||
the entry point of our Spicy grammar as specified in the EVT file. It then
|
||||
begins processing the packet trace as usual, now activating our new analyzer
|
||||
whenever it sees a TCP connection on port 12345. Accordingly, the
|
||||
``MyHTTP::request_line`` event gets generated once the parser gets to process
|
||||
the session's payload. The Zeek event handler then executes and prints the
|
||||
output we would expect.
|
||||
|
||||
.. note::
|
||||
|
||||
By default, Zeek suppresses any output from Spicy-side
|
||||
``print`` statements. You can add ``Spicy::enable_print=T`` to the
|
||||
command line to see it. In the example above, you would then get
|
||||
an additional line of output: ``GET, /index.html, 1.0``.
|
||||
|
73
doc/devel/spicy/index.rst
Normal file
73
doc/devel/spicy/index.rst
Normal file
|
@ -0,0 +1,73 @@
|
|||
============================
|
||||
Writing Analyzers with Spicy
|
||||
============================
|
||||
|
||||
:spicylink:`Spicy <index.html>` is a parser generator that makes it
|
||||
easy to create robust C++ parsers for network protocols, file formats,
|
||||
and more. Zeek supports integrating Spicy analyzers so that one can
|
||||
create Zeek protocol, packet and file analyzers. This section digs
|
||||
into how that integration works. We begin with a short "Getting
|
||||
Started" guide showing you the basics of using Spicy with Zeek,
|
||||
followed by an in-depth tutorial on adding a complete protocol
|
||||
analyzer to Zeek. The final part consists of a reference section
|
||||
documenting everything the Spicy integration supports.
|
||||
|
||||
While this documentation walks through all the bits and pieces that an
|
||||
analyzer consists of, there's an easy way to get started when writing
|
||||
a new analyzer from scratch: the `Zeek package manager
|
||||
<https://docs.zeek.org/projects/package-manager>`_ can create analyzer
|
||||
scaffolding for you that includes an initial Spicy grammar
|
||||
(``*.spicy``), Zeek integration glue code (``*.evt``; see below) and a
|
||||
corresponding CMake build setup. To create that scaffolding, use the
|
||||
package manager's ``create`` command and pass one of
|
||||
``--features=spicy-protocol-analyzer``,
|
||||
``--features=spicy-packet-analyzer``, or
|
||||
``--features=spicy-file-analyzer`` to create a Zeek protocol, packet,
|
||||
or file analyzer, respectively. See :ref:`the tutorial
|
||||
<zkg_create_package>` for more on this.
|
||||
|
||||
Note that Zeek itself installs the grammars of its builtin Spicy
|
||||
analyzers for potential reuse. For example, the `Finger grammar
|
||||
<https://github.com/zeek/zeek/blob/master/src/analyzer/protocol/finger/finger.spicy>`_
|
||||
gets installed to ``<PREFIX>/share/spicy/finger/finger.spicy``. It can
|
||||
be used in custom code by importing it with ``import Finger from
|
||||
finger;``.
|
||||
|
||||
.. toctree::
|
||||
:maxdepth: 2
|
||||
:caption: Table of Contents
|
||||
|
||||
installation
|
||||
getting-started
|
||||
tutorial
|
||||
reference
|
||||
faq
|
||||
|
||||
.. note::
|
||||
|
||||
This documentation focuses on writing *external* Spicy analyzers
|
||||
that you can load into Zeek at startup. Zeek also comes with the
|
||||
infrastructure to build Spicy analyzers directly into the
|
||||
executable itself, just like traditional built-in analyzers. We
|
||||
will document this more as we're converting more of Zeek's built-in
|
||||
analyzers over to Spicy. For now, we recommend looking at one of
|
||||
the existing built-in Spicy analyzers (Syslog, Finger) as examples.
|
||||
|
||||
.. _spicy_terminology:
|
||||
|
||||
Terminology
|
||||
===========
|
||||
|
||||
A word on terminology: In Zeek, the term "analyzer" generally refers
|
||||
to a component that processes a particular protocol ("protocol
|
||||
analyzer"), file format ("file analyzer"), or low-level packet
|
||||
structure ("packet analyzer"). "Processing" here means more than just
|
||||
parsing content: An analyzer controls when it wants to be used (e.g.,
|
||||
with connections on specific ports, or with files of a specific MIME
|
||||
type); what events to generate for Zeek's scripting layer; and how to
|
||||
handle any errors occurring during parsing. While Spicy itself focuses
|
||||
just on the parsing part, Spicy makes it possible to provide the
|
||||
remaining pieces to Zeek, turning a Spicy parser into a full Zeek
|
||||
analyzer. That's what we refer to as a "Spicy (protocol/file/packet)
|
||||
analyzer" for Zeek.
|
||||
|
18
doc/devel/spicy/installation.rst
Normal file
18
doc/devel/spicy/installation.rst
Normal file
|
@ -0,0 +1,18 @@
|
|||
|
||||
.. _spicy_installation:
|
||||
|
||||
Installation
|
||||
============
|
||||
|
||||
Since Zeek version 5.0, support for Spicy is built right into Zeek by
|
||||
default. To confirm that Spicy is indeed available, you can inspect
|
||||
the output of ``zeek -N``::
|
||||
|
||||
# zeek -N Zeek::Spicy
|
||||
Zeek::Spicy - Support for Spicy parsers (*.hlto) (built-in)
|
||||
|
||||
It remains possible to build Zeek against an external Spicy
|
||||
installation through Zeek's ``configure`` option
|
||||
``--with-spicy=PATH``, where ``PATH`` points to the Spicy installation
|
||||
directory. In that case, you also need to ensure that the Spicy tools
|
||||
(e.g., ``spicyc``, ``spicy-config``) are available in ``PATH``.
|
1189
doc/devel/spicy/reference.rst
Normal file
1189
doc/devel/spicy/reference.rst
Normal file
File diff suppressed because it is too large
Load diff
441
doc/devel/spicy/tutorial.rst
Normal file
441
doc/devel/spicy/tutorial.rst
Normal file
|
@ -0,0 +1,441 @@
|
|||
|
||||
.. _spicy_tutorial:
|
||||
|
||||
Tutorial
|
||||
========
|
||||
|
||||
This tutorial walks through the integration of a simple TFTP analyzer
|
||||
into Zeek. This discussion continues the example from
|
||||
:spicylink:`Spicy's own tutorial <tutorial/index.html>` that develops
|
||||
the TFTP grammar, now focusing on how to use it with Zeek. Please go
|
||||
through that Spicy tutorial first before continuing here.
|
||||
|
||||
To turn a Spicy-side grammar into a Zeek analyzer, we need to provide
|
||||
Zeek with a description of how to employ it. There are two parts to
|
||||
that: Telling Zeek when to activate the analyzer, and defining events
|
||||
to generate. In addition, we will need a Zeek-side script to do
|
||||
something with our new TFTP events. We will walk through this in the
|
||||
following, starting with the mechanics of compiling the Spicy analyzer
|
||||
for Zeek. While we will build up the files involved individually
|
||||
first, see the :ref:`final section <zkg_create_package>` for how the
|
||||
Zeek package manager, *zkg*, can be used to bootstrap a new Zeek
|
||||
package with a skeleton of everything needed for an analyzer.
|
||||
|
||||
Before proceeding, make sure that your Zeek comes with Spicy support
|
||||
built-in---which is the default since Zeek version 5.0::
|
||||
|
||||
# zeek -N Zeek::Spicy
|
||||
Zeek::Spicy - Support for Spicy parsers (*.hlto) (built-in)
|
||||
|
||||
You should also have ``spicyz`` in your ``PATH``::
|
||||
|
||||
# which spicyz
|
||||
/usr/local/zeek/bin/spicyz
|
||||
|
||||
.. note::
|
||||
|
||||
There are a number of pieces involved in creating a full Zeek
|
||||
analyzer, in particular if you want to distribute it as a Zeek
|
||||
package. To help you get started with that, Zeek's package manager
|
||||
can create a skeleton Spicy package by running::
|
||||
|
||||
# zkg create --features=spicy-protocol-analyzer --packagedir <packagedir>
|
||||
|
||||
The generated files mark places that will need manual editing with
|
||||
``TODO``. See the :ref:`tutorial <zkg_create_package>` for more on
|
||||
this.
|
||||
|
||||
Compiling the Analyzer
|
||||
----------------------
|
||||
|
||||
Zeek comes with a tool :ref:`spicyz <spicyz>` that compiles Spicy
|
||||
analyzers into binary code that Zeek can load through a Spicy plugin.
|
||||
The following command line produces a binary object file ``tftp.hlto``
|
||||
containing the executable analyzer code:
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy
|
||||
|
||||
Below, we will prepare an additional interface definition file
|
||||
``tftp.evt`` that describes the analyzer's integration into Zeek. We
|
||||
will need to give that to ``spicyz`` as well, and our full
|
||||
compilation command hence becomes:
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
|
||||
When starting Zeek, we add ``tftp.hlto`` to its command line:
|
||||
|
||||
.. code::
|
||||
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto
|
||||
|
||||
|
||||
Activating the Analyzer
|
||||
-----------------------
|
||||
|
||||
In *Getting Started*, :ref:`we already saw
|
||||
<example_spicy_my_http_adding_analyzer>` how to inform Zeek about a new
|
||||
protocol analyzer. We follow the same scheme here and put the
|
||||
following into ``tftp.evt``, the analyzer definition file:
|
||||
|
||||
.. literalinclude:: autogen/tftp.evt
|
||||
:lines: 5-7
|
||||
:language: spicy-evt
|
||||
|
||||
The first line provides our analyzer with a Zeek-side name
|
||||
(``spicy::TFTP``) and also tells Zeek that we are adding an
|
||||
application analyzer on top of UDP (``over UDP``). ``TFTP::Packet``
|
||||
provides the top-level entry point for parsing both sides of a TFTP
|
||||
connection. Furthermore, we want Zeek to automatically activate our
|
||||
analyzer for all sessions on UDP port 69 (i.e., TFTP's well known
|
||||
port). See :ref:`spicy_evt_analyzer_setup` for more details on defining
|
||||
such a ``protocol analyzer`` section.
|
||||
|
||||
.. note::
|
||||
|
||||
We use the ``port`` attribute in the ``protocol analyzer`` section
|
||||
mainly for convenience; it's not the only way to define the
|
||||
well-known ports. For a production analyzer, it's more idiomatic
|
||||
to use a Zeek script instead; see :ref:`this note
|
||||
<zeek_init_instead_of_port>` for more information.
|
||||
|
||||
With this in place, we can already employ the analyzer inside Zeek. It
|
||||
will not generate any events yet, but we can at least see the output of
|
||||
the ``on %done { print self; }`` hook that still remains part of the
|
||||
grammar from earlier:
|
||||
|
||||
.. code::
|
||||
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto Spicy::enable_print=T
|
||||
[$opcode=Opcode::RRQ, $rrq=[$filename=b"rfc1350.txt", $mode=b"octet"], $wrq=(not set), $data=(not set), $ack=(not set), $error=(not set)]
|
||||
|
||||
As by default, the Zeek plugin does not show the output of Spicy-side
|
||||
``print`` statements, we added ``Spicy::enable_print=T`` to the
|
||||
command line to turn that on. We see that Zeek took care of the
|
||||
lower network layers, extracted the UDP payload from the Read Request,
|
||||
and passed that into our Spicy parser. (If you want to learn more about
|
||||
the internals of what is happening here, there are a couple kinds of
|
||||
:ref:`debug output available <spicy_debugging>`.)
|
||||
|
||||
You might be wondering why there is only one line of output, even
|
||||
though there are multiple TFTP packets in our pcap trace. Shouldn't
|
||||
the ``print`` execute multiple times? Yes, it should, but it does not
|
||||
currently: Due to some intricacies of the TFTP protocol, our analyzer
|
||||
gets to see only the first packet for now. We will fix this later. For
|
||||
now, we focus on the Read Request packet that the output above shows.
|
||||
|
||||
Defining Events
|
||||
---------------
|
||||
|
||||
The core task of any Zeek analyzer is to generate events for Zeek
|
||||
scripts to process. For binary protocols, events will often correspond
|
||||
pretty directly to data units specified by their specifications---and
|
||||
TFTP is no exception. We start with an event for Read/Write Requests
|
||||
by adding this definition to ``tftp.evt``:
|
||||
|
||||
.. literalinclude:: examples/tftp-single-request.evt
|
||||
:lines: 5-7
|
||||
:language: spicy-evt
|
||||
|
||||
The first line makes our Spicy TFTP grammar available to the rest of
|
||||
the file. The line ``on ...`` defines one event: Every time a
|
||||
``Request`` unit will be parsed, we want to receive an event
|
||||
``tftp::request`` with one parameter: the connection it belongs to.
|
||||
Here, ``$conn`` is a reserved identifier that will turn into the
|
||||
standard `connection record
|
||||
<https://docs.zeek.org/en/current/scripts/base/init-bare.zeek.html#type-connection>`_
|
||||
record on the Zeek side.
|
||||
|
||||
Now we need a Zeek event handler for our new event. Let's put this
|
||||
into ``tftp.zeek``:
|
||||
|
||||
.. literalinclude:: examples/tftp-single-request.zeek
|
||||
:language: zeek
|
||||
|
||||
Running Zeek then gives us:
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto tftp.zeek
|
||||
TFTP request, [orig_h=192.168.0.253, orig_p=50618/udp, resp_h=192.168.0.10, resp_p=69/udp]
|
||||
|
||||
Let's extend the event signature a bit by passing further arguments:
|
||||
|
||||
.. literalinclude:: examples/tftp-single-request-more-args.evt
|
||||
:lines: 5-7
|
||||
:language: spicy-evt
|
||||
|
||||
This shows how each parameter gets specified as a Spicy expression:
|
||||
``self`` refers to the instance currently being parsed (``self``), and
|
||||
``self.filename`` retrieves the value of its ``filename`` field.
|
||||
``$is_orig`` is another reserved ID that turns into a boolean that
|
||||
will be true if the event has been triggered by originator-side
|
||||
traffic. On the Zeek side, our event now has the following signature:
|
||||
|
||||
.. literalinclude:: examples/tftp-single-request-more-args.zeek
|
||||
:language: zeek
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto tftp.zeek
|
||||
TFTP request, [orig_h=192.168.0.253, orig_p=50618/udp, resp_h=192.168.0.10, resp_p=69/udp], T, rfc1350.txt, octet
|
||||
|
||||
Going back to our earlier discussion of Read vs Write Requests, we do
|
||||
not yet make that distinction with the ``request`` event that we are
|
||||
sending to Zeek-land. However, since we had introduced the ``is_read``
|
||||
unit parameter, we can easily separate the two by gating event
|
||||
generation through an additional ``if`` condition:
|
||||
|
||||
.. literalinclude:: autogen/tftp.evt
|
||||
:lines: 11-12
|
||||
:language: spicy-evt
|
||||
|
||||
This now defines two separate events, each being generated only for
|
||||
the corresponding value of ``is_read``. Let's try it with a new
|
||||
``tftp.zeek``:
|
||||
|
||||
.. literalinclude:: examples/tftp-two-requests.zeek
|
||||
:language: zeek
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto tftp.zeek
|
||||
TFTP read request, [orig_h=192.168.0.253, orig_p=50618/udp, resp_h=192.168.0.10, resp_p=69/udp], T, rfc1350.txt, octet
|
||||
|
||||
If we look at the :file:`conn.log` that Zeek produces during this run, we
|
||||
will see that the ``service`` field is not filled in yet. That's
|
||||
because our analyzer does not yet confirm to Zeek that it has been
|
||||
successful in parsing the content. To do that, we can call a library
|
||||
function that Spicy makes available once we have successfully parsed a
|
||||
request: :spicylink:`spicy::accept_input
|
||||
<programming/library.html#spicy-accept-input>`. That function signals
|
||||
the host application---i.e., Zeek in our case---that the parser is
|
||||
processing the expected protocol.
|
||||
|
||||
First, we need to make sure the Spicy standard library is imported
|
||||
in ``tftp.spicy``, so that we will have its functions available:
|
||||
|
||||
.. code::
|
||||
|
||||
import spicy;
|
||||
|
||||
With that, our request looks like this now:
|
||||
|
||||
.. code-block::
|
||||
|
||||
type Request = unit(is_read: bool) {
|
||||
filename: bytes &until=b"\x00";
|
||||
mode: bytes &until=b"\x00";
|
||||
|
||||
on %done { spicy::accept_input(); }
|
||||
};
|
||||
|
||||
|
||||
Let's try it again:
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto tftp.zeek
|
||||
TFTP read request, [orig_h=192.168.0.253, orig_p=50618/udp, resp_h=192.168.0.10, resp_p=69/udp], T, rfc1350.txt, octet
|
||||
# cat conn.log
|
||||
[...]
|
||||
1367411051.972852 C1f7uj4uuv6zu2aKti 192.168.0.253 50618 192.168.0.10 69 udp spicy_tftp - - - S0 - - 0 D 1 48 0 0 -
|
||||
[...]
|
||||
|
||||
Now the service field says TFTP! (There will be a 2nd connection in
|
||||
the log that we are not showing here; see the next section on that).
|
||||
|
||||
Turning to the other TFTP packet types, it is straightforward to add
|
||||
events for them as well. The following is our complete ``tftp.evt``
|
||||
file:
|
||||
|
||||
.. literalinclude:: autogen/tftp.evt
|
||||
:lines: 5-
|
||||
:language: spicy-evt
|
||||
|
||||
|
||||
|
||||
Detour: Zeek vs. TFTP
|
||||
---------------------
|
||||
|
||||
We noticed above that Zeek seems to be seeing only a single TFTP
|
||||
packet from our input trace, even though ``tcpdump`` shows that the
|
||||
pcap file contains multiple different types of packets. The reason
|
||||
becomes clear once we look more closely at the UDP ports that are in
|
||||
use:
|
||||
|
||||
.. code::
|
||||
|
||||
# tcpdump -ttnr tftp_rrq.pcap
|
||||
1367411051.972852 IP 192.168.0.253.50618 > 192.168.0.10.69: 20 RRQ "rfc1350.txtoctet" [tftp]
|
||||
1367411052.077243 IP 192.168.0.10.3445 > 192.168.0.253.50618: UDP, length 516
|
||||
1367411052.081790 IP 192.168.0.253.50618 > 192.168.0.10.3445: UDP, length 4
|
||||
1367411052.086300 IP 192.168.0.10.3445 > 192.168.0.253.50618: UDP, length 516
|
||||
1367411052.088961 IP 192.168.0.253.50618 > 192.168.0.10.3445: UDP, length 4
|
||||
1367411052.088995 IP 192.168.0.10.3445 > 192.168.0.253.50618: UDP, length 516
|
||||
[...]
|
||||
|
||||
Turns out that only the first packet is using the well-known TFTP port
|
||||
69/udp, whereas all the subsequent packets use ephemeral ports. Due to
|
||||
the port difference, Zeek believes it is seeing two independent
|
||||
network connections, and it does not associate TFTP with the second
|
||||
one at all due to its lack of the well-known port (neither does
|
||||
``tcpdump``!). Zeek's connection log confirms this by showing two
|
||||
separate entries:
|
||||
|
||||
.. code::
|
||||
|
||||
# cat conn.log
|
||||
1367411051.972852 CH3xFz3U1nYI1Dp1Dk 192.168.0.253 50618 192.168.0.10 69 udp spicy_tftp - - - S0 - - 0 D 1 48 0 0 -
|
||||
1367411052.077243 CfwsLw2TaTIeo3gE9g 192.168.0.10 3445 192.168.0.253 50618 udp - 0.181558 24795 196 SF - - 0 Dd 49 26167 49 1568 -
|
||||
|
||||
Switching the ports for subsequent packets is a quirk in TFTP that
|
||||
resembles similar behaviour in standard FTP, where data connections
|
||||
get set up separately as well. Fortunately, Zeek provides a built-in
|
||||
function to designate a specific analyzer for an anticipated future
|
||||
connection. We can call that function when we see the initial request:
|
||||
|
||||
.. literalinclude:: examples/tftp-schedule-analyzer.zeek
|
||||
:language: zeek
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto tftp.zeek
|
||||
TFTP read request, [orig_h=192.168.0.253, orig_p=50618/udp, resp_h=192.168.0.10, resp_p=69/udp], rfc1350.txt, octet
|
||||
TFTP data, 1, \x0a\x0a\x0a\x0a\x0a\x0aNetwork Working Group [...]
|
||||
TFTP ack, 1
|
||||
TFTP data, 2, B Official Protocol\x0a Standards" for the [...]
|
||||
TFTP ack, 2
|
||||
TFTP data, 3, protocol was originally designed by Noel Chia [...]
|
||||
TFTP ack, 3
|
||||
TFTP data, 4, r mechanism was suggested by\x0a PARC's EFT [...]
|
||||
TFTP ack, 4
|
||||
[...]
|
||||
|
||||
Now we are seeing all the packets as we would expect.
|
||||
|
||||
|
||||
Zeek Script
|
||||
-----------
|
||||
|
||||
Analyzers normally come along with a Zeek-side script that implements
|
||||
a set of standard base functionality, such as recording activity into
|
||||
a protocol specific log file. These scripts provide handlers for the
|
||||
analyzers' events, and collect and correlate their activity as
|
||||
desired. We have created such :download:`a script for TFTP
|
||||
<autogen/tftp.zeek>`, based on the events that our Spicy analyzer
|
||||
generates. Once we add that to the Zeek command line, we will see a
|
||||
new :file:`tftp.log`:
|
||||
|
||||
.. code::
|
||||
|
||||
# spicyz -o tftp.hlto tftp.spicy tftp.evt
|
||||
# zeek -r tftp_rrq.pcap tftp.hlto tftp.zeek
|
||||
# cat tftp.log
|
||||
#fields ts uid id.orig_h id.orig_p id.resp_h id.resp_p wrq fname mode uid_data size block_sent block_acked error_code error_msg
|
||||
1367411051.972852 CKWH8L3AIekSHYzBU 192.168.0.253 50618 192.168.0.10 69 F rfc1350.txt octet ClAr3P158Ei77Fql8h 24599 49 49 - -
|
||||
|
||||
The TFTP script also labels the second session as TFTP data by
|
||||
adding a corresponding entry to the ``service`` field inside the
|
||||
Zeek-side connection record. With that, we are now seeing this in
|
||||
:file:`conn.log`:
|
||||
|
||||
.. code::
|
||||
|
||||
1367411051.972852 ChbSfq3QWKuNirt9Uh 192.168.0.253 50618 192.168.0.10 69 udp spicy_tftp - - - S0 - - 0 D 1 48 0 0 -
|
||||
1367411052.077243 CowFQj20FHHduhHSYk 192.168.0.10 3445 192.168.0.253 50618 udp spicy_tftp_data 0.181558 24795 196 SF - - 0 Dd 49 26167 49 1568 -
|
||||
|
||||
The TFTP script ends up being a bit more complex than one would expect
|
||||
for such a simple protocol. That's because it tracks the two related
|
||||
connections (initial request and follow-up traffic on a different
|
||||
port), and combines them into a single TFTP transaction for logging.
|
||||
Since there is nothing Spicy-specific in that Zeek script, we skip
|
||||
discussing it here in more detail.
|
||||
|
||||
|
||||
.. _zkg_create_package:
|
||||
|
||||
Creating a Zeek Package
|
||||
-----------------------
|
||||
|
||||
We have now assembled all the parts needed for providing a new
|
||||
analyzer to Zeek. By adding a few further pieces, we can wrap that
|
||||
analyzer into a full *Zeek package* for others to install easily
|
||||
through *zkg*. To help create that wrapping, *zkg* provides a template
|
||||
for instantiating a skeleton analyzer package as a starting point. The
|
||||
skeleton comes in three different flavors, depending on which kind of
|
||||
analyzer you want to create: protocol, file, or packet analyzer.
|
||||
In each case, it creates all the necessary files along with the
|
||||
appropriate directory layout, and even includes a couple of
|
||||
standard test cases.
|
||||
|
||||
To create the scaffolding for our TFTP analyzer, execute the following
|
||||
command and provide the requested information::
|
||||
|
||||
# zkg create --features spicy-protocol-analyzer --packagedir spicy-tftp
|
||||
"package-template" requires a "name" value (the name of the package, e.g. "FooBar" or "spicy-http"):
|
||||
name: spicy-tftp
|
||||
"package-template" requires a "analyzer" value (name of the Spicy analyzer, which typically corresponds to the protocol/format being parsed (e.g. "HTTP", "PNG")):
|
||||
analyzer: TFTP
|
||||
"package-template" requires a "protocol" value (transport protocol for the analyzer to use: TCP or UDP):
|
||||
protocol: UDP
|
||||
"package-template" requires a "unit_orig" value (name of the top-level Spicy parsing unit for the originator side of the connection (e.g. "Request")):
|
||||
unit_orig: Packet
|
||||
"package-template" requires a "unit_resp" value (name of the top-level Spicy parsing unit for the responder side of the connection (e.g. "Reply"); may be the same as originator side):
|
||||
unit_resp: Packet
|
||||
|
||||
|
||||
The above creates the following files (skipping anything related to
|
||||
``.git``)::
|
||||
|
||||
spicy-tftp/CMakeLists.txt
|
||||
spicy-tftp/COPYING
|
||||
spicy-tftp/README
|
||||
spicy-tftp/analyzer/CMakeLists.txt
|
||||
spicy-tftp/analyzer/tftp.evt
|
||||
spicy-tftp/analyzer/tftp.spicy
|
||||
spicy-tftp/cmake/FindSpicyPlugin.cmake
|
||||
spicy-tftp/scripts/__load__.zeek
|
||||
spicy-tftp/scripts/dpd.sig
|
||||
spicy-tftp/scripts/main.zeek
|
||||
spicy-tftp/testing/Baseline/tests.run-pcap/conn.log
|
||||
spicy-tftp/testing/Baseline/tests.run-pcap/output
|
||||
spicy-tftp/testing/Baseline/tests.standalone/
|
||||
spicy-tftp/testing/Baseline/tests.standalone/output
|
||||
spicy-tftp/testing/Baseline/tests.trace/output
|
||||
spicy-tftp/testing/Baseline/tests.trace/tftp.log
|
||||
spicy-tftp/testing/Files/random.seed
|
||||
spicy-tftp/testing/Makefile
|
||||
spicy-tftp/testing/Scripts/README
|
||||
spicy-tftp/testing/Scripts/diff-remove-timestamps
|
||||
spicy-tftp/testing/Scripts/get-zeek-env
|
||||
spicy-tftp/testing/Traces/tcp-port-12345.pcap
|
||||
spicy-tftp/testing/Traces/udp-port-12345.pcap
|
||||
spicy-tftp/testing/btest.cfg
|
||||
spicy-tftp/testing/tests/availability.zeek
|
||||
spicy-tftp/testing/tests/standalone.spicy
|
||||
spicy-tftp/testing/tests/trace.zeek
|
||||
spicy-tftp/zkg.meta
|
||||
|
||||
|
||||
Note the ``*.evt``, ``*.spicy``, ``*.zeek`` files: they correspond to
|
||||
the files we created for TFTP in the preceding sections; we can just
|
||||
move our versions in there. Furthermore, the generated scaffolding
|
||||
marks places with ``TODO`` that need manual editing: use ``git grep
|
||||
TODO`` inside the ``spicy-tftp`` directory to find them. We won't go
|
||||
through all the specific customizations for TFTP here, but for
|
||||
reference you can find the full TFTP package as created from the *zkg*
|
||||
template on `GitHub <https://github.com/zeek/spicy-tftp>`_.
|
||||
|
||||
If instead of a protocol analyzer, you'd like to create a file or
|
||||
packet analyzer, run zkg with ``--features spicy-file-analyzer`` or
|
||||
``--features spicy-packet-analyzer``, respectively. The generated
|
||||
skeleton will be suitably adjusted then.
|
317
doc/devel/websocket-api.rst
Normal file
317
doc/devel/websocket-api.rst
Normal file
|
@ -0,0 +1,317 @@
|
|||
.. _websocket-api:
|
||||
|
||||
.. _websocat: https://github.com/vi/websocat
|
||||
|
||||
|
||||
======================================
|
||||
Interacting with Zeek using WebSockets
|
||||
======================================
|
||||
|
||||
Introduction
|
||||
============
|
||||
|
||||
Usually, Zeek produces protocol logs consumed by external applications. These
|
||||
external applications might be SIEMs, real-time streaming analysis platforms
|
||||
or basic archival processes compressing logs for long term storage.
|
||||
|
||||
Certain use-cases require interacting and influencing Zeek's runtime behavior
|
||||
outside of static configuration via ``local.zeek``.
|
||||
|
||||
The classic :ref:`framework-input` and :ref:`framework-configuration` can be
|
||||
leveraged for runtime configuration of Zeek as well as triggering arbitrary
|
||||
events or script execution via option handlers. These frameworks are mostly
|
||||
file- or process-based and may feel a bit unusual in environments where creation
|
||||
of files is uncommon or even impossible due to separation of concerns. In many
|
||||
of today's environments, interacting using HTTP-based APIs or other remote
|
||||
interfaces is more common.
|
||||
|
||||
.. note::
|
||||
|
||||
As an aside, if you need more flexibility than the WebSocket API offers today,
|
||||
an alternative could be to use :ref:`javascript` within Zeek. This opens the
|
||||
possibility to run a separate HTTP or a totally different Node.js based server
|
||||
within a Zeek process for quick experimentation and evaluation of other
|
||||
approaches.
|
||||
|
||||
Background and Setup
|
||||
====================
|
||||
|
||||
Since Zeek 5.0, Zeek allows connections from external clients over WebSocket.
|
||||
This allows these clients to interact with Zeek's publish-subscribe layer and
|
||||
exchange Zeek events with other Zeek nodes.
|
||||
Initially, this implementation resided in the Broker subsystem.
|
||||
With Zeek 8.0, most of the implementation has been moved into core Zeek
|
||||
itself with the v1 serialization format remaining in Broker.
|
||||
|
||||
WebSocket clients may subscribe to a fixed set of topics and will receive
|
||||
Zeek events matching these topics that Zeek cluster nodes, but also other
|
||||
WebSocket clients, publish.
|
||||
|
||||
With Zeek 8.0, Zeekctl has received support to interact with Zeek cluster nodes
|
||||
using the WebSocket protocol. If you're running a Zeekctl based cluster and
|
||||
want to experiment with WebSocket functionality, add ``UseWebSocket = 1`` to
|
||||
your ``zeekctl.cfg``:
|
||||
|
||||
.. code-block:: ini
|
||||
|
||||
# zeekctl.cfg
|
||||
...
|
||||
UseWebSocket = 1
|
||||
|
||||
This will essentially add the following snippet, enabling a WebSocket server
|
||||
on the Zeek manager:
|
||||
|
||||
.. code-block:: zeek
|
||||
:caption: websocket.zeek
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
if ( Cluster::local_node_type() == Cluster::MANAGER )
|
||||
{
|
||||
Cluster::listen_websocket([
|
||||
$listen_addr=127.0.0.1,
|
||||
$listen_port=27759/tcp,
|
||||
]);
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
To verify that the WebSocket API is functional in your deployment use, for example,
|
||||
`websocat`_ as a quick check.
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ echo '[]' | websocat ws://127.0.0.1:27759/v1/messages/json
|
||||
{"type":"ack","endpoint":"3eece35d-9f94-568d-861c-6a16c433e090-websocket-2","version":"8.0.0-dev.684"}
|
||||
|
||||
Zeek's ``cluster.log`` file will also have an entry for the WebSocket client connection.
|
||||
The empty array in the command specifies the client's subscriptions, in this case none.
|
||||
|
||||
Version 1
|
||||
=========
|
||||
|
||||
The currently implemented protocol is accessible at ``/v1/messages/json``.
|
||||
The `data representation <https://docs.zeek.org/projects/broker/en/current/web-socket.html#data-representation>`_
|
||||
is documented in detail within the Broker project. Note that this format is a
|
||||
direct translation of Broker's binary format into JSON, resulting in a fairly
|
||||
tight coupling between WebSocket clients and the corresponding Zeek scripts.
|
||||
Most prominent is the representation of record values as vectors instead
|
||||
of objects, making the protocol sensitive to reordering or introduction
|
||||
of optional fields to records.
|
||||
|
||||
.. note::
|
||||
|
||||
We're looking into an iteration of the format. If you have feedback or
|
||||
would like to contribute, please reach out on the usual community channels.
|
||||
|
||||
|
||||
Handshake and Acknowledgement
|
||||
-----------------------------
|
||||
|
||||
The first message after a WebSocket connection has been established originates
|
||||
from the client. This message is a JSON array of strings that represent the
|
||||
topics the WebSocket client wishes to subscribe to.
|
||||
|
||||
Zeek replies with an acknowledgement message that's a JSON object or an error.
|
||||
|
||||
Events
|
||||
------
|
||||
|
||||
After the acknowledgement, WebSocket clients receive all events arriving on
|
||||
topics they have subscribed to.
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ websocat ws://127.0.0.1:27759/v1/messages/json
|
||||
["zeek.test"]
|
||||
{"type":"ack","endpoint":"d955d990-ad8a-5ed4-8bc5-bee252d4a2e6-websocket-0","version":"8.0.0-dev.684"}
|
||||
{"type":"data-message","topic":"zeek.test","@data-type":"vector","data":[{"@data-type":"count","data":1},{"@data-type":"count","data":1},{"@data-type":"vector","data":[{"@data-type":"string","data":"hello"},{"@data-type":"vector","data":[{"@data-type":"count","data":3}]},{"@data-type":"vector","data":[]}]}]}
|
||||
|
||||
The received messages, again, are encoded in Broker's JSON format. Above ``data-message``
|
||||
represents an event received on topic ``zeek.test``. The event's name is ``hello``.
|
||||
This event has a single argument of type :zeek:type:`count`. In the example above
|
||||
its value is ``3``.
|
||||
|
||||
To send events, WebSocket clients similarly encode their event representation
|
||||
to Broker's JSON format and send them as `text data frames <https://datatracker.ietf.org/doc/html/rfc6455#section-5.6>`_.
|
||||
|
||||
|
||||
X-Application-Name Header
|
||||
-------------------------
|
||||
|
||||
When a WebSocket client includes an ``X-Application-Name`` HTTP header in
|
||||
the initial WebSocket Handshake's GET request, that header's value is available
|
||||
in the :zeek:see:`Cluster::websocket_client_added` event's ``endpoint`` argument (see :zeek:see:`Cluster::EndpointInfo`).
|
||||
|
||||
The header's value will also be included in ``cluster.log`` messages.
|
||||
|
||||
Additionally, if the cluster telemetry for WebSocket clients is set to
|
||||
:zeek:see:`Cluster::Telemetry::VERBOSE` or :zeek:see:`Cluster::Telemetry::DEBUG`
|
||||
via :zeek:see:`Cluster::Telemetry::websocket_metrics`, the header's value is
|
||||
included as ``app`` label in metrics exposed by the :ref:`framework-telemetry`.
|
||||
|
||||
As of Zeek 8.0, a WebSocket client will be rejected if the header is set, but
|
||||
its value doesn't match ``[-/_.=:*@a-zA-Z0-9]+``.
|
||||
|
||||
|
||||
Language Bindings
|
||||
-----------------
|
||||
|
||||
Note that it's possible to use any language that offers WebSocket bindings.
|
||||
The ones listed below mostly add a bit of convenience features around the
|
||||
initial Handshake message, error handling and serializing Zeek events and
|
||||
values into the Broker-specific serialization format.
|
||||
|
||||
For example, using the Node.js `builtin WebSocket functionality <https://nodejs.org/en/learn/getting-started/websocket>`_,
|
||||
the ``websocat`` example from above can be reproduced as follows:
|
||||
|
||||
.. code-block:: javascript
|
||||
:caption: client.js
|
||||
|
||||
// client.js
|
||||
const socket = new WebSocket('ws://192.168.122.107:27759/v1/messages/json');
|
||||
|
||||
socket.addEventListener('open', event => {
|
||||
socket.send('["zeek.test"]');
|
||||
});
|
||||
|
||||
socket.addEventListener('message', event => {
|
||||
console.log('Message from server: ', event.data);
|
||||
});
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
$ node ./client.js
|
||||
Message from server: {"type":"ack","endpoint":"2e951b0c-3ca4-504c-ae8a-5d3750fec588-websocket-10","version":"8.0.0-dev.684"}
|
||||
Message from server: {"type":"data-message","topic":"zeek.test","@data-type":"vector","data":[{"@data-type":"count","data":1},{"@data-type":"count","data":1},{"@data-type":"vector","data":[{"@data-type":"string","data":"hello"},{"@data-type":"vector","data":[{"@data-type":"count","data":374}]},{"@data-type":"vector","data":[]}]}]}
|
||||
|
||||
|
||||
Golang
|
||||
^^^^^^
|
||||
|
||||
* `Zeek Broker websocket interface library for Golang <https://github.com/corelight/go-zeek-broker-ws>`_ (not an official Zeek project)
|
||||
|
||||
|
||||
Rust
|
||||
^^^^
|
||||
|
||||
* `Rust types for interacting with Zeek over WebSocket <https://github.com/bbannier/zeek-websocket-rs>`_ (not an official Zeek project)
|
||||
|
||||
Python
|
||||
^^^^^^
|
||||
|
||||
There are no ready to use Python libraries available, but the third-party
|
||||
`websockets <https://github.com/python-websockets/websockets>`_ package
|
||||
allows you to get started quickly.
|
||||
You may take inspiration from `zeek-client's implementation <https://github.com/zeek/zeek-client>`_
|
||||
or the `small helper library <https://raw.githubusercontent.com/zeek/zeek/refs/heads/master/testing/btest/Files/ws/wstest.py>`_ used by several of Zeek's own tests for the
|
||||
WebSocket API.
|
||||
Zeekctl similarly ships a `light implementation <https://github.com/zeek/zeekctl/blob/93459b37c3deab4bec9e886211672024fa3e4759/ZeekControl/events.py#L159>`_
|
||||
using the ``websockets`` library to implement its ``netstats`` and ``print`` commands.
|
||||
|
||||
|
||||
Outgoing Connections
|
||||
====================
|
||||
|
||||
For some deployment scenarios, Zeek only offering a WebSocket server can be cumbersome.
|
||||
Concretely, this is the case when multiple independent Zeek clusters interact with
|
||||
a single instance of a remote API. For instance, this could be needed for
|
||||
configuring a central firewall.
|
||||
In such scenarios, it is more natural for Zeek to connect out to the
|
||||
remote API, rather than the remote API connecting to the Zeek cluster.
|
||||
|
||||
For these use-cases, the current suggestion is to run a WebSocket bridge between
|
||||
a Zeek cluster and the remote API. One concrete tool that can be used
|
||||
for this purpose is `websocat`_.
|
||||
|
||||
.. note::
|
||||
|
||||
This topic has previously been discussed elsewhere. The following
|
||||
`GitHub issue <https://github.com/zeek/zeek/issues/3597>`_ and
|
||||
`discussion <https://github.com/zeek/zeek/discussions/4768>`_
|
||||
provide more background and details.
|
||||
|
||||
|
||||
Example Architecture
|
||||
--------------------
|
||||
|
||||
.. figure:: ../images/websocket-api/one-api-many-zeek.svg
|
||||
:width: 300
|
||||
|
||||
Multiple Zeek instances and a single remote API
|
||||
|
||||
The following proposal decouples the components using a WebSocket
|
||||
bridge for every Zeek cluster. This ensures that the depicted remote API
|
||||
does not need knowledge about an arbitrary number of Zeek clusters.
|
||||
|
||||
|
||||
.. figure:: ../images/websocket-api/one-api-many-zeek-ws-bridge.svg
|
||||
:width: 300
|
||||
|
||||
Multiple Zeek instances and a single remote API with WebSocket bridges.
|
||||
|
||||
Example Implementation
|
||||
----------------------
|
||||
|
||||
Assuming the depicted remote API provides a WebSocket server as well,
|
||||
it is possible to use ``websocat`` as the bridge directly.
|
||||
The crux for the remote API is that upon a new WebSocket client connection,
|
||||
the first message is the topic array that the remote API wishes to subscribe
|
||||
to on a Zeek cluster.
|
||||
|
||||
|
||||
Putting these pieces together, the following JavaScript script presents the
|
||||
remote API, implemented using the `ws library <https://github.com/websockets/ws?tab=readme-ov-file>`_.
|
||||
It accepts WebSocket clients on port 8080 and sends the topic array as the first message
|
||||
containing just ``zeek.bridge.test``. Thereafter, it simply echoes all incoming
|
||||
WebSocket messages.
|
||||
|
||||
.. literalinclude:: websocket-api/server.js
|
||||
:caption: server.js
|
||||
:language: javascript
|
||||
|
||||
The Zeek side starts a WebSocket server on port 8000 and regularly publishes
|
||||
a ``hello`` event to the ``zeek.bridge.test`` topic.
|
||||
|
||||
.. literalinclude:: websocket-api/server.zeek
|
||||
:caption: server.zeek
|
||||
:language: zeek
|
||||
|
||||
These two servers can now be connected by running ``websocat`` as follows:
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
# In terminal 1 (use node if your Zeek has no JavaScript support)
|
||||
$ zeek server.js
|
||||
|
||||
# In terminal 2
|
||||
$ zeek server.zeek
|
||||
|
||||
# In terminal 3
|
||||
$ while true; do websocat --text -H='X-Application-Name: client1' ws://localhost:8000/v1/messages/json ws://localhost:8080 || sleep 0.1 ; done
|
||||
|
||||
|
||||
The first few lines of output in terminal 1 should then look as follows:
|
||||
|
||||
.. code-block:: shell
|
||||
|
||||
# zeek server.js
|
||||
client1: connected, sending topics array ["zeek.bridge.test"]
|
||||
client1: received: {"type":"ack","endpoint":"9089e06b-8d33-5585-ad79-4f7f6348754e-websocket-135","version":"8.1.0-dev.91"}
|
||||
client1: received: {"type":"data-message","topic":"zeek.bridge.test","@data-type":"vector","data":[{"@data-type":"count","data":1},{"@data-type":"count","data":1},{"@data-type":"vector","data":[{"@data-type":"string","data":"hello"},{"@data-type":"vector","data":[{"@data-type":"count","data":1792}]},{"@data-type":"vector","data":[]}]}]}
|
||||
...
|
||||
|
||||
If you require synchronization between the Zeek instance and the remote API, this
|
||||
is best achieved with events once the connection between the remote API and the
|
||||
Zeek cluster is established.
|
||||
|
||||
Alternative Approaches
|
||||
----------------------
|
||||
|
||||
Since v21, Node.js contains a built-in `WebSocket client <https://nodejs.org/en/learn/getting-started/websocket>`_,
|
||||
making it possible to use vanilla :ref:`javascript` within
|
||||
Zeek to establish outgoing WebSocket connections, too.
|
||||
|
||||
The ``websocat`` tool provides more flexibility, potentially allowing
|
||||
one to forward WebSocket messages to external commands, which in turn could
|
||||
use HTTP POST requests to an external API.
|
23
doc/devel/websocket-api/server.js
Normal file
23
doc/devel/websocket-api/server.js
Normal file
|
@ -0,0 +1,23 @@
|
|||
// server.js
|
||||
import WebSocket, { WebSocketServer } from 'ws';
|
||||
|
||||
const wss = new WebSocketServer({ port: 8080 });
|
||||
|
||||
wss.on('connection', (ws, req) => {
|
||||
ws.on('error', console.error);
|
||||
ws.on('close', () => { console.log('%s: gone', ws.zeek.app); });
|
||||
|
||||
ws.on('message', function message(data) {
|
||||
console.log('%s: received: %s', ws.zeek.app, data);
|
||||
});
|
||||
|
||||
let topics = ['zeek.bridge.test'];
|
||||
let app = req.headers['x-application-name'] || '<unknown application>'
|
||||
ws.zeek = {
|
||||
app: app,
|
||||
topics: topics,
|
||||
};
|
||||
|
||||
console.log(`${app}: connected, sending topics array ${JSON.stringify(topics)}`);
|
||||
ws.send(JSON.stringify(topics));
|
||||
});
|
15
doc/devel/websocket-api/server.zeek
Normal file
15
doc/devel/websocket-api/server.zeek
Normal file
|
@ -0,0 +1,15 @@
|
|||
global hello: event(c : count);
|
||||
|
||||
global c = 0;
|
||||
|
||||
event tick()
|
||||
{
|
||||
Cluster::publish("zeek.bridge.test", hello, ++c);
|
||||
schedule 1.0sec { tick() };
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Cluster::listen_websocket([$listen_addr=127.0.0.1, $listen_port=8000/tcp]);
|
||||
event tick();
|
||||
}
|
41
doc/ext/literal-emph.py
Normal file
41
doc/ext/literal-emph.py
Normal file
|
@ -0,0 +1,41 @@
|
|||
import re
|
||||
|
||||
import sphinx
|
||||
from docutils import nodes
|
||||
|
||||
# This extension adds a 'literal-emph' directive that operates the same
|
||||
# as the 'code-block' directive except that it additionally understands
|
||||
# the **strong emphasis** markup, allowing custom rendering of it to be
|
||||
# substituted in the final literal block (e.g. HTML adds <strong> elements).
|
||||
# Adding " (no-emph)" to the end of a line within the 'literal-emph' content
|
||||
# disables substitutions for that line.
|
||||
|
||||
|
||||
class LiteralEmphNode(nodes.General, nodes.Element):
|
||||
pass
|
||||
|
||||
|
||||
class LiteralEmph(sphinx.directives.code.CodeBlock):
|
||||
def run(self):
|
||||
node = LiteralEmphNode()
|
||||
node += super().run()
|
||||
return [node]
|
||||
|
||||
|
||||
def visit_litemph_node(self, node):
|
||||
pass
|
||||
|
||||
|
||||
def depart_litemph_node(self, node):
|
||||
text = self.body[-1]
|
||||
text = re.sub(r"\*\*(.*?)\*\*(?!.* \(no-emph\)\n)", r"<strong>\1</strong>", text)
|
||||
text = re.sub(r"(.*) \(no-emph\)\n", r"\1\n", text)
|
||||
self.body[-1] = text
|
||||
|
||||
|
||||
def setup(app):
|
||||
app.add_directive("literal-emph", LiteralEmph)
|
||||
app.add_node(LiteralEmphNode, html=(visit_litemph_node, depart_litemph_node))
|
||||
return {
|
||||
"parallel_read_safe": True,
|
||||
}
|
391
doc/ext/spicy-pygments.py
Normal file
391
doc/ext/spicy-pygments.py
Normal file
|
@ -0,0 +1,391 @@
|
|||
# Copyright (c) 2020-now by the Zeek Project. See LICENSE for details.
|
||||
|
||||
from pygments.lexer import RegexLexer, bygroups, include, words
|
||||
from pygments.token import (
|
||||
Comment,
|
||||
Keyword,
|
||||
Name,
|
||||
Number,
|
||||
Operator,
|
||||
Punctuation,
|
||||
String,
|
||||
Text,
|
||||
)
|
||||
from sphinx.highlighting import lexers
|
||||
|
||||
|
||||
def setup(app):
|
||||
lexers["spicy"] = SpicyLexer()
|
||||
lexers["spicy-evt"] = SpicyEvtLexer()
|
||||
return {
|
||||
"parallel_read_safe": True,
|
||||
"parallel_write_safe": True,
|
||||
}
|
||||
|
||||
|
||||
class SpicyLexer(RegexLexer):
|
||||
"""
|
||||
For `Spicy <https://github.com/zeek/spicy>`_ grammars.
|
||||
"""
|
||||
|
||||
name = "Spicy"
|
||||
aliases = ["spicy"]
|
||||
filenames = ["*.spicy"]
|
||||
|
||||
_hex = r"[0-9a-fA-F]"
|
||||
_float = r"((\d*\.?\d+)|(\d+\.?\d*))([eE][-+]?\d+)?"
|
||||
_h = r"[A-Za-z0-9][-A-Za-z0-9]*"
|
||||
_id = r"[a-zA-Z_][a-zA-Z_0-9]*"
|
||||
|
||||
tokens = {
|
||||
"root": [
|
||||
include("whitespace"),
|
||||
include("comments"),
|
||||
include("directives"),
|
||||
include("attributes"),
|
||||
include("hooks"),
|
||||
include("properties"),
|
||||
include("types"),
|
||||
include("modules"),
|
||||
include("keywords"),
|
||||
include("literals"),
|
||||
include("operators"),
|
||||
include("punctuation"),
|
||||
include("function-call"),
|
||||
include("identifiers"),
|
||||
],
|
||||
"whitespace": [
|
||||
(r"\n", Text),
|
||||
(r"\s+", Text),
|
||||
(r"\\\n", Text),
|
||||
],
|
||||
"comments": [
|
||||
(r"#.*$", Comment),
|
||||
],
|
||||
"directives": [(r"(@(if|else|endif))\b", Comment.Preproc)],
|
||||
"attributes": [
|
||||
(
|
||||
words(
|
||||
(
|
||||
"bit-order",
|
||||
"byte-order",
|
||||
"chunked",
|
||||
"convert",
|
||||
"count",
|
||||
"cxxname",
|
||||
"default",
|
||||
"eod",
|
||||
"internal",
|
||||
"ipv4",
|
||||
"ipv6",
|
||||
"length",
|
||||
"max-size",
|
||||
"no-emit",
|
||||
"nosub",
|
||||
"on-heap",
|
||||
"optional",
|
||||
"originator",
|
||||
"parse-at",
|
||||
"parse-from",
|
||||
"priority",
|
||||
"requires",
|
||||
"responder",
|
||||
"size",
|
||||
"static",
|
||||
"synchronize",
|
||||
"transient",
|
||||
"try",
|
||||
"type",
|
||||
"until",
|
||||
"until-including",
|
||||
"while",
|
||||
"have_prototype",
|
||||
),
|
||||
prefix=r"&",
|
||||
suffix=r"\b",
|
||||
),
|
||||
Keyword.Pseudo,
|
||||
),
|
||||
],
|
||||
"hooks": [
|
||||
(
|
||||
rf"(on)(\s+)(({_id}::)+%?{_id}(\.{_id})*)",
|
||||
bygroups(Keyword, Text, Name.Function),
|
||||
),
|
||||
(rf"(on)(\s+)(%?{_id}(\.{_id})*)", bygroups(Keyword, Text, Name.Function)),
|
||||
],
|
||||
"properties": [
|
||||
# Like an ID, but allow hyphenation ('-')
|
||||
(r"%[a-zA-Z_][a-zA-Z_0-9-]*", Name.Attribute),
|
||||
],
|
||||
"types": [
|
||||
(
|
||||
words(
|
||||
(
|
||||
"any",
|
||||
"addr",
|
||||
"bitfield",
|
||||
"bool",
|
||||
"bytes",
|
||||
"__library_type",
|
||||
"iterator",
|
||||
"const_iterator",
|
||||
"int8",
|
||||
"int16",
|
||||
"int32",
|
||||
"int64",
|
||||
"uint8",
|
||||
"uint16",
|
||||
"uint32",
|
||||
"uint64",
|
||||
"enum",
|
||||
"interval",
|
||||
"interval_ns",
|
||||
"list",
|
||||
"map",
|
||||
"optional",
|
||||
"port",
|
||||
"real",
|
||||
"regexp",
|
||||
"set",
|
||||
"sink",
|
||||
"stream",
|
||||
"view",
|
||||
"string",
|
||||
"time",
|
||||
"time_ns",
|
||||
"tuple",
|
||||
"unit",
|
||||
"vector",
|
||||
"void",
|
||||
"function",
|
||||
"struct",
|
||||
),
|
||||
prefix=r"\b",
|
||||
suffix=r"\b",
|
||||
),
|
||||
Keyword.Type,
|
||||
),
|
||||
(
|
||||
rf"\b(type)(\s+)((?:{_id})(?:::(?:{_id}))*)\b",
|
||||
bygroups(Keyword, Text, Name.Class),
|
||||
),
|
||||
],
|
||||
"modules": [
|
||||
(
|
||||
rf"\b(import)(\s+)({_id})(\s+)(from)(\s+)(\S+)\b",
|
||||
bygroups(
|
||||
Keyword.Namespace,
|
||||
Text,
|
||||
Name.Namespace,
|
||||
Text,
|
||||
Keyword.Namespace,
|
||||
Text,
|
||||
Name.Namespace,
|
||||
),
|
||||
),
|
||||
(
|
||||
rf"\b(module|import)(\s+)({_id})\b",
|
||||
bygroups(Keyword.Namespace, Text, Name.Namespace),
|
||||
),
|
||||
],
|
||||
"keywords": [
|
||||
(
|
||||
words(
|
||||
("global", "const", "local", "var", "public", "private", "inout"),
|
||||
prefix=r"\b",
|
||||
suffix=r"\b",
|
||||
),
|
||||
Keyword.Declaration,
|
||||
),
|
||||
(
|
||||
words(
|
||||
(
|
||||
"print",
|
||||
"add",
|
||||
"delete",
|
||||
"stop",
|
||||
"unset",
|
||||
"assert",
|
||||
"assert-exception",
|
||||
"new",
|
||||
"cast",
|
||||
"begin",
|
||||
"end",
|
||||
"type",
|
||||
"attribute",
|
||||
"on",
|
||||
"priority",
|
||||
"if",
|
||||
"else",
|
||||
"switch",
|
||||
"case",
|
||||
"default",
|
||||
"try",
|
||||
"catch",
|
||||
"break",
|
||||
"return",
|
||||
"continue",
|
||||
"while",
|
||||
"for",
|
||||
"foreach",
|
||||
"module",
|
||||
"import",
|
||||
"export",
|
||||
"from",
|
||||
),
|
||||
prefix=r"\b",
|
||||
suffix=r"\b",
|
||||
),
|
||||
Keyword,
|
||||
),
|
||||
],
|
||||
"literals": [
|
||||
(r'b?"', String, "string"),
|
||||
# Not the greatest match for patterns, but generally helps
|
||||
# disambiguate between start of a pattern and just a division
|
||||
# operator.
|
||||
(r"/(?=.*/)", String.Regex, "regex"),
|
||||
(r"\b(True|False|None|Null)\b", Keyword.Constant),
|
||||
# Port
|
||||
(r"\b\d{1,5}/(udp|tcp)\b", Number),
|
||||
# IPv4 Address
|
||||
(
|
||||
r"\b(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\b",
|
||||
Number,
|
||||
),
|
||||
# IPv6 Address (not 100% correct: that takes more effort)
|
||||
(
|
||||
r"\[([0-9a-fA-F]{0,4}:){2,7}([0-9a-fA-F]{0,4})?((25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2}))?\]",
|
||||
Number,
|
||||
),
|
||||
# Numeric
|
||||
(rf"\b0[xX]{_hex}+\b", Number.Hex),
|
||||
(rf"\b{_float}\b", Number.Float),
|
||||
(r"\b(\d+)\b", Number.Integer),
|
||||
],
|
||||
"operators": [
|
||||
(r"[$][$]", Name.Builtin.Pseudo), # just-parsed-element
|
||||
(r"[$]\d+", Name.Builtin.Pseudo), # capture-group
|
||||
(r"\b(in)\b", Operator.Word),
|
||||
(r"[-+*=&|<>.]{2}", Operator),
|
||||
(r"[-+*/=!><]=", Operator),
|
||||
(r"[?][.]", Operator),
|
||||
(r"[.][?]", Operator),
|
||||
(r"[-][>]", Operator),
|
||||
(r"[!][<>]", Operator),
|
||||
(r"[!%*/+<=>~|&^-]", Operator),
|
||||
# Technically, colons are often used for punctuation/sepration.
|
||||
# E.g. field name/type separation.
|
||||
(r"[?:]", Operator),
|
||||
],
|
||||
"punctuation": [
|
||||
(r"[{}()\[\],;:.]", Punctuation),
|
||||
],
|
||||
"function-call": [
|
||||
(rf"\b((?:{_id})(?:::(?:{_id}))*)(?=\s*\()", Name.Function),
|
||||
],
|
||||
"identifiers": [
|
||||
(r"\b(self)\b", Name.Builtin.Pseudo),
|
||||
(r"([a-zA-Z_]\w*)(::)", bygroups(Name, Punctuation)),
|
||||
(r"[a-zA-Z_]\w*", Name),
|
||||
],
|
||||
"string": [
|
||||
(r"\\.", String.Escape),
|
||||
(r"%-?[0-9]*(\.[0-9]+)?[DTdxsefg]", String.Escape),
|
||||
(r'"', String, "#pop"),
|
||||
(r".", String),
|
||||
],
|
||||
"regex": [
|
||||
(r"\\.", String.Escape),
|
||||
(r"/", String.Regex, "#pop"),
|
||||
(r".", String.Regex),
|
||||
],
|
||||
}
|
||||
|
||||
|
||||
class SpicyEvtLexer(RegexLexer):
|
||||
"""
|
||||
For `Spicy <https://github.com/zeek/spicy>`_ Zeek interface definitions.
|
||||
"""
|
||||
|
||||
name = "SpicyEvt"
|
||||
aliases = ["spicy-evt"]
|
||||
filenames = ["*.evt"]
|
||||
|
||||
_id = r"[a-zA-Z_][a-zA-Z_0-9]*"
|
||||
|
||||
tokens = {
|
||||
"root": [
|
||||
include("whitespace"),
|
||||
include("comments"),
|
||||
include("directives"),
|
||||
include("hooks"),
|
||||
include("modules"),
|
||||
include("keywords"),
|
||||
include("literals"),
|
||||
include("operators"),
|
||||
include("punctuation"),
|
||||
include("function-call"),
|
||||
include("identifiers"),
|
||||
],
|
||||
"whitespace": SpicyLexer.tokens["whitespace"],
|
||||
"comments": SpicyLexer.tokens["comments"],
|
||||
"directives": SpicyLexer.tokens["directives"],
|
||||
"hooks": SpicyLexer.tokens["hooks"],
|
||||
"modules": SpicyLexer.tokens["modules"],
|
||||
"keywords": [
|
||||
(
|
||||
rf"\b(analyzer|with|replaces)(\s+)({_id}(::{_id})*)",
|
||||
bygroups(Keyword, Text, Name.Class),
|
||||
),
|
||||
(
|
||||
words(("protocol", "packet", "file"), prefix=r"\b", suffix=r"\b"),
|
||||
Keyword.Type,
|
||||
),
|
||||
(
|
||||
words(
|
||||
("port", "event", "parse", "over", "mime-type"),
|
||||
prefix=r"\b",
|
||||
suffix=r"\b",
|
||||
),
|
||||
Keyword,
|
||||
),
|
||||
(words(("cast"), prefix=r"\b", suffix=r"\b"), Keyword),
|
||||
(
|
||||
words(
|
||||
(
|
||||
"if",
|
||||
"else",
|
||||
"switch",
|
||||
"case",
|
||||
"default",
|
||||
"try",
|
||||
"catch",
|
||||
"break",
|
||||
"return",
|
||||
"continue",
|
||||
"while",
|
||||
"for",
|
||||
"foreach",
|
||||
),
|
||||
prefix=r"\b",
|
||||
suffix=r"\b",
|
||||
),
|
||||
Keyword,
|
||||
),
|
||||
],
|
||||
"literals": SpicyLexer.tokens["literals"],
|
||||
"operators": SpicyLexer.tokens["operators"],
|
||||
"punctuation": SpicyLexer.tokens["punctuation"],
|
||||
"function-call": SpicyLexer.tokens["function-call"],
|
||||
"identifiers": [
|
||||
(r"\b(ZEEK_VERSION)\b", Name.Builtin),
|
||||
(r"\b(self)\b", Name.Builtin.Pseudo),
|
||||
(r"[$](conn|file|is_orig)", Name.Builtin.Pseudo),
|
||||
(r"([a-zA-Z_]\w*)(::)", bygroups(Name, Punctuation)),
|
||||
(r"[a-zA-Z_]\w*", Name),
|
||||
],
|
||||
"string": SpicyLexer.tokens["string"],
|
||||
"regex": SpicyLexer.tokens["regex"],
|
||||
}
|
597
doc/ext/zeek.py
Normal file
597
doc/ext/zeek.py
Normal file
|
@ -0,0 +1,597 @@
|
|||
"""
|
||||
The Zeek domain for Sphinx.
|
||||
"""
|
||||
|
||||
import collections
|
||||
|
||||
|
||||
def setup(Sphinx):
|
||||
Sphinx.add_domain(ZeekDomain)
|
||||
Sphinx.add_node(see)
|
||||
Sphinx.add_directive_to_domain("zeek", "see", SeeDirective)
|
||||
Sphinx.connect("object-description-transform", object_description_transform)
|
||||
Sphinx.connect("doctree-resolved", process_see_nodes)
|
||||
return {
|
||||
"parallel_read_safe": True,
|
||||
}
|
||||
|
||||
|
||||
from sphinx import addnodes, version_info
|
||||
from sphinx.directives import ObjectDescription
|
||||
from sphinx.domains import Domain, Index, ObjType
|
||||
from sphinx.locale import _
|
||||
from sphinx.roles import XRefRole
|
||||
from sphinx.util import docfields, logging
|
||||
from sphinx.util.nodes import make_refnode
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
from docutils import nodes
|
||||
from docutils.parsers.rst import Directive, directives
|
||||
|
||||
|
||||
class see(nodes.General, nodes.Element):
|
||||
refs = []
|
||||
|
||||
|
||||
class SeeDirective(Directive):
|
||||
has_content = True
|
||||
|
||||
def run(self):
|
||||
n = see("")
|
||||
n.refs = " ".join(self.content).split()
|
||||
return [n]
|
||||
|
||||
|
||||
# Wrapper for creating a tuple for index nodes, staying backwards
|
||||
# compatible to Sphinx < 1.4:
|
||||
def make_index_tuple(indextype, indexentry, targetname, targetname2):
|
||||
if version_info >= (1, 4, 0, "", 0):
|
||||
return (indextype, indexentry, targetname, targetname2, None)
|
||||
else:
|
||||
return (indextype, indexentry, targetname, targetname2)
|
||||
|
||||
|
||||
def object_description_transform(app, domain, objtype, contentnode):
|
||||
"""
|
||||
Add all collected record fields as a "Field" field to a ZeekType.
|
||||
"""
|
||||
if domain != "zeek" or objtype != "type":
|
||||
return
|
||||
|
||||
type_name = app.env.ref_context["zeek:type"]
|
||||
record_fields = app.env.domaindata["zeek"].get("fields", {}).get(type_name)
|
||||
|
||||
if not record_fields:
|
||||
return
|
||||
|
||||
field_list = contentnode[0]
|
||||
|
||||
name = nodes.field_name("", _("Fields"))
|
||||
body = nodes.field_body("")
|
||||
|
||||
for field_name, record_field in record_fields.items():
|
||||
body += record_field["idx"]
|
||||
body += record_field["signode"]
|
||||
|
||||
field_list.append(nodes.field("", name, body))
|
||||
|
||||
|
||||
def process_see_nodes(app, doctree, fromdocname):
|
||||
for node in doctree.traverse(see):
|
||||
content = []
|
||||
para = nodes.paragraph()
|
||||
para += nodes.Text("See also:", "See also:")
|
||||
for name in node.refs:
|
||||
join_str = " "
|
||||
if name != node.refs[0]:
|
||||
join_str = ", "
|
||||
link_txt = join_str + name
|
||||
if name not in app.env.domaindata["zeek"]["idtypes"]:
|
||||
# Just create the text and issue warning
|
||||
logger.warning(
|
||||
'%s: unknown target for ".. zeek:see:: %s"',
|
||||
fromdocname,
|
||||
name,
|
||||
location=node,
|
||||
)
|
||||
para += nodes.Text(link_txt, link_txt)
|
||||
else:
|
||||
# Create a reference
|
||||
typ = app.env.domaindata["zeek"]["idtypes"][name]
|
||||
todocname = app.env.domaindata["zeek"]["objects"][(typ, name)]
|
||||
|
||||
newnode = nodes.reference("", "")
|
||||
innernode = nodes.literal(_(name), _(name), classes=["xref"])
|
||||
newnode["refdocname"] = todocname
|
||||
newnode["refuri"] = app.builder.get_relative_uri(fromdocname, todocname)
|
||||
newnode["refuri"] += "#" + typ + "-" + name
|
||||
newnode.append(innernode)
|
||||
para += nodes.Text(join_str, join_str)
|
||||
para += newnode
|
||||
|
||||
content.append(para)
|
||||
node.replace_self(content)
|
||||
|
||||
|
||||
class ZeekGeneric(ObjectDescription):
|
||||
option_spec = {"source-code": directives.unchanged}
|
||||
|
||||
def __init__(self, *args, **kwargs):
|
||||
super(ObjectDescription, self).__init__(*args, **kwargs)
|
||||
options = args[2]
|
||||
self.code_url = None
|
||||
|
||||
if "source-code" in options and "zeek-code-url" in self.env.config:
|
||||
base_url = self.env.config["zeek-code-url"]
|
||||
path, start, end = options["source-code"].split()
|
||||
path_parts = path.split("/")
|
||||
file_name = path_parts[-1]
|
||||
|
||||
# Don't have anything to link to for BIFs
|
||||
if not file_name.endswith(".bif.zeek"):
|
||||
self.code_url = f"{base_url}/scripts/{path}#L{start}-L{end}"
|
||||
|
||||
def get_obj_name(self):
|
||||
return self.objtype
|
||||
|
||||
def update_type_map(self, idname):
|
||||
if "idtypes" not in self.env.domaindata["zeek"]:
|
||||
self.env.domaindata["zeek"]["idtypes"] = {}
|
||||
self.env.domaindata["zeek"]["idtypes"][idname] = self.get_obj_name()
|
||||
|
||||
def process_signode(self, name, sig, signode, targetname):
|
||||
signode["names"].append(targetname)
|
||||
signode["ids"].append(targetname)
|
||||
signode["first"] = not self.names
|
||||
self.state.document.note_explicit_target(signode)
|
||||
|
||||
def add_target_and_index(self, name, sig, signode):
|
||||
targetname = self.get_obj_name() + "-" + name
|
||||
|
||||
if targetname not in self.state.document.ids:
|
||||
self.process_signode(name, sig, signode, targetname)
|
||||
|
||||
objects = self.env.domaindata["zeek"]["objects"]
|
||||
key = (self.get_obj_name(), name)
|
||||
|
||||
if (
|
||||
key in objects
|
||||
and self.get_obj_name() != "id"
|
||||
and self.get_obj_name() != "type"
|
||||
and self.get_obj_name() != "field"
|
||||
):
|
||||
logger.warning(
|
||||
"%s: duplicate description of %s %s, other instance in %s %s",
|
||||
self.env.docname,
|
||||
self.get_obj_name(),
|
||||
name,
|
||||
self.env.doc2path(objects[key]),
|
||||
self.lineno,
|
||||
)
|
||||
|
||||
objects[key] = self.env.docname
|
||||
self.update_type_map(name)
|
||||
|
||||
indextext = self.get_index_text(name)
|
||||
|
||||
if indextext:
|
||||
self.indexnode["entries"].append(
|
||||
make_index_tuple("single", indextext, targetname, targetname)
|
||||
)
|
||||
|
||||
def get_index_text(self, name):
|
||||
return _("%s (%s)") % (name, self.get_obj_name())
|
||||
|
||||
def handle_signature(self, sig, signode):
|
||||
if self.code_url:
|
||||
signode += nodes.reference(
|
||||
sig, sig, refuri=self.code_url, reftitle="View Source Code"
|
||||
)
|
||||
|
||||
# Could embed snippets directly, but would probably want to clean
|
||||
# up how it's done: don't use an external script, figure out why
|
||||
# tab/indentation is broken, toggle snippet visibility on mouse
|
||||
# hover or other explicit button/link, fix the colors/theming...
|
||||
# But for now, leaving this commented out as an example and quick
|
||||
# way of checking that the code ranges that Zeekygen outputs are
|
||||
# sensible.
|
||||
|
||||
# import urllib
|
||||
# snippet_target = urllib.parse.quote(self.code_url, '')
|
||||
# snippet_url = 'https://emgithub.com/embed.js'
|
||||
# snippet_url += f'?target={snippet_target}'
|
||||
# snippet_url += '&style=github'
|
||||
# snippet_url += '&showLineNumbers=on'
|
||||
# snippet_url += '&showBorder=on'
|
||||
# snippet_url += '&ts=4'
|
||||
# rawnode = nodes.raw('', f'<script src="{snippet_url}"></script>',
|
||||
# format='html')
|
||||
# signode += rawnode
|
||||
|
||||
else:
|
||||
signode += addnodes.desc_name("", sig)
|
||||
|
||||
return sig
|
||||
|
||||
|
||||
class ZeekNamespace(ZeekGeneric):
|
||||
def add_target_and_index(self, name, sig, signode):
|
||||
targetname = self.get_obj_name() + "-" + name
|
||||
|
||||
if targetname not in self.state.document.ids:
|
||||
signode["names"].append(targetname)
|
||||
signode["ids"].append(targetname)
|
||||
signode["first"] = not self.names
|
||||
self.state.document.note_explicit_target(signode)
|
||||
|
||||
objects = self.env.domaindata["zeek"]["objects"]
|
||||
key = (self.get_obj_name(), name)
|
||||
objects[key] = self.env.docname
|
||||
self.update_type_map(name)
|
||||
|
||||
indextext = self.get_index_text(name)
|
||||
self.indexnode["entries"].append(
|
||||
make_index_tuple("single", indextext, targetname, targetname)
|
||||
)
|
||||
self.indexnode["entries"].append(
|
||||
make_index_tuple("single", f"namespaces; {sig}", targetname, targetname)
|
||||
)
|
||||
|
||||
def get_index_text(self, name):
|
||||
return _("%s (namespace); %s") % (name, self.env.docname)
|
||||
|
||||
def handle_signature(self, sig, signode):
|
||||
signode += addnodes.desc_name("", sig)
|
||||
return sig
|
||||
|
||||
|
||||
class ZeekEnum(ZeekGeneric):
|
||||
def add_target_and_index(self, name, sig, signode):
|
||||
targetname = self.get_obj_name() + "-" + name
|
||||
|
||||
if targetname not in self.state.document.ids:
|
||||
self.process_signode(name, sig, signode, targetname)
|
||||
|
||||
objects = self.env.domaindata["zeek"]["objects"]
|
||||
key = (self.get_obj_name(), name)
|
||||
objects[key] = self.env.docname
|
||||
self.update_type_map(name)
|
||||
|
||||
# indextext = self.get_index_text(name)
|
||||
# self.indexnode['entries'].append(make_index_tuple('single', indextext,
|
||||
# targetname, targetname))
|
||||
m = sig.split()
|
||||
|
||||
if len(m) < 2:
|
||||
logger.warning(
|
||||
"%s: zeek:enum directive missing argument(s)", self.env.docname
|
||||
)
|
||||
return
|
||||
|
||||
if m[1] == "Notice::Type":
|
||||
if "notices" not in self.env.domaindata["zeek"]:
|
||||
self.env.domaindata["zeek"]["notices"] = []
|
||||
self.env.domaindata["zeek"]["notices"].append(
|
||||
(m[0], self.env.docname, targetname)
|
||||
)
|
||||
|
||||
self.indexnode["entries"].append(
|
||||
make_index_tuple(
|
||||
"single", f"{m[1]} (enum values); {m[0]}", targetname, targetname
|
||||
)
|
||||
)
|
||||
|
||||
def handle_signature(self, sig, signode):
|
||||
m = sig.split()
|
||||
name = m[0]
|
||||
signode += addnodes.desc_name("", name)
|
||||
return name
|
||||
|
||||
|
||||
class ZeekParamField(docfields.GroupedField):
|
||||
has_arg = True
|
||||
is_typed = True
|
||||
|
||||
|
||||
class ZeekIdentifier(ZeekGeneric):
|
||||
zeek_param_field = ZeekParamField("param", label="Parameters", can_collapse=True)
|
||||
field_type_map = {"param": (zeek_param_field, False)}
|
||||
|
||||
def get_index_text(self, name):
|
||||
return name
|
||||
|
||||
def get_field_type_map(self):
|
||||
return self.field_type_map
|
||||
|
||||
|
||||
class ZeekNative(ZeekGeneric):
|
||||
def handle_signature(self, sig, signode):
|
||||
# The run() method is overridden to drop signode anyway in favor of
|
||||
# simply adding the index and a target nodes and leaving up
|
||||
# to the .rst document to explicitly add things that need to
|
||||
# be presented in the final rendering (e.g. a section header)
|
||||
self.native_name = sig
|
||||
return sig
|
||||
|
||||
def process_signode(self, name, sig, signode, targetname):
|
||||
pass
|
||||
|
||||
def run(self):
|
||||
ns = super().run()
|
||||
index_node = ns[0]
|
||||
|
||||
target_id = self.get_obj_name() + "-" + self.native_name
|
||||
target_node = nodes.target("", "", ids=[target_id])
|
||||
self.state.document.note_explicit_target(target_node)
|
||||
|
||||
# Replace the description node from Sphinx with a simple target node
|
||||
return [index_node, target_node]
|
||||
|
||||
|
||||
class ZeekKeyword(ZeekNative):
|
||||
def get_index_text(self, name):
|
||||
if name and name[0] == "@":
|
||||
return _("%s (directive)") % (name)
|
||||
else:
|
||||
return _("%s (keyword)") % (name)
|
||||
|
||||
|
||||
class ZeekAttribute(ZeekNative):
|
||||
def get_index_text(self, name):
|
||||
return _("%s (attribute)") % (name)
|
||||
|
||||
|
||||
class ZeekType(ZeekGeneric):
|
||||
"""
|
||||
Put the type that's currently documented into env.ref_context
|
||||
for usage with the ZeekField directive.
|
||||
"""
|
||||
|
||||
def before_content(self):
|
||||
self.env.ref_context["zeek:type"] = self.arguments[0]
|
||||
|
||||
def after_content(self):
|
||||
self.env.ref_context.pop("zeek:type", None)
|
||||
|
||||
|
||||
class ZeekField(ZeekGeneric):
|
||||
def handle_signature(self, sig, signode):
|
||||
"""
|
||||
The signature for .. zeek:field: currently looks like the following:
|
||||
|
||||
.. zeek:field:: ts :zeek:type:`time` :zeek:attr:`&log` :zeek:attr:`&optional`
|
||||
"""
|
||||
parts = sig.split(" ", 2)
|
||||
name, type_str = parts[0:2]
|
||||
record_type = self.env.ref_context["zeek:type"]
|
||||
fullname = "$".join([record_type, name])
|
||||
attrs_str = ""
|
||||
if len(parts) == 3:
|
||||
attrs_str = parts[2]
|
||||
|
||||
type_nodes, _ = self.state.inline_text(type_str, -1)
|
||||
|
||||
signode += addnodes.desc_name(name, name)
|
||||
signode += addnodes.desc_sig_punctuation("", ":")
|
||||
signode += addnodes.desc_sig_space()
|
||||
signode += type_nodes
|
||||
|
||||
if attrs_str:
|
||||
attr_nodes, _ = self.state.inline_text(attrs_str, -1)
|
||||
signode += addnodes.desc_sig_space()
|
||||
signode += attr_nodes
|
||||
|
||||
signode["class"] = record_type
|
||||
signode["fullname"] = fullname
|
||||
|
||||
return fullname
|
||||
|
||||
def run(self):
|
||||
idx, signode = super().run()
|
||||
|
||||
record_type = self.env.ref_context["zeek:type"]
|
||||
|
||||
fields = self.env.domaindata["zeek"].setdefault("fields", {})
|
||||
rfields = fields.setdefault(record_type, collections.OrderedDict())
|
||||
rfields[signode[0]["fullname"]] = {
|
||||
"idx": idx,
|
||||
"signode": signode,
|
||||
}
|
||||
|
||||
return []
|
||||
|
||||
|
||||
class ZeekNativeType(ZeekNative):
|
||||
def get_obj_name(self):
|
||||
# As opposed to using 'native-type', just imitate 'type'.
|
||||
return "type"
|
||||
|
||||
|
||||
class ZeekFieldXRefRole(XRefRole):
|
||||
def process_link(self, env, refnode, has_explicit_title, title, target):
|
||||
title, target = super().process_link(
|
||||
env, refnode, has_explicit_title, title, target
|
||||
)
|
||||
|
||||
parts = title.split("$")
|
||||
if len(parts) == 2 and parts[0] and parts[1]:
|
||||
# If a field is in Type$field, form, strip Type.
|
||||
title = parts[1]
|
||||
|
||||
return title, target
|
||||
|
||||
|
||||
class ZeekNotices(Index):
    """
    Index subclass to provide the Zeek notices index.
    """

    name = "noticeindex"
    localname = _("Zeek Notice Index")
    shortname = _("notices")

    def generate(self, docnames=None):
        """Build index entries, grouped by the notice's module prefix."""
        grouped = {}

        domaindata = self.domain.env.domaindata["zeek"]
        if "notices" not in domaindata:
            return grouped, False

        for notice in domaindata["notices"]:
            # Group under everything before the first "::".
            module = notice[0].split("::")[0]
            grouped.setdefault(module, []).append(
                [notice[0], 0, notice[1], notice[2], "", "", ""]
            )

        return sorted(grouped.items()), False
|
||||
|
||||
|
||||
class ZeekDomain(Domain):
    """Zeek domain.

    Registers the Zeek-specific directives, cross-reference roles and
    indices with Sphinx, and resolves ``:zeek:*:`` references against
    the objects collected in the domain data.
    """

    name = "zeek"
    label = "Zeek"

    object_types = {
        "type": ObjType(_("type"), "type"),
        # 'native-type' objects intentionally resolve via the 'type' role.
        "native-type": ObjType(_("type"), "type"),
        "namespace": ObjType(_("namespace"), "namespace"),
        "id": ObjType(_("id"), "id"),
        "keyword": ObjType(_("keyword"), "keyword"),
        "enum": ObjType(_("enum"), "enum"),
        "attr": ObjType(_("attr"), "attr"),
        "field": ObjType(_("field"), "field"),
    }

    directives = {
        "type": ZeekType,
        "native-type": ZeekNativeType,
        "namespace": ZeekNamespace,
        "id": ZeekIdentifier,
        "keyword": ZeekKeyword,
        "enum": ZeekEnum,
        "attr": ZeekAttribute,
        "field": ZeekField,
    }

    roles = {
        "type": XRefRole(),
        "namespace": XRefRole(),
        "id": XRefRole(),
        "keyword": XRefRole(),
        "enum": XRefRole(),
        "attr": XRefRole(),
        "see": XRefRole(),
        # Fields get a custom role that strips the record type from titles.
        "field": ZeekFieldXRefRole(),
    }

    indices = [
        ZeekNotices,
    ]

    initial_data = {
        "objects": {},  # fullname -> docname, objtype
    }

    def clear_doc(self, docname):
        """Drop all objects registered by ``docname`` (re-read support)."""
        to_delete = []

        # Collect first, then delete: can't mutate the dict while iterating.
        for (typ, name), doc in self.data["objects"].items():
            if doc == docname:
                to_delete.append((typ, name))

        for typ, name in to_delete:
            del self.data["objects"][typ, name]

    def resolve_xref(self, env, fromdocname, builder, typ, target, node, contnode):
        """Resolve a ``:zeek:<typ>:`` cross-reference to a refnode.

        ``see`` references look the target's object type up in the
        ``idtypes`` table; other roles try each object type the role may
        refer to. Unknown targets are logged and left unresolved.
        """
        objects = self.data["objects"]

        if typ == "see":
            if target not in self.data["idtypes"]:
                logger.warning(
                    '%s: unknown target for ":zeek:see:`%s`"', fromdocname, target
                )
                return []

            objtype = self.data["idtypes"][target]
            return make_refnode(
                builder,
                fromdocname,
                objects[objtype, target],
                objtype + "-" + target,
                contnode,
                target + " " + objtype,
            )
        elif typ == "field" and "$" not in target:
            # :zeek:field:`x` without a record type ends up just x, no ref.
            return []
        else:
            objtypes = self.objtypes_for_role(typ)

            for objtype in objtypes:
                if (objtype, target) in objects:
                    return make_refnode(
                        builder,
                        fromdocname,
                        objects[objtype, target],
                        objtype + "-" + target,
                        contnode,
                        target + " " + objtype,
                    )
            else:
                # for/else: runs when no objtype matched (loop returns on
                # success). Falls through returning None, which Sphinx
                # treats as an unresolved reference.
                logger.warning(
                    '%s: unknown target for ":zeek:%s:`%s`"',
                    fromdocname,
                    typ,
                    target,
                )

    def get_objects(self):
        """Yield (name, dispname, type, docname, anchor, priority) tuples."""
        for (typ, name), docname in self.data["objects"].items():
            yield name, name, typ, docname, typ + "-" + name, 1

    def merge_domaindata(self, docnames, otherdata):
        """
        Merge domaindata in multiprocess mode.

        I'm quite unclear how the objects dict works out okay in single
        process mode. For example, the file_entropy() event is defined
        in scripts/base/bif/plugins/Zeek_FileEntropy.events.bif.zeek.rst
        *and* in script-reference/autogenerated-file-analyzer-index.rst.
        The current documentation refers to the first one for :zeek:see:.
        It seems in single process mode the reading sorts filenames and
        just uses the last highest sorting one. That ends-up being the one
        in scripts/base.

        In [4]: "script-reference/autogenerated" < "scripts/base"
        Out[4]: True

        """
        for target, data in otherdata.items():
            if target == "version":
                continue
            elif hasattr(data, "items"):
                # dict-like domaindata (objects, idtypes, fields, ...).
                target_data = self.env.domaindata["zeek"].setdefault(target, {})

                # Iterate manually over the elements for debugging
                for k, v in data.items():
                    if k not in target_data:
                        target_data[k] = v
                    else:
                        # The > comparison below updates the objects domaindata
                        # to filenames that sort higher. See comment above.
                        if isinstance(v, str):
                            if v > target_data[k]:
                                target_data[k] = v
                        else:
                            # Otherwise assume it's a dict and we can merge
                            # using update()
                            target_data[k].update(v)

            elif hasattr(data, "extend"):
                # notices are a list
                target_data = self.env.domaindata["zeek"].setdefault(target, [])
                target_data.extend(data)
            else:
                raise NotImplementedError(target, type(data))
|
247
doc/ext/zeek_pygments.py
Normal file
247
doc/ext/zeek_pygments.py
Normal file
|
@ -0,0 +1,247 @@
|
|||
from pygments.lexer import RegexLexer, bygroups, include, words
|
||||
from pygments.token import (
|
||||
Comment,
|
||||
Keyword,
|
||||
Literal,
|
||||
Name,
|
||||
Number,
|
||||
Operator,
|
||||
Punctuation,
|
||||
String,
|
||||
Text,
|
||||
)
|
||||
|
||||
|
||||
def setup(Sphinx):
|
||||
return {
|
||||
"parallel_read_safe": True,
|
||||
}
|
||||
|
||||
|
||||
class ZeekLexer(RegexLexer):
    """
    For `Zeek <https://www.zeek.org/>`_ scripts.

    .. versionadded:: 2.5
    """

    name = "Zeek"
    aliases = ["zeek"]
    filenames = ["*.zeek"]

    # Reusable regex fragments: hex digit, floating-point number (with
    # optional exponent), and a hostname label.
    _hex = r"[0-9a-fA-F]"
    _float = r"((\d*\.?\d+)|(\d+\.?\d*))([eE][-+]?\d+)?"
    _h = r"[A-Za-z0-9][-A-Za-z0-9]*"

    tokens = {
        # Order matters within 'root': earlier includes win, so e.g.
        # attribute/keyword matches take precedence over bare identifiers.
        "root": [
            include("whitespace"),
            include("comments"),
            include("directives"),
            include("attributes"),
            include("types"),
            include("keywords"),
            include("literals"),
            include("operators"),
            include("punctuation"),
            # A (possibly ::-qualified) identifier followed by '(' is
            # highlighted as a function name (lookahead, '(' not consumed).
            (
                r"\b((?:[A-Za-z_][A-Za-z_0-9]*)(?:::(?:[A-Za-z_][A-Za-z_0-9]*))*)(?=\s*\()",
                Name.Function,
            ),
            include("identifiers"),
        ],
        "whitespace": [
            (r"\n", Text),
            (r"\s+", Text),
            (r"\\\n", Text),  # line continuation
        ],
        "comments": [
            (r"#.*$", Comment),
        ],
        # '@'-prefixed preprocessor-style directives.
        "directives": [
            (r"(@(load-plugin|load-sigs|load|unload))\b.*$", Comment.Preproc),
            (
                r"(@(DEBUG|DIR|FILENAME|deprecated|if|ifdef|ifndef|else|endif))\b",
                Comment.Preproc,
            ),
            (r"(@prefixes)\s*(\+?=).*$", Comment.Preproc),
        ],
        # '&'-prefixed attributes, e.g. &redef, &log, &optional.
        "attributes": [
            (
                words(
                    (
                        "redef",
                        "priority",
                        "log",
                        "optional",
                        "default",
                        "add_func",
                        "delete_func",
                        "expire_func",
                        "read_expire",
                        "write_expire",
                        "create_expire",
                        "synchronized",
                        "persistent",
                        "rotate_interval",
                        "rotate_size",
                        "encrypt",
                        "raw_output",
                        "mergeable",
                        "error_handler",
                        "broker_allow_complex_type",
                        "is_assigned",
                        "is_used",
                        "type_column",
                        "deprecated",
                        "on_change",
                        "backend",
                        "broker_store",
                    ),
                    prefix=r"&",
                    suffix=r"\b",
                ),
                Keyword.Pseudo,
            ),
        ],
        "types": [
            # Built-in type names.
            (
                words(
                    (
                        "any",
                        "enum",
                        "record",
                        "set",
                        "table",
                        "vector",
                        "function",
                        "hook",
                        "event",
                        "addr",
                        "bool",
                        "count",
                        "double",
                        "file",
                        "int",
                        "interval",
                        "pattern",
                        "port",
                        "string",
                        "subnet",
                        "time",
                    ),
                    prefix=r"\b",
                    suffix=r"\b",
                ),
                Keyword.Type,
            ),
            # 'opaque of SomeType' declarations.
            (
                r"\b(opaque)(\s+)(of)(\s+)((?:[A-Za-z_][A-Za-z_0-9]*)(?:::(?:[A-Za-z_][A-Za-z_0-9]*))*)\b",
                bygroups(Keyword.Type, Text, Operator.Word, Text, Keyword.Type),
            ),
            # 'type Name: record' / 'type Name: enum' — name is a class.
            (
                r"\b(type)(\s+)((?:[A-Za-z_][A-Za-z_0-9]*)(?:::(?:[A-Za-z_][A-Za-z_0-9]*))*)(\s*)(:)(\s*)\b(record|enum)\b",
                bygroups(Keyword, Text, Name.Class, Text, Operator, Text, Keyword.Type),
            ),
            # Other 'type Name:' declarations.
            (
                r"\b(type)(\s+)((?:[A-Za-z_][A-Za-z_0-9]*)(?:::(?:[A-Za-z_][A-Za-z_0-9]*))*)(\s*)(:)",
                bygroups(Keyword, Text, Name, Text, Operator),
            ),
            # 'redef record Name' / 'redef enum Name' extensions.
            (
                r"\b(redef)(\s+)(record|enum)(\s+)((?:[A-Za-z_][A-Za-z_0-9]*)(?:::(?:[A-Za-z_][A-Za-z_0-9]*))*)\b",
                bygroups(Keyword, Text, Keyword.Type, Text, Name.Class),
            ),
        ],
        "keywords": [
            (
                words(
                    (
                        "redef",
                        "export",
                        "if",
                        "else",
                        "for",
                        "while",
                        "return",
                        "break",
                        "next",
                        "continue",
                        "fallthrough",
                        "switch",
                        "default",
                        "case",
                        "add",
                        "delete",
                        "copy",
                        "when",
                        "timeout",
                        "schedule",
                    ),
                    prefix=r"\b",
                    suffix=r"\b",
                ),
                Keyword,
            ),
            (r"\b(print)\b", Keyword),
            (r"\b(global|local|const|option)\b", Keyword.Declaration),
            # 'module Name::Sub' statements.
            (
                r"\b(module)(\s+)(([A-Za-z_][A-Za-z_0-9]*)(?:::([A-Za-z_][A-Za-z_0-9]*))*)\b",
                bygroups(Keyword.Namespace, Text, Name.Namespace),
            ),
        ],
        "literals": [
            (r'"', String, "string"),
            # Not the greatest match for patterns, but generally helps
            # disambiguate between start of a pattern and just a division
            # operator.
            (r"/(?=.*/)", String.Regex, "regex"),
            (r"\b(T|F)\b", Keyword.Constant),
            # Port
            (r"\b\d{1,5}/(udp|tcp|icmp|unknown)\b", Number),
            # IPv4 Address
            (
                r"\b(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\b",
                Number,
            ),
            # IPv6 Address (not 100% correct: that takes more effort)
            (
                r"\[([0-9a-fA-F]{0,4}:){2,7}([0-9a-fA-F]{0,4})?((25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2})\.(25[0-5]|2[0-4][0-9]|[0-1][0-9]{2}|[0-9]{1,2}))?\]",
                Number,
            ),
            # Numeric
            (r"\b0[xX]" + _hex + r"+\b", Number.Hex),
            (r"\b" + _float + r"\s*(day|hr|min|sec|msec|usec)s?\b", Literal.Date),
            (r"\b" + _float + r"\b", Number.Float),
            (r"\b(\d+)\b", Number.Integer),
            # Hostnames
            (_h + r"(\." + _h + r")+", String),
        ],
        "operators": [
            (r"[!%*/+<=>~|&^-]", Operator),
            (r"([-+=&|]{2}|[+=!><-]=)", Operator),
            (r"\b(in|as|is|of)\b", Operator.Word),
            (r"\??\$", Operator),
            # Technically, colons are often used for punctuation/separation.
            # E.g. field name/type separation.
            (r"[?:]", Operator),
        ],
        "punctuation": [
            (r"\?\$", Punctuation),
            (r"[{}()\[\],;:.]", Punctuation),
        ],
        "identifiers": [
            # Namespace-qualified prefix, e.g. 'Module::'.
            (r"([a-zA-Z_]\w*)(::)", bygroups(Name, Punctuation)),
            (r"[a-zA-Z_]\w*", Name),
        ],
        # Inside a double-quoted string (entered from 'literals').
        "string": [
            (r"\\.", String.Escape),
            (r"%-?[0-9]*(\.[0-9]+)?[DTdxsefg]", String.Escape),  # fmt specifiers
            (r'"', String, "#pop"),
            (r".", String),
        ],
        # Inside a /.../ pattern literal (entered from 'literals').
        "regex": [
            (r"\\.", String.Escape),
            (r"/", String.Regex, "#pop"),
            (r".", String.Regex),
        ],
    }
|
644
doc/frameworks/broker.rst
Normal file
644
doc/frameworks/broker.rst
Normal file
|
@ -0,0 +1,644 @@
|
|||
.. _CAF: https://github.com/actor-framework/actor-framework
|
||||
|
||||
.. _broker-framework:
|
||||
|
||||
==============================
|
||||
Broker Communication Framework
|
||||
==============================
|
||||
|
||||
.. rst-class:: opening
|
||||
|
||||
Zeek uses the `Broker Library
|
||||
<https://docs.zeek.org/projects/broker>`_ to exchange information with
|
||||
other Zeek processes. Broker itself uses CAF_ (C++ Actor Framework)
|
||||
internally for connecting nodes and exchanging arbitrary data over
|
||||
networks. Broker then introduces, on top of CAF, a topic-based
|
||||
publish/subscribe communication pattern using a data model that is
|
||||
compatible to Zeek's. Broker itself can be utilized outside the
|
||||
context of Zeek, with Zeek itself making use of only a few predefined
|
||||
Broker message formats that represent Zeek events, log entries, etc.
|
||||
|
||||
In summary, the Zeek's Broker framework provides basic facilities for
|
||||
connecting broker-enabled peers (e.g. Zeek instances) to each other
|
||||
and exchanging messages (e.g. events and logs).
|
||||
|
||||
Cluster Layout / API
|
||||
====================
|
||||
|
||||
Layout / Topology
|
||||
-----------------
|
||||
|
||||
In a Zeek cluster setup, every Zeek process is assigned a cluster role.
|
||||
Such a process is then called a Zeek node, a cluster node, or just named
|
||||
after the role of the process (the manager, the loggers, ...). A basic Zeek
|
||||
cluster uses four different node types, enumerated in the script-level
|
||||
variable :zeek:see:`Cluster::NodeType`.
|
||||
|
||||
- Manager
|
||||
- Logger
|
||||
- Worker
|
||||
- Proxy
|
||||
|
||||
In small Zeek deployments, all nodes may run on a single host. In large
|
||||
Zeek deployments, nodes may be distributed across multiple physical
|
||||
systems for scaling.
|
||||
|
||||
Currently, a single Manager node in a Zeek cluster exists. Further, connectivity
|
||||
between nodes is determined statically based on their type:
|
||||
|
||||
- Every node connects to all loggers and the manager.
|
||||
|
||||
- Each worker connects to all proxies.
|
||||
|
||||
|
||||
.. figure:: broker/cluster-layout.png
|
||||
|
||||
Some general suggestions as to the purpose/utilization of each node type:
|
||||
|
||||
- Workers: are a good first choice for doing the brunt of any work you need
|
||||
done. They should be spending a lot of time performing the actual job
|
||||
of parsing/analyzing incoming data from packets, so you might choose
|
||||
to look at them as doing a "first pass" analysis and then deciding how
|
||||
the results should be shared with other nodes in the cluster.
|
||||
|
||||
- Proxies: serve as intermediaries for data storage and work/calculation
|
||||
offloading. Good for helping offload work or data in a scalable and
|
||||
distributed way. Since any given worker is connected to all
|
||||
proxies and can agree on an "arbitrary key -> proxy node" mapping
|
||||
(more on that later), you can partition work or data amongst them in a
|
||||
uniform manner. e.g. you might choose to use proxies as a method of
|
||||
sharing non-persistent state or as a "second pass" analysis for any
|
||||
work that you don't want interfering with the workers' capacity to
|
||||
keep up with capturing and parsing packets. Note that the default scripts
|
||||
that come with Zeek make minimal use of proxies, so if you are coming
|
||||
from a previous ZeekControl deployment, you may want to try reducing down
|
||||
to a single proxy node. If you come to have custom/community scripts
|
||||
that utilize proxies, that would be the time to start considering scaling
|
||||
up the number of proxies to meet demands.
|
||||
|
||||
- Manager: this node will be good at performing decisions that require a
|
||||
global view of things since it is in a centralized location, connected
|
||||
to everything. However, that also makes it easy to overload, so try
|
||||
to use it sparingly and only for tasks that must be done in a
|
||||
centralized or authoritative location. Optionally, for some
|
||||
deployments, the Manager can also serve as the sole Logger.
|
||||
|
||||
- Loggers: these nodes should simply be spending their time writing out
|
||||
logs to disk and not used for much else. In the default cluster
|
||||
configuration, logs get distributed among available loggers in a
|
||||
round-robin fashion, providing failover capability should any given
|
||||
logger temporarily go offline.
|
||||
|
||||
Data Management/Sharing Strategies
|
||||
==================================
|
||||
|
||||
There is perhaps no single best approach or pattern to use when you need a
|
||||
Zeek script to store or share long-term state and data. The two
|
||||
approaches that were previously used were either using the ``&synchronized``
|
||||
attribute on tables/sets or by explicitly sending events to specific
|
||||
nodes on which you wanted data to be stored. The former is no longer
|
||||
possible, though there are several new possibilities that the new
|
||||
Broker/Cluster framework offer, namely distributed data store and data
|
||||
partitioning APIs.
|
||||
|
||||
Data Stores
|
||||
-----------
|
||||
|
||||
Broker provides a distributed key-value store interface with optional
|
||||
choice of using a persistent backend. For more detail, see
|
||||
:ref:`this example <data_store_example>`.
|
||||
|
||||
Some ideas/considerations/scenarios when deciding whether to use
|
||||
a data store for your use-case:
|
||||
|
||||
* If you need the full data set locally in order to achieve low-latency
|
||||
queries using data store "clones" can provide that.
|
||||
|
||||
* If you need data that persists across restarts of Zeek processes, then
|
||||
data stores can also provide that.
|
||||
|
||||
* If the data you want to store is complex (tables, sets, records) or
|
||||
you expect to read, modify, and store back, then data stores may not
|
||||
be able to provide simple, race-free methods of performing the pattern
|
||||
of logic that you want.
|
||||
|
||||
* If the data set you want to store is excessively large, that's still
|
||||
problematic even for stores that use a persistent backend as they are
|
||||
implemented in a way that requires a full snapshot of the store's
|
||||
contents to fit in memory (this limitation may change in the future).
|
||||
|
||||
Data Partitioning
|
||||
-----------------
|
||||
|
||||
New data partitioning strategies are available using the API in
|
||||
:doc:`/scripts/base/frameworks/cluster/pools.zeek`. Using that API, developers
|
||||
of custom Zeek scripts can define a custom pool of nodes that best fits the
|
||||
needs of their script.
|
||||
|
||||
One example strategy is to use Highest Random Weight (HRW) hashing to
|
||||
partition data tables amongst the pool of all proxy nodes. e.g. using
|
||||
:zeek:see:`Cluster::publish_hrw`. This could allow clusters to
|
||||
be scaled more easily than the approach of "the entire data set gets
|
||||
synchronized to all nodes" as the solution to memory limitations becomes
|
||||
"just add another proxy node". It may also take away some of the
|
||||
messaging load that used to be required to synchronize data sets across
|
||||
all nodes.
|
||||
|
||||
The tradeoff of this approach, is that nodes that leave the pool (due to
|
||||
crashing, etc.) cause a temporary gap in the total data set until
|
||||
workers start hashing keys to a new proxy node that is still alive,
|
||||
causing data to now be located and updated there.
|
||||
|
||||
If the developer of a script expects its workload to be particularly
|
||||
intensive, wants to ensure that their operations get exclusive
|
||||
access to nodes, or otherwise set constraints on the number of nodes within
|
||||
a pool utilized by their script, then the :zeek:see:`Cluster::PoolSpec`
|
||||
structure will allow them to do that while still allowing users of that script
|
||||
to override the default suggestions made by the original developer.
|
||||
|
||||
Broker Framework Examples
|
||||
=========================
|
||||
|
||||
The broker framework provides basic facilities for connecting Zeek instances
|
||||
to each other and exchanging messages, like events or logs.
|
||||
|
||||
See :doc:`/scripts/base/frameworks/broker/main.zeek` for an overview
|
||||
of the main Broker API.
|
||||
|
||||
.. _broker_topic_naming:
|
||||
|
||||
Topic Naming Conventions
|
||||
------------------------
|
||||
|
||||
All Broker-based messaging involves two components: the information you
|
||||
want to send (e.g. an event w/ its arguments) along with an associated
|
||||
topic name string. The topic strings are used as a filtering mechanism:
|
||||
Broker uses a publish/subscribe communication pattern where peers
|
||||
advertise interest in topic **prefixes** and only receive messages which
|
||||
match one of their prefix subscriptions.
|
||||
|
||||
Broker itself supports arbitrary topic strings, however Zeek generally
|
||||
follows certain conventions in choosing these topics to help avoid
|
||||
conflicts and generally make them easier to remember.
|
||||
|
||||
As a reminder of how topic subscriptions work, subscribers advertise
|
||||
interest in a topic **prefix** and then receive any messages published by a
|
||||
peer to a topic name that starts with that prefix. E.g. Alice
|
||||
subscribes to the "alice/dogs" prefix, then would receive the following
|
||||
message topics published by Bob:
|
||||
|
||||
- topic "alice/dogs/corgi"
|
||||
- topic "alice/dogs"
|
||||
- topic "alice/dogsarecool/oratleastilikethem"
|
||||
|
||||
Alice would **not** receive the following message topics published by Bob:
|
||||
|
||||
- topic "alice/cats/siamese"
|
||||
- topic "alice/cats"
|
||||
- topic "alice/dog"
|
||||
- topic "alice"
|
||||
|
||||
Note that the topics aren't required to form a slash-delimited hierarchy;
the subscription matching is purely a byte-by-byte prefix comparison.
|
||||
|
||||
However, Zeek scripts generally will follow a topic naming hierarchy and
|
||||
any given script will make the topic names it uses apparent via some
|
||||
redef'able constant in its export section. Generally topics that Zeek
|
||||
scripts use will be along the lines of :samp:`zeek/{<namespace>}/{<specifics>}`
|
||||
with :samp:`{<namespace>}` being the script's module name (in all-undercase).
|
||||
For example, you might expect an imaginary ``Pretend`` framework to
|
||||
publish/subscribe using topic names like ``zeek/pretend/my_cool_event``.
|
||||
For scripts that use Broker as a means of cluster-aware analysis,
|
||||
it's usually sufficient for them to make use of the topics declared
|
||||
by the cluster framework. For scripts that are meant to establish
|
||||
communication flows unrelated to Zeek cluster, new topics are declared
|
||||
(examples being the NetControl and Control frameworks).
|
||||
|
||||
For cluster operation, see :doc:`/scripts/base/frameworks/cluster/main.zeek`
|
||||
for a list of topics that are useful for steering published events to
|
||||
the various node classes. E.g. you have the ability to broadcast
|
||||
to all nodes of a given class (e.g. just workers) or just send to a
|
||||
specific node within a class.
|
||||
|
||||
The topic names that logs get published under are a bit nuanced. In the
|
||||
default cluster configuration, they are round-robin published to
|
||||
explicit topic names that identify a single logger. In standalone Zeek
|
||||
processes, logs get published to the topic indicated by
|
||||
:zeek:see:`Broker::default_log_topic_prefix`.
|
||||
|
||||
For those writing their own scripts which need new topic names, a
|
||||
suggestion would be to avoid prefixing any new topics/prefixes with
|
||||
``zeek/`` as any changes in scripts shipping with Zeek will use that prefix
|
||||
and it's better to not risk unintended conflicts. Again, it's
|
||||
often less confusing to just re-use existing topic names instead
|
||||
of introducing new topic names. The typical use case is writing
|
||||
a cluster-enabled script, which usually just needs to route events
|
||||
based upon node classes, and that already has usable topics in the
|
||||
cluster framework.
|
||||
|
||||
Connecting to Peers
|
||||
-------------------
|
||||
|
||||
Zeek can accept incoming connections by calling :zeek:see:`Broker::listen`.
|
||||
|
||||
.. literalinclude:: broker/connecting-listener.zeek
|
||||
:caption: connecting-listener.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
Zeek can initiate outgoing connections by calling :zeek:see:`Broker::peer`.
|
||||
|
||||
.. literalinclude:: broker/connecting-connector.zeek
|
||||
:caption: connecting-connector.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
In either case, connection status updates are monitored via the
|
||||
:zeek:see:`Broker::peer_added` and :zeek:see:`Broker::peer_lost` events.
|
||||
|
||||
Remote Events
|
||||
-------------
|
||||
|
||||
To receive remote events, you need to first subscribe to a "topic" to which
|
||||
the events are being sent. A topic is just a string chosen by the sender,
|
||||
and named in a way that helps organize events into various categories.
|
||||
See the :ref:`topic naming conventions section <broker_topic_naming>` for
|
||||
more on how topics work and are chosen.
|
||||
|
||||
Use the :zeek:see:`Broker::subscribe` function to subscribe to topics and
|
||||
define any event handlers for events that peers will send.
|
||||
|
||||
.. literalinclude:: broker/events-listener.zeek
|
||||
:caption: events-listener.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
To send an event, call the :zeek:see:`Broker::publish` function which you can
|
||||
supply directly with the event and its arguments or give it the return value of
|
||||
:zeek:see:`Broker::make_event` in case you need to send the same event/args
|
||||
multiple times. When publishing events like this, local event handlers for
|
||||
the event are not called, even if a matching subscription exists.
|
||||
|
||||
.. literalinclude:: broker/events-connector.zeek
|
||||
:caption: events-connector.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
Note that the subscription model is prefix-based, meaning that if you subscribe
|
||||
to the ``zeek/events`` topic prefix you would receive events that are published
|
||||
to topic names ``zeek/events/foo`` and ``zeek/events/bar`` but not
|
||||
``zeek/misc``.
|
||||
|
||||
.. note::
|
||||
|
||||
In prior Zeek versions, ``Broker::auto_publish`` was available to automatically
|
||||
send events to peers whenever the events were called locally via the normal
|
||||
event invocation syntax. When auto-publishing events, local event handlers for
|
||||
the event were called in addition to sending the event to any subscribed peers.
|
||||
|
||||
``Broker::auto_publish`` was removed due to its
|
||||
`implicit nature <https://github.com/zeek/zeek/discussions/3637>`_.
|
||||
|
||||
|
||||
Remote Logging
|
||||
--------------
|
||||
|
||||
.. literalinclude:: broker/testlog.zeek
|
||||
:caption: testlog.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
To toggle remote logs, redef :zeek:see:`Log::enable_remote_logging`.
|
||||
Use the :zeek:see:`Broker::subscribe` function to advertise interest
|
||||
in logs written by peers. The topic names that Zeek uses are determined by
|
||||
:zeek:see:`Broker::log_topic`.
|
||||
|
||||
.. literalinclude:: broker/logs-listener.zeek
|
||||
:caption: logs-listener.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
.. literalinclude:: broker/logs-connector.zeek
|
||||
:caption: logs-connector.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
Note that logging events are only raised locally on the node that performs
|
||||
the :zeek:see:`Log::write` and not automatically published to peers.
|
||||
|
||||
.. _data_store_example:
|
||||
|
||||
Distributed Data Stores
|
||||
-----------------------
|
||||
|
||||
See :doc:`/scripts/base/frameworks/broker/store.zeek` for an overview
|
||||
of the Broker data store API.
|
||||
|
||||
There are two flavors of key-value data store interfaces: master and clone.
|
||||
|
||||
A master data store can be cloned from remote peers which may then
|
||||
perform lightweight, local queries against the clone, which
|
||||
automatically stays synchronized with the master store. Clones cannot
|
||||
modify their content directly, instead they send modifications to the
|
||||
centralized master store which applies them and then broadcasts them to
|
||||
all clones.
|
||||
|
||||
Master stores get to choose what type of storage backend to
|
||||
use. E.g. In-memory versus SQLite for persistence.
|
||||
|
||||
Data stores also support expiration on a per-key basis using an amount of
|
||||
time relative to the entry's last modification time.
|
||||
|
||||
.. literalinclude:: broker/stores-listener.zeek
|
||||
:caption: stores-listener.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
.. literalinclude:: broker/stores-connector.zeek
|
||||
:caption: stores-connector.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
Note that all data store queries must be made within Zeek's asynchronous
|
||||
``when`` statements and must specify a timeout block.
|
||||
|
||||
|
||||
SQLite Data Store Tuning
|
||||
^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
When leveraging the SQLite backend for persistence, SQLite's default journaling
|
||||
and consistency settings are used. Concretely, ``journal_mode`` is set to
|
||||
``DELETE`` and ``synchronous`` to ``FULL``. This in turn is not optimal for
|
||||
`high INSERT or UPDATE rates <https://www.sqlite.org/faq.html#q19>`_
|
||||
due to SQLite waiting for the required IO to complete until data is safely
|
||||
on disk. This can also have a non-negligible system effect when the
|
||||
SQLite database is located on the same device as other IO critical processes.
|
||||
|
||||
Starting with Zeek 5.2, it is possible to tune and relax these settings by
|
||||
providing an appropriate :zeek:see:`Broker::BackendOptions` and
|
||||
:zeek:see:`Broker::SQLiteOptions` instance to
|
||||
:zeek:see:`Broker::create_master`. The following example changes the
|
||||
data store to use `Write-Ahead Logging <https://www.sqlite.org/wal.html>`_
|
||||
which should perform significantly faster than the default.
|
||||
|
||||
|
||||
.. literalinclude:: broker/store-sqlite-tuning.zeek
|
||||
:caption: store-sqlite-tuning.zeek
|
||||
:language: zeek
|
||||
:linenos:
|
||||
:tab-width: 4
|
||||
|
||||
If your use-case turns out to require more and lower-level tuning around
|
||||
SQLite options, please get in contact or open a feature request on GitHub.
|
||||
|
||||
|
||||
Cluster Framework Examples
|
||||
==========================
|
||||
|
||||
This section contains a few brief examples of how various communication
|
||||
patterns one might use when developing Zeek scripts that are to operate in
|
||||
the context of a cluster.
|
||||
|
||||
.. _event-namespacing-pitfall:
|
||||
|
||||
A Reminder About Events and Module Namespaces
|
||||
---------------------------------------------
|
||||
|
||||
For simplicity, the following examples do not use any modules/namespaces.
|
||||
If you choose to use them within your own code, it's important to
|
||||
remember that the ``event`` and ``schedule`` dispatching statements
|
||||
should always use the fully-qualified event name.
|
||||
|
||||
For example, this will likely not work as expected:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module MyModule;
|
||||
|
||||
export {
|
||||
global my_event: event();
|
||||
}
|
||||
|
||||
event my_event()
|
||||
{
|
||||
print "got my event";
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
event my_event();
|
||||
schedule 10sec { my_event() };
|
||||
}
|
||||
|
||||
This code runs without errors, however, the local ``my_event`` handler
|
||||
will never be called, nor will any remote handlers. Instead, at a
minimum you would need to change the ``zeek_init()`` handler:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
event MyModule::my_event();
|
||||
schedule 10sec { MyModule::my_event() };
|
||||
}
|
||||
|
||||
As an easy rule of thumb, always use the
explicit module namespace scoping and you can't go wrong:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module MyModule;
|
||||
|
||||
export {
|
||||
global MyModule::my_event: event();
|
||||
}
|
||||
|
||||
event MyModule::my_event()
|
||||
{
|
||||
print "got my event";
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
event MyModule::my_event();
|
||||
schedule 10sec { MyModule::my_event() };
|
||||
}
|
||||
|
||||
Event types that reside in the default namespace (such as :zeek:id:`zeek_init` or
|
||||
:zeek:id:`connection_established`) require no qualification, even when scheduled from
|
||||
inside a module. Don't force qualification of such events by prefixing with
|
||||
``GLOBAL::``.
|
||||
|
||||
Note that other identifiers in Zeek do not have this inconsistency
|
||||
related to module namespacing, it's just events that require
|
||||
explicitness.
|
||||
|
||||
Manager Sending Events To Workers
|
||||
---------------------------------
|
||||
|
||||
This is fairly straightforward, we just need a topic name which we know
|
||||
all workers are subscribed, combined with the event we want to send them.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event manager_to_workers(s: string)
|
||||
{
|
||||
print "got event from manager", s;
|
||||
}
|
||||
|
||||
event some_event_handled_on_manager()
|
||||
{
|
||||
Broker::publish(Cluster::worker_topic, manager_to_workers,
|
||||
"hello v0");
|
||||
|
||||
# If you know this event is only handled on the manager, you don't
|
||||
# need any of the following conditions, they're just here as an
|
||||
# example of how you can further discriminate based on node identity.
|
||||
|
||||
# Can check based on the name of the node.
|
||||
if ( Cluster::node == "manager" )
|
||||
Broker::publish(Cluster::worker_topic, manager_to_workers,
|
||||
"hello v1");
|
||||
|
||||
# Can check based on the type of the node.
|
||||
if ( Cluster::local_node_type() == Cluster::MANAGER )
|
||||
Broker::publish(Cluster::worker_topic, manager_to_workers,
|
||||
"hello v2");
|
||||
|
||||
# The run-time overhead of the above conditions can even be
|
||||
# eliminated by using the following conditional directives.
|
||||
# It's evaluated once per node at parse-time and, if false,
|
||||
# any code within is just ignored / treated as not existing at all.
|
||||
@if ( Cluster::local_node_type() == Cluster::MANAGER )
|
||||
Broker::publish(Cluster::worker_topic, manager_to_workers,
|
||||
"hello v3");
|
||||
@endif
|
||||
}
|
||||
|
||||
Worker Sending Events To Manager
|
||||
--------------------------------
|
||||
|
||||
This should look almost identical to the previous case of sending an event
|
||||
from the manager to workers, except it simply changes the topic name to
|
||||
one to which the manager is subscribed.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event worker_to_manager(worker_name: string)
|
||||
{
|
||||
print "got event from worker", worker_name;
|
||||
}
|
||||
|
||||
event some_event_handled_on_worker()
|
||||
{
|
||||
Broker::publish(Cluster::manager_topic, worker_to_manager,
|
||||
Cluster::node);
|
||||
}
|
||||
|
||||
Worker Sending Events To All Workers
|
||||
------------------------------------
|
||||
|
||||
Since workers are not directly connected to each other in the cluster
|
||||
topology, this type of communication is a bit different than what we
|
||||
did before since we have to manually relay the event via some node that *is*
|
||||
connected to all workers. The manager or a proxy satisfies that requirement:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event worker_to_workers(worker_name: string)
|
||||
{
|
||||
@if ( Cluster::local_node_type() == Cluster::MANAGER ||
|
||||
Cluster::local_node_type() == Cluster::PROXY )
|
||||
Broker::publish(Cluster::worker_topic, worker_to_workers,
|
||||
worker_name);
|
||||
@else
|
||||
print "got event from worker", worker_name;
|
||||
@endif
|
||||
}
|
||||
|
||||
event some_event_handled_on_worker()
|
||||
{
|
||||
# We know the manager is connected to all workers, so we could
|
||||
# choose to relay the event across it.
|
||||
Broker::publish(Cluster::manager_topic, worker_to_workers,
|
||||
Cluster::node + " (via manager)");
|
||||
|
||||
# We also know that any given proxy is connected to all workers,
|
||||
# though now we have a choice of which proxy to use. If we
|
||||
# want to distribute the work associated with relaying uniformly,
|
||||
# we can use a round-robin strategy. The key used here is simply
|
||||
# used by the cluster framework internally to keep track of
|
||||
# which node is up next in the round-robin.
|
||||
local pt = Cluster::rr_topic(Cluster::proxy_pool, "example_key");
|
||||
Broker::publish(pt, worker_to_workers,
|
||||
Cluster::node + " (via a proxy)");
|
||||
}
|
||||
|
||||
Worker Distributing Events Uniformly Across Proxies
|
||||
---------------------------------------------------
|
||||
|
||||
If you want to offload some data/work from a worker to your proxies,
|
||||
we can make use of a `Highest Random Weight (HRW) hashing
|
||||
<https://en.wikipedia.org/wiki/Rendezvous_hashing>`_ distribution strategy
|
||||
to uniformly map an arbitrary key space across all available proxies.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event worker_to_proxies(worker_name: string)
|
||||
{
|
||||
print "got event from worker", worker_name;
|
||||
}
|
||||
|
||||
global my_counter = 0;
|
||||
|
||||
event some_event_handled_on_worker()
|
||||
{
|
||||
# The key here is used to choose which proxy shall receive
|
||||
# the event. Different keys may map to different nodes, but
|
||||
# any given key always maps to the same node provided the
|
||||
# pool of nodes remains consistent. If a proxy goes offline,
|
||||
# that key maps to a different node until the original comes
|
||||
# back up.
|
||||
Cluster::publish_hrw(Cluster::proxy_pool,
|
||||
cat("example_key", ++my_counter),
|
||||
worker_to_proxies, Cluster::node);
|
||||
}
|
||||
|
||||
Broker-backed Zeek Tables for Data Synchronization and Persistence
|
||||
==================================================================
|
||||
|
||||
Starting with Zeek 3.2, it is possible to "bind" a Zeek table to a backing
|
||||
Broker store. Changes to the Zeek table are sent to the Broker store. Similarly,
|
||||
changes of the Broker store are applied to the Zeek table.
|
||||
|
||||
This feature allows easy distribution of table contents across a cluster.
|
||||
It also offers persistence for tables (when using a persistent Broker store
|
||||
backend like SQLite).
|
||||
|
||||
To give a short example, to distribute a table over a cluster you can use
|
||||
the :zeek:attr:`&backend` attribute.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
global t: table[string] of count &backend=Broker::MEMORY;
|
||||
|
||||
The :zeek:attr:`&backend` attribute creates a master data store on the
|
||||
manager and a clone data store on all other nodes in the cluster. This
|
||||
in essence means that the table exists twice in each Zeek process. One
|
||||
copy of the table is contained in a Broker data store (either a master
|
||||
or a clone depending on the node), which data store distributes the
|
||||
data across the cluster---and, depending on the backend, might also
|
||||
make the data persistent. Since Broker data stores are only accessible
|
||||
via asynchronous operations, and accessing them might not always be
|
||||
immediate, a second copy of the table, which is immediately
|
||||
accessible, is held inside the Zeek core. This is the copy that you
|
||||
see and interact with on the Zeek side.
|
BIN
doc/frameworks/broker/cluster-layout.png
Normal file
BIN
doc/frameworks/broker/cluster-layout.png
Normal file
Binary file not shown.
After Width: | Height: | Size: 55 KiB |
2
doc/frameworks/broker/cluster-layout.xml
Normal file
2
doc/frameworks/broker/cluster-layout.xml
Normal file
|
@ -0,0 +1,2 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
|
||||
<mxfile userAgent="Mozilla/5.0 (Macintosh; Intel Mac OS X 10_13_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/68.0.3440.84 Safari/537.36" version="9.0.3-1" editor="www.draw.io" type="device"><diagram name="Page-1" id="42789a77-a242-8287-6e28-9cd8cfd52e62">7VxLc6M4EP41Po4LSUjAcZJJZg+7VVOVrd3ZowwKZgYjFyaxvb9+hZEwEhA/eITs2JdYrZYE0ve1ultyZuh+tfua0vXyDx6weAatYDdDX2ZQfDxL/Mkl+0Li2G4hCNMoKETgKHiK/mVSKNuFL1HANppixnmcRWtd6PMkYX6myWia8q2u9sxjfdQ1DVlN8OTTuC79OwqypZQCyzpW/MaicCmHdrGsWFD/Z5jyl0SON4Po+fApqldU9SX1N0sa8G1FhB5m6D7lPCu+rXb3LM7nVk1b0e6xpbZ87pQl2VkNGEXAcTwrgD71XPQJoKKLVxq/MPUOhyfN9mp2WCAmSxYTnog/d4dXZnmnQJSW2SqWX2O6YPFdOSv3PObpsdkmo2n2OV8wQ/YYxXkPlipLiGBRZkmgWvgx3Wwi/89llBQVshkoSpVGP1iW7WWZvmRciHiaLXnIExr/zvlattpkKf/J1FOK1fOIgz6TskahIdd95kn2SFdRnIP8L5YGNKFSLEcCUJYrHVqHj5An/KEyj4dH3kXZ9/yt51iW/pFzcHxWqVpfZ7n0G/6S+qxtcSWVaBqyrEXHK3TyNa50LNHzlfEVy9K9UEhZTLPoVScMlbwLSz3ZVKwY3VcU1jxKsk2l52+5QCgoE6KYJg0IcqCOY1MfQTFp1Ra2bVdbiC/FM6hS5WWOogM7zmWKfWPKL80UNAmmAHIZUwB0RmdKjSgrAYCQpTNIYjG7d4v8W5iVq1VlUByLTT9H+3YZZexpTQ9rthV+h06fI68OVFD7al7l81Xky4pTLGsANW0BtWBQRZOBADOnO9hpHIVJzliBVzFDbwD4laUZ270JPVWL9BVHyrpuj86NctmWFbdGQasJrBW4XIYG2GA2Cxhs1jRRQFinfLf/BJsQUkjEuFX9qQEncLyFZZ0DnOdnRnx/msCBUAcOwHXgOLgOHDwEcJo80zpwYh4Ky5LbnI+BE7Ig+CwDI4IIOFWcePoeZJN3hIlXg4mERIN7dlv7HjYXD7/b4t+CVQ1QXxzvrm3T6Qac0uGuuNvFg4sV+14tKEe87rT35JrDM1xzMIhrXvOlbYLmnmMjDCxgI9dBjsYED84RJB7GmCAHQ7334h1lh29Fth6YE9GLhRwxAlbOerkj2/Y8790Rr01sYBFjmGKaasO0Rxka9S5z/JsC4jbPDtw8u3e12kbUOKZjh29Ge1yjrTImNaNtDWW07enYaAKN/Agi1xlirLwN1RExOhrT1JIbh0biUMmVObIcjS9zizRSpjk52UimQ2ffWBqJpc8t+2Eqe2PYMKn8GjGQbTAM4OsYZqO+GdaSArWMiAVoh2SdE6DOjZwjRyU1plVoS1yDtfC8je56bl4VsgxzmlAnK3J1jlnOdWRFjt4RgEZHPZEV4mHJqixphZx63FBhYnu0ezU57lxs42ZyNMXcBdL7ctO8Oi7tcWBonu/a5lFDCwwvNvVQD5e9nsFDLrPsJp5OOeij4GxANE30dgFCRvRrGbdkTuirMHgo/d5tnNsNpsfNFI9q+Grb+phQhSNZQqLvo90tYYewEoFuQGmwZxXM1C3avJNjORGbNo17IMjM6J2yaeRCG9VR37BpdR4YUSS2+7WB9WPBpuT0lqc/i6PCD5qdXrRzwsxOuz6bana6TBKPcYAMG5BxC9ff4xDRmtumfzFooH5OEu0WlzeP4wwblt/uoU/nlGhOiJn5nmYObaSEN1Fucpnwdq/jKnb1jgA09rO+c
mjuwDk0XOPmFTHCIKHk4EedgJwBzJFiSdfMqoGB8KTOUAfKqjmXmfoWhNXzpu8UabaA8PBI/WFsJOMHjPN0bOYrumLsVPx6Kv48s/5UPFp7z57jURWQdgX5W0dfo2TrhjSkw5xGDJM6s/pZT2M1p2WyejVYI0VW4NRRU0+b4qVnChem0zqp9x6dNd0/as2mfdy7nv+PbNqYv8ZoSrP+wmH7G1Z4oGTamCcfI13hhMZ9rauvcNrmTTUT8n1dMDN+EmPsBd19x/ovam8sGzU5dpELNUc5UrT8WemZX5ccO8e9Gomc5W1P5Wp4BqfOJWf5EwTl4pgd9UVO0is5RfH471oK9eP/xEEP/wE=</diagram></mxfile>
|
12
doc/frameworks/broker/connecting-connector.zeek
Normal file
12
doc/frameworks/broker/connecting-connector.zeek
Normal file
|
@ -0,0 +1,12 @@
|
|||
redef exit_only_after_terminate = T;
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::peer("127.0.0.1");
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added", endpoint;
|
||||
terminate();
|
||||
}
|
17
doc/frameworks/broker/connecting-listener.zeek
Normal file
17
doc/frameworks/broker/connecting-listener.zeek
Normal file
|
@ -0,0 +1,17 @@
|
|||
redef exit_only_after_terminate = T;
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::listen("127.0.0.1");
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added", endpoint;
|
||||
}
|
||||
|
||||
event Broker::peer_lost(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer lost", endpoint;
|
||||
terminate();
|
||||
}
|
26
doc/frameworks/broker/events-connector.zeek
Normal file
26
doc/frameworks/broker/events-connector.zeek
Normal file
|
@ -0,0 +1,26 @@
|
|||
redef exit_only_after_terminate = T;
|
||||
global my_event: event(msg: string, c: count);
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::peer("127.0.0.1");
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added", endpoint;
|
||||
Broker::publish("zeek/event/my_event", my_event, "hi", 0);
|
||||
Broker::publish("zeek/event/my_event", my_event, "...", 1);
|
||||
local e = Broker::make_event(my_event, "bye", 2);
|
||||
Broker::publish("zeek/event/my_event", e);
|
||||
}
|
||||
|
||||
event Broker::peer_lost(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
terminate();
|
||||
}
|
||||
|
||||
event my_event(msg: string, c: count)
|
||||
{
|
||||
print "got my_event", msg, c;
|
||||
}
|
24
doc/frameworks/broker/events-listener.zeek
Normal file
24
doc/frameworks/broker/events-listener.zeek
Normal file
|
@ -0,0 +1,24 @@
|
|||
redef exit_only_after_terminate = T;
|
||||
global msg_count = 0;
|
||||
global my_event: event(msg: string, c: count);
|
||||
global my_auto_event: event(msg: string, c: count);
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::subscribe("zeek/event/");
|
||||
Broker::listen("127.0.0.1");
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added", endpoint;
|
||||
}
|
||||
|
||||
event my_event(msg: string, c: count)
|
||||
{
|
||||
++msg_count;
|
||||
print "got my_event", msg, c;
|
||||
|
||||
if ( msg_count == 5 )
|
||||
terminate();
|
||||
}
|
36
doc/frameworks/broker/logs-connector.zeek
Normal file
36
doc/frameworks/broker/logs-connector.zeek
Normal file
|
@ -0,0 +1,36 @@
|
|||
@load ./testlog
|
||||
|
||||
redef exit_only_after_terminate = T;
|
||||
global n = 0;
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::peer("127.0.0.1");
|
||||
}
|
||||
|
||||
event do_write()
|
||||
{
|
||||
if ( n == 6 )
|
||||
return;
|
||||
|
||||
Log::write(Test::LOG, [$msg = "ping", $num = n]);
|
||||
++n;
|
||||
event do_write();
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added", endpoint;
|
||||
event do_write();
|
||||
}
|
||||
|
||||
event Broker::peer_lost(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
terminate();
|
||||
}
|
||||
|
||||
event Test::log_test(rec: Test::Info)
|
||||
{
|
||||
print "wrote log", rec;
|
||||
Broker::publish("zeek/logs/forward/test", Test::log_test, rec);
|
||||
}
|
22
doc/frameworks/broker/logs-listener.zeek
Normal file
22
doc/frameworks/broker/logs-listener.zeek
Normal file
|
@ -0,0 +1,22 @@
|
|||
@load ./testlog
|
||||
|
||||
redef exit_only_after_terminate = T;
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::subscribe("zeek/logs");
|
||||
Broker::listen("127.0.0.1");
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added", endpoint;
|
||||
}
|
||||
|
||||
event Test::log_test(rec: Test::Info)
|
||||
{
|
||||
print "got log event", rec;
|
||||
|
||||
if ( rec$num == 5 )
|
||||
terminate();
|
||||
}
|
19
doc/frameworks/broker/store-sqlite-tuning.zeek
Normal file
19
doc/frameworks/broker/store-sqlite-tuning.zeek
Normal file
|
@ -0,0 +1,19 @@
|
|||
global h: opaque of Broker::Store;
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
# Use WAL mode.
|
||||
local sqlite_options=Broker::SQLiteOptions(
|
||||
$synchronous=Broker::SQLITE_SYNCHRONOUS_NORMAL,
|
||||
$journal_mode=Broker::SQLITE_JOURNAL_MODE_WAL,
|
||||
);
|
||||
local options = Broker::BackendOptions($sqlite=sqlite_options);
|
||||
h = Broker::create_master("persistent-store", Broker::SQLITE, options);
|
||||
|
||||
local c = 1000;
|
||||
while (c > 0)
|
||||
{
|
||||
Broker::put(h, cat(c), rand(10000));
|
||||
--c;
|
||||
}
|
||||
}
|
29
doc/frameworks/broker/stores-connector.zeek
Normal file
29
doc/frameworks/broker/stores-connector.zeek
Normal file
|
@ -0,0 +1,29 @@
|
|||
redef exit_only_after_terminate = T;
|
||||
|
||||
global h: opaque of Broker::Store;
|
||||
|
||||
global ready: event();
|
||||
|
||||
event Broker::peer_lost(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
terminate();
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
h = Broker::create_master("mystore");
|
||||
|
||||
local myset: set[string] = {"a", "b", "c"};
|
||||
local myvec: vector of string = {"alpha", "beta", "gamma"};
|
||||
Broker::put(h, "one", 110);
|
||||
Broker::put(h, "two", 223);
|
||||
Broker::put(h, "myset", myset);
|
||||
Broker::put(h, "myvec", myvec);
|
||||
Broker::increment(h, "one");
|
||||
Broker::decrement(h, "two");
|
||||
Broker::insert_into_set(h, "myset", "d");
|
||||
Broker::remove_from(h, "myset", "b");
|
||||
Broker::push(h, "myvec", "delta");
|
||||
|
||||
Broker::peer("127.0.0.1");
|
||||
}
|
79
doc/frameworks/broker/stores-listener.zeek
Normal file
79
doc/frameworks/broker/stores-listener.zeek
Normal file
|
@ -0,0 +1,79 @@
|
|||
redef exit_only_after_terminate = T;
|
||||
|
||||
global h: opaque of Broker::Store;
|
||||
global expected_key_count = 4;
|
||||
global key_count = 0;
|
||||
|
||||
# Lookup a value in the store based on an arbitrary key string.
|
||||
function do_lookup(key: string)
|
||||
{
|
||||
when ( local res = Broker::get(h, key) )
|
||||
{
|
||||
++key_count;
|
||||
print "lookup", key, res;
|
||||
|
||||
# End after we iterated over looking up each key in the store twice.
|
||||
if ( key_count == expected_key_count * 2 )
|
||||
terminate();
|
||||
}
|
||||
# All data store queries must specify a timeout
|
||||
timeout 3sec
|
||||
{ print "timeout", key; }
|
||||
}
|
||||
|
||||
event check_keys()
|
||||
{
|
||||
# Here we just query for the list of keys in the store, and show how to
|
||||
# look up each one's value.
|
||||
when ( local res = Broker::keys(h) )
|
||||
{
|
||||
print "clone keys", res;
|
||||
|
||||
if ( res?$result )
|
||||
{
|
||||
# Since we know that the keys we are storing are all strings,
|
||||
# we can conveniently cast the result of Broker::keys to
|
||||
# a native Zeek type, namely 'set[string]'.
|
||||
for ( k in res$result as string_set )
|
||||
do_lookup(k);
|
||||
|
||||
# Alternatively, we can use a generic iterator to iterate
|
||||
# over the results (which we know is of the 'set' type because
|
||||
# that's what Broker::keys() always returns). If the keys
|
||||
# we stored were not all of the same type, then you would
|
||||
# likely want to use this method of inspecting the store's keys.
|
||||
local i = Broker::set_iterator(res$result);
|
||||
|
||||
while ( ! Broker::set_iterator_last(i) )
|
||||
{
|
||||
do_lookup(Broker::set_iterator_value(i) as string);
|
||||
Broker::set_iterator_next(i);
|
||||
}
|
||||
}
|
||||
}
|
||||
# All data store queries must specify a timeout.
|
||||
# You also might see timeouts on connecting/initializing a clone since
|
||||
# it hasn't had time to get fully set up yet.
|
||||
timeout 1sec
|
||||
{
|
||||
print "timeout";
|
||||
schedule 1sec { check_keys() };
|
||||
}
|
||||
}
|
||||
|
||||
event Broker::peer_added(endpoint: Broker::EndpointInfo, msg: string)
|
||||
{
|
||||
print "peer added";
|
||||
# We could create a clone early, like in zeek_init and it will periodically
|
||||
# try to synchronize with its master once it connects, however, we just
|
||||
# create it now since we know the peer w/ the master store has just
|
||||
# connected.
|
||||
h = Broker::create_clone("mystore");
|
||||
|
||||
event check_keys();
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Broker::listen("127.0.0.1");
|
||||
}
|
17
doc/frameworks/broker/testlog.zeek
Normal file
17
doc/frameworks/broker/testlog.zeek
Normal file
|
@ -0,0 +1,17 @@
|
|||
module Test;
|
||||
|
||||
export {
|
||||
redef enum Log::ID += { LOG };
|
||||
|
||||
type Info: record {
|
||||
msg: string &log;
|
||||
num: count &log;
|
||||
};
|
||||
|
||||
global log_test: event(rec: Test::Info);
|
||||
}
|
||||
|
||||
event zeek_init() &priority=5
|
||||
{
|
||||
Log::create_stream(Test::LOG, [$columns=Test::Info, $ev=log_test, $path="test"]);
|
||||
}
|
630
doc/frameworks/cluster.rst
Normal file
630
doc/frameworks/cluster.rst
Normal file
|
@ -0,0 +1,630 @@
|
|||
|
||||
.. _cluster-framework:
|
||||
|
||||
=================
|
||||
Cluster Framework
|
||||
=================
|
||||
|
||||
The basic premise of Zeek clusterization is to break down network traffic into
|
||||
smaller pieces, while preserving the affinity of individual network sessions to
|
||||
a single analysis process. Cluster architecture thus allows Zeek to distribute
|
||||
that analysis across many dozens or hundreds of worker processes, allowing the
|
||||
monitoring system to scale up to line speeds of 100G or more.
|
||||
|
||||
.. figure:: /images/cluster-diagram.png
|
||||
|
||||
Figure 1: Block diagram of cluster setup showing multiple network feeds to a
|
||||
traffic aggregator. This device sends traffic to workers after symmetric
|
||||
hashing/load-balancing. Traffic is then fed to the Zeek cluster using
|
||||
load-balancing network cards.
|
||||
|
||||
Zeek's Cluster Components
|
||||
=========================
|
||||
|
||||
By distributing network traffic across hosts and processes, overall traffic
|
||||
finally reaches a volume that can be effectively analyzed by a single worker
|
||||
process. Zeek then acts as a distributed network security monitor to perform
|
||||
analysis across many dozens or hundreds of workers, all acting on a small
|
||||
fraction of the overall traffic volume. The analysis of the worker process is
|
||||
further facilitated by nodes such as manager and proxies, ultimately logging
|
||||
the alerts and or relevant network logs. A Zeek cluster therefore consists of
|
||||
four main components: a manager, workers, proxies, and a logger.
|
||||
|
||||
Manager
|
||||
-------
|
||||
|
||||
The manager is a Zeek process that has two primary jobs. It normally receives
|
||||
log messages and notices from the rest of the nodes in the cluster using the
|
||||
Zeek communications protocol. It combines the individual logs that each worker
|
||||
produces, so that the result is a set of joint logs instead of many discrete
|
||||
logs that you would have to combine in some manner with post-processing. (Note
|
||||
that if you use a separate logger node, then the logger receives all logs
|
||||
instead of the manager.) The manager also supports other functionality and
|
||||
analysis which requires a centralized, global view of events or data.
|
||||
|
||||
Worker
|
||||
------
|
||||
|
||||
The worker is the Zeek process that sniffs network traffic and does protocol
|
||||
analysis on the reassembled traffic streams. Most of the work of an active
|
||||
cluster takes place on the workers. Workers typically represent the bulk of the
|
||||
Zeek processes that are running in a cluster. The fastest memory and CPU core
|
||||
speed you can afford is recommended since all of the protocol parsing and most
|
||||
analysis will take place here. There are no particular requirements for the
|
||||
disks in workers since almost all logging is done remotely to the manager (or
|
||||
dedicated logger). Normally, very little is written to disk.
|
||||
|
||||
Proxy
|
||||
-----
|
||||
|
||||
A proxy is a Zeek process that may be used to offload data storage or any
|
||||
arbitrary workload. A cluster may contain multiple proxy nodes.
|
||||
Zeek's default scripts make only minimal use of proxies.
|
||||
Custom scripts or third-party packages may exercise proxies more heavily
|
||||
to partition data or workloads, providing greater cluster scalability potential.
|
||||
The number of required proxy nodes in a cluster depends on the deployed scripts,
|
||||
cluster size and traffic characteristics. For small clusters with four or fewer workers,
|
||||
a single proxy node is usually sufficient. For larger clusters, you may want to
|
||||
closely monitor :ref:`CPU and memory usage <framework-telemetry>` of proxy
|
||||
nodes and increase their number as needed.
|
||||
|
||||
Zeek processes acting as proxies don’t tend to be extremely hard on CPU or
|
||||
memory, and users frequently run proxy processes on the same physical host as
|
||||
the manager.
|
||||
|
||||
Logger
|
||||
------
|
||||
|
||||
A logger is an optional Zeek process that receives log messages from the rest
|
||||
of the nodes in the cluster using the Zeek communications protocol. The purpose
|
||||
of having a logger to receive logs instead of the manager is to reduce the load
|
||||
on the manager. If no logger is needed, then the manager will receive logs
|
||||
instead.
|
||||
|
||||
Running a Zeek Cluster
|
||||
======================
|
||||
|
||||
Zeek Cluster Setup
|
||||
------------------
|
||||
|
||||
This :ref:`link <cluster-configuration>` describes the cluster setup in great
|
||||
detail.
|
||||
|
||||
General Usage and Deployment
|
||||
----------------------------
|
||||
|
||||
The biggest advantage to using a Zeek cluster is that most of its inner
|
||||
workings are transparent to the user. Clusterization is a clever trick to
|
||||
divide-and-conquer ever increasing network traffic volume.
|
||||
|
||||
As a practitioner one must know how to set up a cluster by defining components
|
||||
such as the manager, proxies, loggers and workers in the
|
||||
:samp:`{<prefix>}/etc/node.cfg` file on the manager.
|
||||
|
||||
Edit the ZeekControl node configuration file, :samp:`{<prefix>}/etc/node.cfg`,
|
||||
to define where the logger, manager, proxies, and workers will run. For a
|
||||
cluster configuration, comment-out (or remove) the standalone node in that
|
||||
file, and either uncomment or add node entries for each node in your cluster
|
||||
(logger, manager, proxy, and workers).
|
||||
|
||||
For example, to run five Zeek nodes (two workers, one proxy, a logger, and a
|
||||
manager) on a cluster consisting of three machines, the cluster configuration
|
||||
would look like this::
|
||||
|
||||
[logger]
|
||||
type=logger
|
||||
host=10.0.0.10
|
||||
|
||||
[manager]
|
||||
type=manager
|
||||
host=10.0.0.10
|
||||
|
||||
[proxy-1]
|
||||
type=proxy
|
||||
host=10.0.0.10
|
||||
|
||||
[worker-1]
|
||||
type=worker
|
||||
host=10.0.0.11
|
||||
interface=eth0
|
||||
|
||||
[worker-2]
|
||||
type=worker
|
||||
host=10.0.0.12
|
||||
interface=eth0
|
||||
|
||||
|
||||
To set up a cluster we need a network-aggregator/load balancing device which
|
||||
can aggregate inputs from network sources, such as taps or span ports. This
|
||||
device also performs the critical function of ensuring each TCP session is
|
||||
distributed to a single link. This function is provided through symmetric
|
||||
hashing.
|
||||
|
||||
Once the tap aggregator is set, output from each port is sent to a “Zeek node”
|
||||
which is typically built on commodity hardware. Zeek clusters have evolved from
|
||||
running the manager, workers and proxies on individual servers, to most often
|
||||
now running a “cluster-in-a-box” setup, where a powerful multi-core box with
|
||||
dedicated cores hosts the workers, proxies, logger and manager. We’ve seen
|
||||
instances of 90 workers running on a single physical server.
|
||||
|
||||
At present the preferred way to run a cluster is to use a load-balancing
|
||||
network card such as Myricom NICs or Intel cards with PF_RING or AF_PACKET
|
||||
support. The NIC (and associated software) further divides the traffic to
|
||||
multiple Zeek worker processes running on the ‘Zeek node’.
|
||||
|
||||
While the Zeek cluster allows us to monitor traffic at scale, an optional
|
||||
add-on technology called “shunting” is helpful to reduce the volume that needs
|
||||
be processed. Shunting can detect specific large data flows based on
|
||||
predetermined characteristics and communicate with the network tap via an API
|
||||
to stop sending those flows to Zeek for analysis. This allows Zeek to maintain
|
||||
awareness and logs of these shunted large flows while dramatically reducing the
|
||||
analysis load necessary to process traffic.
|
||||
|
||||
The following links gives more specific information on how to set up
|
||||
clusterization using one of the above approaches: :ref:`cluster-configuration`.
|
||||
|
||||
Developing Scripts/Heuristics
|
||||
=============================
|
||||
|
||||
This section is for developers who are interested in writing
|
||||
packages/scripts/heuristics and want to take advantage of clusterization.
|
||||
|
||||
In order to make your scripts/packages “clusterized,” one must understand the
|
||||
purpose of each of the cluster components (manager, workers, proxies and
|
||||
logger) and how/where the data is generated and how to move data/information
|
||||
across the different nodes in the cluster.
|
||||
|
||||
* **Workers**: Workers are a good first choice for doing the brunt of any work.
|
||||
They should be spending a lot of time parsing or analyzing incoming data from
|
||||
packets. You might choose them to do a “first pass” analysis and then decide
|
||||
how the results should be shared with other nodes in the cluster.
|
||||
|
||||
* **Proxies**: Proxies serve as intermediaries for data storage and computation
|
||||
offloading. Proxies help offload work or data in a scalable and distributed
|
||||
way. Since any given worker is connected to all proxies and can agree on an
|
||||
“arbitrary key -> proxy node” mapping (discussed later), you can partition
|
||||
work or data amongst them in a uniform manner. You might choose to use
|
||||
proxies as a method to share non-persistent state or as a “second pass”
|
||||
analysis for any work that you don’t want interfering with the workers’
|
||||
capacity to keep up with capturing and parsing packets. The default scripts
|
||||
that come with Zeek make minimal use of proxies. If you are migrating from a
|
||||
previous ZeekControl deployment, you may want to implement a single proxy
|
||||
node. If you have custom or community scripts that utilize proxies,
|
||||
consider scaling up the number of proxies to meet demand.
|
||||
|
||||
* **Manager**: A manager will make decisions that require a global view, as it
|
||||
is in a centralized location and connected to everything. However, that
|
||||
connectivity also makes it easy to overload it. Try to use a manager
|
||||
sparingly and only for tasks that must be done in a centralized or
|
||||
authoritative location. Optionally, for some deployments, the manager can
|
||||
also serve as the sole logger.
|
||||
|
||||
* **Loggers**: Loggers should simply write logs to disk. In the default cluster
|
||||
configuration, log content gets distributed among available loggers in a
|
||||
round-robin fashion, providing failover capability should any given logger
|
||||
temporarily go offline.
|
||||
|
||||
The Need to Move Data and Events Across Different Nodes
|
||||
-------------------------------------------------------
|
||||
|
||||
Imagine you have a list of IP addresses that you want to distribute across all
|
||||
workers to keep in a watch list, such as the Intel framework. You may also want
|
||||
to aggregate results across workers to see if that count crosses a threshold,
|
||||
such as using scan detection. Finally, you might want to extract URLs from
|
||||
emails and then redistribute the extracted URLs to all workers to be able to
|
||||
find which of these extracted URLs got clicked on. All these examples tend to
|
||||
introduce challenges in a Zeek cluster setup due to data centrality issues. In
|
||||
other words, the very advantageous divide-and-conquer approach of
|
||||
clusterization also introduces complexity in Zeek scripts. However, with the
|
||||
introduction of the Broker communication framework and additional helper
|
||||
functions, data centrality complexities can be addressed efficiently. One must
|
||||
rely on clusterization techniques provided by Zeek scripting, the Broker API,
|
||||
and clusterization components.
|
||||
|
||||
When clustering your scripts, the fundamental work to move data or events in
|
||||
the context of a cluster falls primarily on a few high-level abstractions of
|
||||
communication patterns:
|
||||
|
||||
1. Manager-to-worker
|
||||
2. Worker-to-manager
|
||||
3. Worker-to-proxy
|
||||
4. Worker-to-manager-to-worker
|
||||
5. Manager-to-worker-to-manager
|
||||
|
||||
All the communication between workers, proxies and manager is established by
|
||||
Zeek via the Broker framework. The Broker framework provides basic facilities
|
||||
for connecting Zeek instances to each other and exchanging messages, events or
|
||||
data.
|
||||
|
||||
Cluster Topics
|
||||
--------------
|
||||
|
||||
All Broker-based messaging involves two components: the information you want to
|
||||
send, such as an event with its arguments, along with an associated topic name
|
||||
string. The topic strings are used as a filtering mechanism: Broker uses a
|
||||
publish-subscribe communication pattern where peers advertise interest in topic
|
||||
prefixes and only receive messages which match one of their prefix
|
||||
subscriptions. Broker itself supports arbitrary topic strings. However, Zeek
|
||||
generally follows certain conventions in choosing these topics to help avoid
|
||||
conflicts and generally make them easier to remember.
|
||||
|
||||
To communicate between workers, proxies and manager one needs to know the topic
|
||||
name to which all workers, proxies and manager are subscribed. These are:
|
||||
|
||||
1. :zeek:see:`Cluster::worker_topic` - to which all workers are subscribed
|
||||
2. :zeek:see:`Cluster::proxy_topic` - to which all proxies are subscribed
|
||||
3. :zeek:see:`Cluster::manager_topic` - to which manager is subscribed
|
||||
|
||||
|
||||
The following table illustrates all the topics and communication events for
|
||||
clusterization, along with potential use cases:
|
||||
|
||||
.. list-table::
|
||||
:header-rows: 1
|
||||
|
||||
* - Event
|
||||
- Topic
|
||||
- Use cases
|
||||
|
||||
* - Manager to worker
|
||||
- :zeek:see:`Cluster::worker_topic`
|
||||
- * Read input file on manager
|
||||
* Distribute data and events from manager to workers
|
||||
|
||||
* - Worker to manager
|
||||
- :zeek:see:`Cluster::manager_topic`
|
||||
- * Find characteristics of a “scan” eg. SYN-only pkts
|
||||
* Send data to manager for aggregation
|
||||
|
||||
* - Worker or manager to proxy
|
||||
- :zeek:see:`Cluster::proxy_topic`
|
||||
- * Run operation on all proxies
|
||||
* Disseminate notice suppression
|
||||
|
||||
* - Worker to manager to worker
|
||||
- :zeek:see:`Cluster::manager_topic` + :zeek:see:`Cluster::worker_topic`
|
||||
- * Find URLs in emails
|
||||
* Send to manager
|
||||
* Distribute to workers to check against HTTP GET requests
|
||||
|
||||
* - Manager to worker to manager
|
||||
- :zeek:see:`Cluster::worker_topic` + :zeek:see:`Cluster::manager_topic`
|
||||
- * Read input file on manager
|
||||
* Distribute data to workers
|
||||
* Workers to report counts of connections to manager
|
||||
* Aggregate the counts on manager
|
||||
|
||||
Cluster Pools
|
||||
-------------
|
||||
|
||||
In addition to topics, Zeek nodes can join a :zeek:see:`Cluster::Pool`.
|
||||
Using :zeek:see:`Cluster::publish_hrw` and :zeek:see:`Cluster::publish_rr`,
|
||||
pools allow publishing events to individual proxies without prior knowledge
|
||||
of a cluster's shape and size.
|
||||
|
||||
A popular pool is the :zeek:see:`Cluster::proxy_pool`. It comprises all
|
||||
the proxies of a cluster. Examples of its use are listed in the following table.
|
||||
|
||||
|
||||
.. list-table::
|
||||
:header-rows: 1
|
||||
|
||||
* - Event
|
||||
- Pool
|
||||
- Use cases
|
||||
|
||||
* - Workers to individual proxy processes
|
||||
- :zeek:see:`Cluster::proxy_pool`
|
||||
- * Aggregation based on Highest Random Weight (eg. DNS query types, see the :ref:`section below <cluster-framework-proxies-uniform>` for details.)
|
||||
* Aggregation of Software versions for a given host
|
||||
* Offloading tasks in round-robin fashion across proxies
|
||||
|
||||
|
||||
Publishing Events Across the Cluster
|
||||
------------------------------------
|
||||
|
||||
Broker, as well as Zeek’s higher-level cluster framework, provide a set of
|
||||
functions to publish events, including:
|
||||
|
||||
.. list-table::
|
||||
:header-rows: 1
|
||||
|
||||
* - Function
|
||||
- Description
|
||||
- Use
|
||||
|
||||
* - :zeek:see:`Cluster::publish`
|
||||
- Publishes an event at a given topic
|
||||
- Standard function to send an event to all nodes subscribed to a given
|
||||
topic.
|
||||
|
||||
* - :zeek:see:`Cluster::publish_hrw`
|
||||
- Publishes an event to a node within a pool according to
|
||||
Highest Random Weight (HRW) hashing strategy; see details below
|
||||
- Use this in cases of any aggregation needs - eg. scan detection or
|
||||
anything that needs a counter going.
|
||||
|
||||
* - :zeek:see:`Cluster::publish_rr`
|
||||
- Publishes an event to a node within a pool according to Round-Robin
|
||||
distribution strategy.
|
||||
- Generally used inside Zeek for multiple logger nodes.
|
||||
|
||||
* - :zeek:see:`Broker::publish`
|
||||
- Publishes an event at a given topic
|
||||
- Standard function to send an event to all nodes subscribed to a given
|
||||
topic.
|
||||
|
||||
Starting with Zeek 7.1, this function should only be used in
|
||||
Broker-specific scripts. Use :zeek:see:`Cluster::publish` otherwise.
|
||||
|
||||
|
||||
.. note::
|
||||
|
||||
The ``Cluster::publish`` function was added in Zeek 7.1. In contrast to
|
||||
``Broker::publish``, it publishes events even when a non-Broker cluster
|
||||
backend is in use. Going forward, ``Cluster::publish`` should be preferred
|
||||
over ``Broker::publish``, unless the script is specific to the Broker backend,
|
||||
e.g. when interacting with an external application using native Python
|
||||
bindings for Broker.
|
||||
|
||||
|
||||
An example sending an event from worker to manager:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event worker_to_manager(worker_name: string)
|
||||
{
|
||||
print "got event from worker", worker_name;
|
||||
}
|
||||
|
||||
event some_event_handled_on_worker()
|
||||
{
|
||||
Broker::publish(Cluster::manager_topic, worker_to_manager,
|
||||
Cluster::node);
|
||||
}
|
||||
|
||||
More details and code snippets and documentation on Broker communication
|
||||
frameworks are available at :ref:`broker-framework`.
|
||||
|
||||
|
||||
.. _cluster-framework-proxies-uniform:
|
||||
|
||||
Distributing Events Uniformly Across Proxies
|
||||
--------------------------------------------
|
||||
|
||||
If you want to offload some data/work from a worker to your proxies, we can
|
||||
make use of a `Highest Random Weight (HRW) hashing
|
||||
<https://en.wikipedia.org/wiki/Rendezvous_hashing>`_ distribution strategy to
|
||||
uniformly map an arbitrary key space across all available proxies through
|
||||
:zeek:see:`Cluster::publish_hrw`. This function publishes an event to one node
|
||||
within a pool according to a Highest Random Weight hashing strategy. By
|
||||
assigning :zeek:see:`Cluster::proxy_pool` to this event, one can utilize
|
||||
proxies to handle it. Note that :zeek:see:`Cluster::publish_hrw` requires a
|
||||
unique key as an input to the hashing function to uniformly distribute keys
|
||||
among available nodes. Often this key is a source or destination IP address. If
|
||||
you are using :zeek:see:`Cluster::publish_hrw` for an aggregate function, such
|
||||
as counts unique across the workers, make sure to appropriately select the
|
||||
hashing key.
|
||||
|
||||
The following example illustrates this issue. Assume that we are counting the
|
||||
number of scanner IPs from each ``/24`` subnet. If the key were the source IP,
|
||||
then depending on the hashing, different IP addresses from the same ``/24``
|
||||
might end up on different proxies for the aggregation function. In this case
|
||||
one might instead want to use a more inclusive hashing key, such as the subnet
|
||||
(``/24``) itself. To illustrate the issue, in the notice log below, you see
|
||||
that 3 scanners each from ``52.100.165.0/24`` went to ``proxy-1`` and
|
||||
``proxy-2``. Ideally we want a single count of 6 scanners instead.
|
||||
|
||||
::
|
||||
|
||||
1600212249.061779 Scan::Subnet 52.100.165.0/24 has 3 spf IPs originating from it 52.100.165.249 52.100.165.237 52.100.165.246 - 52.100.165.246 - - proxy-2 Notice::ACTION_LOG 3600.000000 F
|
||||
|
||||
1600212293.581745 Scan::Subnet 52.100.165.0/24 has 3 spf IPs originating from it 52.100.165.247 52.100.165.244 52.100.165.205 - 52.100.165.205 - - proxy-1 Notice::ACTION_LOG 3600.000000
|
||||
|
||||
Instead, we can ensure the hash key is ``52.100.165.0/24`` instead of the
|
||||
original IP, as the hash for ``52.100.165.0/24`` will be the same for all
|
||||
addresses belonging to this subnet. Then the data will reach only one proxy.
|
||||
To that end, we can use the ``mask_address`` function to extract subnet
|
||||
information for a given IP address to use as a key in the hash function:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
local spf = mask_address(orig);
|
||||
|
||||
@if ( Cluster::is_enabled())
|
||||
Cluster::publish_hrw(Cluster::proxy_pool, spf, smtpsink::aggregate_stats, c) ;
|
||||
@else
|
||||
event smtpsink::aggregate_stats(c);
|
||||
@endif
|
||||
|
||||
Carefully select the key for :zeek:see:`Cluster::publish_hrw`. If done right,
|
||||
this feature will bring tremendous benefits in code scalability, especially
|
||||
when working with aggregate and threshold functions.
|
||||
|
||||
.. note::
|
||||
|
||||
In scripting for clusterization, using the correct module names and
|
||||
namespaces is crucial as both events and data are transmitted to different
|
||||
systems. In order to make sure the contexts are correct, all functions,
|
||||
events and datasets should be scoped within their respective namespaces and
|
||||
modules. An easy rule of thumb is to always use the explicit module namespace
|
||||
scoping. See :ref:`event-namespacing-pitfall` for further explanation and
|
||||
examples.
|
||||
|
||||
Clusterization of Zeek scripts can be an intimidating task for beginners.
|
||||
However, with reliance on the new Broker framework, clusterization has become
|
||||
simpler and straightforward. Consider the following:
|
||||
|
||||
1. Communication overhead: Be sure not to generate unnecessary communication
|
||||
overhead. For example, scan detection is one of the worst cases for
|
||||
distributed analysis. One needs to count connections from a given IP address
|
||||
across all workers and then aggregate them on a proxy or manager. All the
|
||||
connections have to reach an aggregate function before Zeek can determine if
|
||||
a given source is a scanner or not. This happens because each worker only
|
||||
has a limited picture of the activity generated by a given remote IP.
|
||||
|
||||
2. Communication optimizations: Once a given remote IP is identified as
|
||||
desired, make sure a manager reports that to the worker, and workers stop
|
||||
sending any further data for that IP to the manager. This is especially
|
||||
useful in scan detection where it takes only a few connections to identify
|
||||
scans, while a given scanner might send millions of probes eventually. If
|
||||
done right, workers will only send the first N connections, and stop after
|
||||
that, thus saving a lot of communication overhead. However, it makes sense
|
||||
to stop workers from sending any further connection information.
|
||||
|
||||
3. Clusterization also requires timely state synchronization across the
|
||||
workers, to make sure that all workers have a common view of a particular
|
||||
heuristic.
|
||||
|
||||
4. When writing scripts for clusterization make sure your detection runs in
|
||||
both cluster and standalone setup.
|
||||
|
||||
A Cluster Script Walkthrough
|
||||
----------------------------
|
||||
|
||||
Let's say we want to count how many connections a remote IP is making to a host
|
||||
in our network on port 3389 UDP. Due to the distributed nature of Zeek
|
||||
clusters, connections are distributed across the workers based on a 5-tuple
|
||||
hash (source IP, source port, destination IP, destination port, and protocol).
|
||||
To get a central view of a connection between a given IP pair, one must deploy
|
||||
a clusterized scripting approach. The following example highlights how to go
|
||||
about doing so.
|
||||
|
||||
In this use case, we intend to create an aggregation function.
|
||||
:zeek:see:`Cluster::publish_hrw` appears to be the appropriate function, since
|
||||
it allows offloading a lot of work to proxies, thus leaving workers and manager
|
||||
to process traffic.
|
||||
|
||||
In order to make sure all the connections between two hosts go to a single
|
||||
specific proxy, we need to make sure the key for the hashing function
|
||||
accommodates this constraint. We will use ``orig_h+resp_h`` as the key. We
|
||||
create a new data-type called ``pair`` as seen in code below. This allows us
|
||||
to use the ``orig+resp`` as a unique key across the code, including in the
|
||||
candidate table. Further, we create a new data type called ``stats`` to keep
|
||||
track of additional data associated with a connection pair.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module DoS;
|
||||
|
||||
export {
|
||||
|
||||
redef enum Notice::Type += {
|
||||
Threshold,
|
||||
Victim_3389UDP,
|
||||
};
|
||||
|
||||
type pair: record {
|
||||
orig: addr;
|
||||
resp: addr;
|
||||
};
|
||||
|
||||
type stats: record {
|
||||
orig: addr;
|
||||
resp: addr ;
|
||||
orig_bytes: count &default=0;
|
||||
resp_bytes: count &default=0;
|
||||
conns: count &default=0;
|
||||
};
|
||||
|
||||
global dos_candidates: table [pair] of stats &create_expire=1 day;
|
||||
|
||||
    global DoS::aggregate_stats: event(s: stats);
|
||||
}
|
||||
|
||||
We choose the :zeek:see:`connection_state_remove` event as the primary event to
|
||||
tap into. :zeek:see:`connection_state_remove` is generated when a connection’s
|
||||
internal state is about to be removed from memory. It's appropriate for this
|
||||
case, as all the information about the connection is now included in the
|
||||
:zeek:see:`connection` record ``c``. One disadvantage of using
|
||||
:zeek:see:`connection_state_remove` is that the event is fired at the very end
|
||||
of the connection, after the expiration timeouts are over. Thus, there are
|
||||
delays, and any operation which happens on the data is “after-the-fact” that
|
||||
connection is over. While this could be a problem in approaches such as
|
||||
proactive blocking and early detection heuristics, in this case of aggregation
|
||||
it is not an issue.
|
||||
|
||||
The thing to pay attention to in the code snippet below is the
|
||||
:zeek:see:`@if`-:zeek:see:`@else`-:zeek:see:`@endif` directives which
|
||||
differentiate between clusterized and standalone operation of the script. With
|
||||
the :zeek:see:`@if` construct, the specified expression must evaluate to type
|
||||
bool. If the value is true, then the following script lines (up to the next
|
||||
:zeek:see:`@else` or :zeek:see:`@endif`) are available to be executed. In this
|
||||
case we check if :zeek:see:`Cluster::is_enabled`. If so, we call
|
||||
:zeek:see:`Cluster::publish_hrw` along with the key (``hash_pair``) and the
|
||||
aggregate function followed by parameters, which is the stats record in this
|
||||
case. If the cluster isn’t running, that aggregate function is directly
|
||||
called.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event connection_state_remove(c: connection)
|
||||
{
|
||||
local service = c$id$resp_p;
|
||||
local resp = c$id$resp_h;
|
||||
|
||||
if ( service != 3389/udp )
|
||||
return;
|
||||
|
||||
if ( resp !in Site::local_nets )
|
||||
return;
|
||||
|
||||
local s: stats;
|
||||
s$orig = c$id$orig_h;
|
||||
s$resp = c$id$resp_h;
|
||||
s$orig_bytes = c$conn$orig_ip_bytes;
|
||||
s$resp_bytes = c$conn$resp_ip_bytes;
|
||||
|
||||
local hash_pair: pair;
|
||||
hash_pair$orig = c$id$orig_h;
|
||||
hash_pair$resp = resp;
|
||||
|
||||
@if ( Cluster::is_enabled() )
|
||||
Cluster::publish_hrw(Cluster::proxy_pool, hash_pair, DoS::aggregate_stats, s);
|
||||
@else
|
||||
event DoS::aggregate_stats(s);
|
||||
@endif
|
||||
}
|
||||
|
||||
Since ``hash_pair`` makes the key unique, irrespective of what worker this
|
||||
specific connection has gone to, it will end up on one specific proxy only.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
event DoS::aggregate_stats(s: stats)
|
||||
{
|
||||
local p: pair ;
|
||||
p$orig = s$orig;
|
||||
p$resp = s$resp ;
|
||||
|
||||
if ( p !in dos_candidates )
|
||||
{
|
||||
local tmp_s: stats;
|
||||
tmp_s$orig = s$orig;
|
||||
tmp_s$resp = s$resp;
|
||||
tmp_s$orig_bytes = 0;
|
||||
            tmp_s$resp_bytes = 0;
|
||||
tmp_s$conns = 0;
|
||||
|
||||
dos_candidates[p] = tmp_s;
|
||||
}
|
||||
|
||||
dos_candidates[p]$conns += 1;
|
||||
dos_candidates[p]$orig_bytes += s$orig_bytes;
|
||||
dos_candidates[p]$resp_bytes += s$resp_bytes;
|
||||
|
||||
local n = dos_candidates[p]$conns;
|
||||
|
||||
local thresh = check_ip_threshold(dos_threshold, ip_pair_threshold_idx, p, n);
|
||||
|
||||
if ( thresh )
|
||||
{
|
||||
local msg = fmt("%s pair has reached %s threshold %s",
|
||||
p, n, dos_candidates[p]);
|
||||
NOTICE([$note=DoS::Threshold, $src=p$orig, $msg=msg]);
|
||||
|
||||
if ( dos_candidates[p]$resp_bytes > 0 )
|
||||
            NOTICE([$note=DoS::Victim_3389UDP, $src=p$orig, $msg=msg,
|
||||
$identifier=cat(p$resp), $suppress_for=1 hrs]);
|
||||
}
|
||||
}
|
356
doc/frameworks/configuration.rst
Normal file
356
doc/frameworks/configuration.rst
Normal file
|
@ -0,0 +1,356 @@
|
|||
|
||||
.. _framework-configuration:
|
||||
|
||||
=======================
|
||||
Configuration Framework
|
||||
=======================
|
||||
|
||||
Zeek includes a configuration framework that allows updating script options at
|
||||
runtime. This functionality consists of an :zeek:see:`option` declaration in
|
||||
the Zeek language, configuration files that enable changing the value of
|
||||
options at runtime, option-change callbacks to process updates in your Zeek
|
||||
scripts, a couple of script-level functions to manage config settings directly,
|
||||
and a log file (:file:`config.log`) that contains information about every
|
||||
option value change according to :zeek:see:`Config::Info`.
|
||||
|
||||
Introduction
|
||||
============
|
||||
|
||||
The configuration framework provides an alternative to using Zeek script
|
||||
constants to store various Zeek settings.
|
||||
|
||||
While traditional constants work well when a value is not expected to change at
|
||||
runtime, they cannot be used for values that need to be modified occasionally.
|
||||
While a :zeek:see:`redef` allows a re-definition of an already defined constant
|
||||
in Zeek, these redefinitions can only be performed when Zeek first starts.
|
||||
Afterwards, constants can no longer be modified.
|
||||
|
||||
However, it is clearly desirable to be able to change at runtime many of the
|
||||
configuration options that Zeek offers. Restarting Zeek can be time-consuming
|
||||
and causes it to lose all connection state and knowledge that it accumulated.
|
||||
Zeek’s configuration framework solves this problem.
|
||||
|
||||
Declaring Options
|
||||
=================
|
||||
|
||||
The :zeek:see:`option` keyword allows variables to be declared as configuration
|
||||
options:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module Test;
|
||||
|
||||
export {
|
||||
option my_networks: set[subnet] = {};
|
||||
option enable_feature = F;
|
||||
option hostname = "testsystem";
|
||||
option timeout_after = 1min;
|
||||
option my_ports: vector of port = {};
|
||||
}
|
||||
|
||||
Options combine aspects of global variables and constants. Like global
|
||||
variables, options cannot be declared inside a function, hook, or event
|
||||
handler. Like constants, options must be initialized when declared (the type
|
||||
can often be inferred from the initializer but may need to be specified when
|
||||
ambiguous). The value of an option can change at runtime, but options cannot be
|
||||
assigned a new value using normal assignments.
|
||||
|
||||
The initial value of an option can be redefined with a :zeek:see:`redef`
|
||||
declaration just like for global variables and constants. However, there is no
|
||||
need to specify the :zeek:see:`&redef` attribute in the declaration of an
|
||||
option. For example, given the above option declarations, here are possible
|
||||
redefs that work anyway:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
redef Test::enable_feature = T;
|
||||
redef Test::my_networks += { 10.1.0.0/16, 10.2.0.0/16 };
|
||||
|
||||
Changing Options
|
||||
================
|
||||
|
||||
The configuration framework facilitates reading in new option values from
|
||||
external files at runtime. Configuration files contain a mapping between option
|
||||
names and their values. Each line contains one option assignment, formatted as
|
||||
follows::
|
||||
|
||||
[option name][tab/spaces][new value]
|
||||
|
||||
Lines starting with ``#`` are comments and ignored.
|
||||
|
||||
You register configuration files by adding them to
|
||||
:zeek:see:`Config::config_files`, a set of filenames. Simply say something like
|
||||
the following in :file:`local.zeek`:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
redef Config::config_files += { "/path/to/config.dat" };
|
||||
|
||||
Zeek will then monitor the specified file continuously for changes. For
|
||||
example, editing a line containing::
|
||||
|
||||
Test::enable_feature T
|
||||
|
||||
to the config file while Zeek is running will cause it to automatically update
|
||||
the option’s value in the scripting layer. The next time your code accesses the
|
||||
option, it will see the new value.
|
||||
|
||||
.. note::
|
||||
|
||||
The config framework is clusterized. In a cluster configuration, only the
|
||||
manager node watches the specified configuration files, and relays option
|
||||
updates across the cluster.
|
||||
|
||||
Config File Formatting
|
||||
----------------------
|
||||
|
||||
The formatting of config option values in the config file is not the same as in
|
||||
Zeek’s scripting language. Keep an eye on the :file:`reporter.log` for warnings
|
||||
from the config reader in case of incorrectly formatted values, which it’ll
|
||||
generally ignore when encountered. The following table summarizes supported
|
||||
types and their value representations:
|
||||
|
||||
.. list-table::
|
||||
:header-rows: 1
|
||||
|
||||
* - Data Type
|
||||
- Sample Config File Entry
|
||||
- Comments
|
||||
|
||||
* - :zeek:see:`addr`
|
||||
- ``1.2.3.4``
|
||||
- Plain IPv4 or IPv6 address, as in Zeek. No ``/32`` or similar netmasks.
|
||||
|
||||
* - :zeek:see:`bool`
|
||||
- ``T``
|
||||
- ``T`` or ``1`` for true, ``F`` or ``0`` for false
|
||||
|
||||
* - :zeek:see:`count`
|
||||
- ``42``
|
||||
- Plain, nonnegative integer.
|
||||
|
||||
* - :zeek:see:`double`
|
||||
- ``-42.5``
|
||||
- Plain double number.
|
||||
|
||||
* - :zeek:see:`enum`
|
||||
- ``Enum::FOO_A``
|
||||
- Plain enum string.
|
||||
|
||||
* - :zeek:see:`int`
|
||||
- ``-1``
|
||||
- Plain integer.
|
||||
|
||||
* - :zeek:see:`interval`
|
||||
- ``3600.0``
|
||||
- Always in epoch seconds, with optional fraction of seconds. Never
|
||||
includes a time unit.
|
||||
|
||||
* - :zeek:see:`pattern`
|
||||
- ``/(foo|bar)/``
|
||||
- The regex pattern, within forward-slash characters.
|
||||
|
||||
* - :zeek:see:`port`
|
||||
- ``42/tcp``
|
||||
- Port number with protocol, as in Zeek. When the protocol part is missing,
|
||||
Zeek interprets it as ``/unknown``.
|
||||
|
||||
* - :zeek:see:`set`
|
||||
- ``80/tcp,53/udp``
|
||||
- The set members, formatted as per their own type, separated by commas.
|
||||
For an empty set, use an empty string: just follow the option name with
|
||||
whitespace.
|
||||
|
||||
Sets with multiple index types (e.g. ``set[addr,string]``) are currently
|
||||
not supported in config files.
|
||||
|
||||
* - :zeek:see:`string`
|
||||
- ``Don’t bite, Zeek``
|
||||
- Plain string, no quotation marks. Given quotation marks become part of
|
||||
the string. Everything after the whitespace separator delineating the
|
||||
      option name becomes the string. Spaces and special characters are fine.
|
||||
Backslash characters (e.g. ``\n``) have no special meaning.
|
||||
|
||||
* - :zeek:see:`subnet`
|
||||
- ``1.2.3.4/16``
|
||||
- Plain subnet, as in Zeek.
|
||||
|
||||
* - :zeek:see:`time`
|
||||
- ``1608164505.5``
|
||||
- Always in epoch seconds, with optional fraction of seconds. Never
|
||||
includes a time unit.
|
||||
|
||||
* - :zeek:see:`vector`
|
||||
- ``1,2,3,4``
|
||||
- The set members, formatted as per their own type, separated by commas.
|
||||
For an empty vector, use an empty string: just follow the option name
|
||||
with whitespace.
|
||||
|
||||
This leaves a few data types unsupported, notably tables and records. If you
|
||||
require these, build up an instance of the corresponding type manually (perhaps
|
||||
from a separate input framework file) and then call
|
||||
:zeek:see:`Config::set_value` to update the option:
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module Test;
|
||||
|
||||
export {
|
||||
option host_port: table[addr] of port = {};
|
||||
}
|
||||
|
||||
event zeek_init() {
|
||||
local t: table[addr] of port = { [10.0.0.2] = 123/tcp };
|
||||
Config::set_value("Test::host_port", t);
|
||||
}
|
||||
|
||||
|
||||
Regardless of whether an option change is triggered by a config file or via
|
||||
explicit :zeek:see:`Config::set_value` calls, Zeek always logs the change to
|
||||
:file:`config.log`. A sample entry::
|
||||
|
||||
#fields ts id old_value new_value location
|
||||
#types time string string string string
|
||||
1608167352.498872 Test::a_count 42 3 config.txt
|
||||
|
||||
Mentioning options repeatedly in the config files leads to multiple update
|
||||
events; the last entry “wins”. Mentioning options that do not correspond to
|
||||
existing options in the script layer is safe, but triggers warnings in
|
||||
:file:`reporter.log`::
|
||||
|
||||
warning: config.txt/Input::READER_CONFIG: Option 'an_unknown' does not exist. Ignoring line.
|
||||
|
||||
Internally, the framework uses the Zeek input framework to learn about config
|
||||
changes. If you inspect the configuration framework scripts, you will notice
|
||||
that the scripts simply catch input framework events and call
|
||||
:zeek:see:`Config::set_value` to set the relevant option to the new value. If
|
||||
you want to change an option in your scripts at runtime, you can likewise call
|
||||
:zeek:see:`Config::set_value` directly from a script (in a cluster
|
||||
configuration, this only needs to happen on the manager, as the change will be
|
||||
automatically sent to all other nodes in the cluster).
|
||||
|
||||
.. note::
|
||||
|
||||
The input framework is usually very strict about the syntax of input files, but
|
||||
that is not the case for configuration files. These require no header lines,
|
||||
and both tabs and spaces are accepted as separators. A custom input reader,
|
||||
specifically for reading config files, facilitates this.
|
||||
|
||||
.. tip::
|
||||
|
||||
The gory details of option-parsing reside in ``Ascii::ParseValue()`` in
|
||||
:file:`src/threading/formatters/Ascii.cc` and ``Value::ValueToVal`` in
|
||||
:file:`src/threading/SerialTypes.cc` in the Zeek core.
|
||||
|
||||
Change Handlers
|
||||
===============
|
||||
|
||||
A change handler is a user-defined function that Zeek calls each time an option
|
||||
value changes. This allows you to react programmatically to option changes. The
|
||||
following example shows how to register a change handler for an option that has
|
||||
a data type of :zeek:see:`addr` (for other data types, the return type and
|
||||
second parameter data type must be adjusted accordingly):
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module Test;
|
||||
|
||||
export {
|
||||
option testaddr = 127.0.0.1;
|
||||
}
|
||||
|
||||
# Note: the data type of 2nd parameter and return type must match
|
||||
function change_addr(id: string, new_value: addr): addr
|
||||
{
|
||||
print fmt("Value of %s changed from %s to %s", id, testaddr, new_value);
|
||||
return new_value;
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
Option::set_change_handler("Test::testaddr", change_addr);
|
||||
}
|
||||
|
||||
Immediately before Zeek changes the specified option value, it invokes any
|
||||
registered change handlers. The value returned by the change handler is the
|
||||
value Zeek assigns to the option. This allows, for example, checking of values
|
||||
to reject invalid input (the original value can be returned to override the
|
||||
change).
|
||||
|
||||
.. note::
|
||||
|
||||
:zeek:see:`Option::set_change_handler` expects the name of the option to
|
||||
invoke the change handler for, not the option itself. Also, that name
|
||||
includes the module name, even when registering from within the module.
|
||||
|
||||
It is possible to define multiple change handlers for a single option. In this
|
||||
case, the change handlers are chained together: the value returned by the first
|
||||
change handler is the “new value” seen by the next change handler, and so on.
|
||||
The built-in function :zeek:see:`Option::set_change_handler` takes an optional
|
||||
third argument that can specify a priority for the handlers.
|
||||
|
||||
A change handler function can optionally have a third argument of type string.
|
||||
When a config file triggers a change, then the third argument is the pathname
|
||||
of the config file. When the :zeek:see:`Config::set_value` function triggers a
|
||||
change, then the third argument of the change handler is the value passed to
|
||||
the optional third argument of the :zeek:see:`Config::set_value` function.
|
||||
|
||||
.. tip::
|
||||
|
||||
Change handlers are also used internally by the configuration framework. If
|
||||
you look at the script-level source code of the config framework, you can see
|
||||
that change handlers log the option changes to :file:`config.log`.
|
||||
|
||||
When Change Handlers Trigger
|
||||
----------------------------
|
||||
|
||||
Change handlers often implement logic that manages additional internal state.
|
||||
For example, depending on a performance toggle option, you might initialize or
|
||||
clean up a caching structure. In such scenarios you need to know exactly when
|
||||
and whether a handler gets invoked. The following hold:
|
||||
|
||||
* When no config files get registered in :zeek:see:`Config::config_files`,
|
||||
change handlers do not run.
|
||||
* When none of any registered config files exist on disk, change handlers do
|
||||
not run.
|
||||
|
||||
That is, change handlers are tied to config files, and don’t automatically run
|
||||
with the option’s default values.
|
||||
|
||||
* When a config file exists on disk at Zeek startup, change handlers run with
|
||||
the file’s config values.
|
||||
* When the config file contains the same value the option already defaults to,
|
||||
its change handlers are invoked anyway.
|
||||
* :zeek:see:`zeek_init` handlers run before any change handlers — i.e., they
|
||||
run with the options’ default values.
|
||||
* Since the config framework relies on the input framework, the input
|
||||
framework’s inherent asynchrony applies: you can’t assume when exactly an
|
||||
option change manifests in the code.
|
||||
|
||||
If your change handler needs to run consistently at startup and when options
|
||||
change, you can call the handler manually from :zeek:see:`zeek_init` when you
|
||||
register it. That way, initialization code always runs for the option’s default
|
||||
value, and also for any new values.
|
||||
|
||||
.. code-block:: zeek
|
||||
|
||||
module Test;
|
||||
|
||||
export {
|
||||
option use_cache = T;
|
||||
}
|
||||
|
||||
function use_cache_hdlr(id: string, new_value: bool): bool
|
||||
{
|
||||
if ( new_value ) {
|
||||
# Ensure caching structures are set up properly
|
||||
}
|
||||
|
||||
return new_value;
|
||||
}
|
||||
|
||||
event zeek_init()
|
||||
{
|
||||
use_cache_hdlr("Test::use_cache", use_cache);
|
||||
Option::set_change_handler("Test::use_cache", use_cache_hdlr);
|
||||
}
|
3
doc/frameworks/denylist.jsonl
Normal file
3
doc/frameworks/denylist.jsonl
Normal file
|
@ -0,0 +1,3 @@
|
|||
{"ip": "192.168.17.1", "timestamp": 1333252748, "reason": "Malware host"}
|
||||
{"ip": "192.168.27.2", "timestamp": 1330235733, "reason": "Botnet server"}
|
||||
{"ip": "192.168.250.3", "timestamp": 1333145108, "reason": "Virus detected"}
|
Some files were not shown because too many files have changed in this diff Show more
Loading…
Add table
Add a link
Reference in a new issue