
diff --git a/config.yml b/config.yml
index 8c51e6e..bfe2a00 100644
--- a/config.yml
+++ b/config.yml
@@ -1,125 +1,126 @@
# number of attempted resummation phase space points for each input event
trials: 10
# maximum soft transverse momentum fraction in extremal jets
max ext soft pt fraction: 0.1
resummation jets: # resummation jet properties
min pt: 35 # minimum jet transverse momentum
algorithm: antikt # jet clustering algorithm
R: 0.4 # jet R parameter
fixed order jets: # properties of input jets
min pt: 30
# by default, algorithm and R are like for resummation jets
# treatment of the various event classes
# the supported settings are: reweight, keep, discard
# non-resummable events cannot be reweighted
event treatment:
FKL: reweight
unordered: keep
extremal qqx: keep
central qqx: keep
non-resummable: keep
# central scale choice or choices
#
# scales: [125, max jet pperp, H_T/2, 2*jet invariant mass, m_j1j2]
scales: 91.188
# factors by which the central scales should be multiplied
# renormalisation and factorisation scales are varied independently
#
# scale factors: [0.5, 0.7071, 1, 1.41421, 2]
# maximum ratio between renormalisation and factorisation scale
#
# max scale ratio: 2.0001
# import scale setting functions
#
# import scales:
# lib_my_scales.so: [scale0,scale1]
log correction: false # whether or not to include higher order logs
## unweighting setting
## remove to obtain weighted events
# unweight:
# # type of unweighting (one of 'weighted', 'resummation', 'partial')
# type: partial
# trials: 10000
# max deviation: 0
# event output files
#
# the supported formats are
# - Les Houches (suffix .lhe)
# - HepMC2 (suffix .hepmc)
# - HepMC3 (suffix .hepmc3 or .hepmc)
+# - HDF5 (suffix .hdf5)
# TODO: - ROOT ntuples (suffix .root)
#
# An output file's format is deduced either automatically from the suffix
# or from an explicit specification, e.g.
# - Les Houches: outfile
event output:
- HEJ.lhe
# - HEJ_events.hepmc
# to use a rivet analysis
#
# analysis:
# rivet: MC_XS # rivet analysis name
# output: HEJ # name of the yoda files, ".yoda" and scale suffix will be added
#
# to use a custom analysis
#
# analysis:
# plugin: /path/to/libmyanalysis.so
# my analysis parameter: some value
# selection of random number generator and seed
# the choices are
# - mixmax (seed is an integer)
# - ranlux64 (seed is a filename containing parameters)
random generator:
name: mixmax
# seed: 1
# Vacuum expectation value
vev: 246.2196508
# Properties of the weak gauge bosons
particle properties:
Higgs:
mass: 125
width: 0.004165
W:
mass: 80.385
width: 2.085
Z:
mass: 91.187
width: 2.495
# parameters for Higgs-gluon couplings
# this requires compilation with qcdloop
#
# Higgs coupling:
# use impact factors: false
# mt: 174
# include bottom: true
# mb: 4.7
## ---------------------------------------------------------------------- ##
## The following settings are only intended for advanced users. ##
## Please DO NOT SET them unless you know exactly what you are doing! ##
## ---------------------------------------------------------------------- ##
#
# minimum transverse momentum of extremal partons
# deprecated: use "max ext soft pt fraction" instead
# min extparton pt: 30
#
# max events: -1 # Maximal number of fixed order Events to process
# regulator parameter: 0.2 # The regulator lambda for the subtraction terms
diff --git a/doc/developer_manual/developer_manual.tex b/doc/developer_manual/developer_manual.tex
index b7845bb..942c2ec 100644
--- a/doc/developer_manual/developer_manual.tex
+++ b/doc/developer_manual/developer_manual.tex
@@ -1,1742 +1,1745 @@
\documentclass[a4paper,11pt]{article}
\usepackage{fourier}
\usepackage[T1]{fontenc}
\usepackage{microtype}
\usepackage{geometry}
\usepackage{enumitem}
\setlist[description]{leftmargin=\parindent,labelindent=\parindent}
\usepackage{amsmath}
\usepackage{amssymb}
\usepackage[utf8x]{inputenc}
\usepackage{graphicx}
\usepackage{xcolor}
\usepackage{todonotes}
\usepackage{listings}
\usepackage{xspace}
\usepackage{tikz}
\usepackage{slashed}
\usepackage{subcaption}
\usetikzlibrary{arrows.meta}
\usetikzlibrary{shapes}
\usetikzlibrary{calc}
\usepackage[colorlinks,linkcolor={blue!50!black}]{hyperref}
\graphicspath{{build/figures/}{figures/}}
\usepackage[left]{showlabels}
\renewcommand{\showlabelfont}{\footnotesize\color{darkgreen}}
\emergencystretch \hsize
\newcommand{\HEJ}{{\tt HEJ}\xspace}
\newcommand{\HIGHEJ}{\emph{High Energy Jets}\xspace}
\newcommand{\cmake}{\href{https://cmake.org/}{cmake}\xspace}
\newcommand{\html}{\href{https://www.w3.org/html/}{html}\xspace}
\newcommand{\YAML}{\href{http://yaml.org/}{YAML}\xspace}
\newcommand{\QCDloop}{\href{https://github.com/scarrazza/qcdloop}{QCDloop}\xspace}
\newcommand\matel[4][]{\mathinner{\langle#2\vert#3\vert#4\rangle}_{#1}}
\newcommand{\as}{\alpha_s}
\DeclareRobustCommand{\mathgraphics}[1]{\vcenter{\hbox{\includegraphics{#1}}}}
\def\spa#1.#2{\left\langle#1\,#2\right\rangle}
\def\spb#1.#2{\left[#1\,#2\right]} \def\spaa#1.#2.#3{\langle\mskip-1mu{#1} |
#2 | {#3}\mskip-1mu\rangle} \def\spbb#1.#2.#3{[\mskip-1mu{#1} | #2 |
{#3}\mskip-1mu]} \def\spab#1.#2.#3{\langle\mskip-1mu{#1} | #2 |
{#3}\mskip-1mu\rangle} \def\spba#1.#2.#3{\langle\mskip-1mu{#1}^+ | #2 |
{#3}^+\mskip-1mu\rangle} \def\spav#1.#2.#3{\|\mskip-1mu{#1} | #2 |
{#3}\mskip-1mu\|^2} \def\jc#1.#2.#3{j^{#1}_{#2#3}}
% expectation value
\newcommand{\ev}[1]{\text{E}\left[#1\right]}
\definecolor{darkgreen}{rgb}{0,0.4,0}
\lstset{ %
backgroundcolor=\color{lightgray}, % choose the background color; you must add \usepackage{color} or \usepackage{xcolor}
basicstyle=\footnotesize\usefont{T1}{DejaVuSansMono-TLF}{m}{n}, % the size of the fonts that are used for the code
breakatwhitespace=false, % sets if automatic breaks should only happen at whitespace
breaklines=false, % sets automatic line breaking
captionpos=t, % sets the caption-position to bottom
commentstyle=\color{red}, % comment style
deletekeywords={...}, % if you want to delete keywords from the given language
escapeinside={\%*}{*)}, % if you want to add LaTeX within your code
extendedchars=true, % lets you use non-ASCII characters; for 8-bits encodings only, does not work with UTF-8
frame=false, % adds a frame around the code
keepspaces=true, % keeps spaces in text, useful for keeping indentation of code (possibly needs columns=flexible)
keywordstyle=\color{blue}, % keyword style
otherkeywords={}, % if you want to add more keywords to the set
numbers=none, % where to put the line-numbers; possible values are (none, left, right)
numbersep=5pt, % how far the line-numbers are from the code
rulecolor=\color{black}, % if not set, the frame-color may be changed on line-breaks within not-black text (e.g. comments (green here))
showspaces=false, % show spaces everywhere adding particular underscores; it overrides 'showstringspaces'
showstringspaces=false, % underline spaces within strings only
showtabs=false, % show tabs within strings adding particular underscores
stepnumber=2, % the step between two line-numbers. If it's 1, each line will be numbered
stringstyle=\color{gray}, % string literal style
tabsize=2, % sets default tabsize to 2 spaces
title=\lstname,
emph={},
emphstyle=\color{darkgreen}
}
\begin{document}
\tikzstyle{mynode}=[rectangle split,rectangle split parts=2, draw,rectangle split part fill={lightgray, none}]
\title{HEJ 2 developer manual}
\author{}
\maketitle
\tableofcontents
\newpage
\section{Overview}
\label{sec:overview}
HEJ 2 is a C++ program and library implementing an algorithm to
apply \HIGHEJ resummation~\cite{Andersen:2008ue,Andersen:2008gc} to
pre-generated fixed-order events. This document is intended to give an
overview over the concepts and structure of this implementation.
\subsection{Project structure}
\label{sec:project}
HEJ 2 is developed under the \href{https://git-scm.com/}{git}
version control system. The main repository is on the IPPP
\href{https://gitlab.com/}{gitlab} server under
\url{https://gitlab.dur.scotgrid.ac.uk/hej/hej}. To get a local
copy, get an account on the gitlab server and use
\begin{lstlisting}[language=sh,caption={}]
git clone git@gitlab.dur.scotgrid.ac.uk:hej/hej.git
\end{lstlisting}
This should create a directory \texttt{hej} with the following
contents:
\begin{description}
\item[doc:] Contains additional documentation, see section~\ref{sec:doc}.
\item[include:] Contains the C++ header files.
\item[src:] Contains the C++ source files.
\item[t:] Contains the source code for the automated tests.
\item[CMakeLists.txt:] Configuration file for the \cmake build
system. See section~\ref{sec:cmake}.
\item[cmake:] Auxiliary files for \cmake. This includes modules for
finding installed software in \texttt{cmake/Modules} and templates for
code generation during the build process in \texttt{cmake/Templates}.
\item[config.yml:] Sample configuration file for running HEJ 2.
\item[FixedOrderGen:] Contains the code for the fixed-order generator,
see section~\ref{sec:HEJFOG}.
\end{description}
In the following all paths are given relative to the
\texttt{hej} directory.
\subsection{Documentation}
\label{sec:doc}
The \texttt{doc} directory contains user documentation in
\texttt{doc/sphinx} and the configuration to generate source code
documentation in \texttt{doc/doxygen}.
The user documentation explains how to install and run HEJ 2. The
format is
\href{http://docutils.sourceforge.net/rst.html}{reStructuredText}, which
is mostly human-readable. Other formats, like \html, can be generated with the
\href{http://www.sphinx-doc.org/en/master/}{sphinx} generator with
\begin{lstlisting}[language=sh,caption={}]
make html
\end{lstlisting}
To document the source code we use
\href{https://www.stack.nl/~dimitri/doxygen/}{doxygen}. To generate
\html documentation, use the command
\begin{lstlisting}[language=sh,caption={}]
doxygen Doxyfile
\end{lstlisting}
in the \texttt{doc/doxygen} directory.
\subsection{Build system}
\label{sec:cmake}
For the most part, HEJ 2 is a library providing classes and
functions that can be used to add resummation to fixed-order events. In
addition, there is a relatively small executable program leveraging this
library to read in events from an input file and produce resummation
events. Both the library and the program are built and installed with
the help of \cmake.
Debug information can be turned on by using
\begin{lstlisting}[language=sh,caption={}]
cmake base/directory -DCMAKE_BUILD_TYPE=Debug
make install
\end{lstlisting}
This facilitates the use of debuggers like \href{https://www.gnu.org/software/gdb/}{gdb}.
The main \cmake configuration file is \texttt{CMakeLists.txt}. It defines the
compiler flags, software prerequisites, header and source files used to
build HEJ 2, and the automated tests.
\texttt{cmake/Modules} contains module files that help with the
detection of the software prerequisites and \texttt{cmake/Templates}
template files for the automatic generation of header and
source files. For example, this allows us to keep the version
information in a single central location (\texttt{CMakeLists.txt}) and to
automatically generate a header file from the template \texttt{Version.hh.in} that propagates it to the C++ code.
\subsection{General coding guidelines}
\label{sec:notes}
The goal is to make the HEJ 2 code well-structured and
readable. Here are a number of guidelines to this end.
\begin{description}
\item[Observe the boy scout rule.] Always leave the code cleaner
than how you found it. Ugly hacks can be useful for testing, but
shouldn't make their way into the main branch.
\item[Ask if something is unclear.] Often there is a good reason why
code is written the way it is. Sometimes that reason is only obvious to
the original author (use \lstinline!git blame! to find them), in which
case they should be poked to add a comment. Sometimes there is no good
reason, but nobody has had the time to come up with something better,
yet. In some places the code might just be bad.
\item[Don't break tests.] There are a number of tests in the \texttt{t}
directory, which can be run with \lstinline!make test!. Ideally, all
tests should run successfully in each git revision. If your latest
commit broke a test and you haven't pushed to the central repository
yet, you can fix it with \lstinline!git commit --amend!. If an earlier
local commit broke a test, you can use \lstinline!git rebase -i! if
you feel confident. Additionally, each \lstinline!git push! is
automatically tested via the GitLab CI (see appendix~\ref{sec:CI}).
\item[Test your new code.] When you add some new functionality, also add an
automated test. This can be useful even if you don't know the
``correct'' result because it prevents the code from changing its behaviour
silently in the future. \href{http://www.valgrind.org/}{valgrind} is a
very useful tool to detect potential memory leaks. The code coverage of all
tests can be generated with \href{https://gcovr.com/en/stable/}{gcovr};
to do so, add the flag \lstinline!-DTEST_COVERAGE=True! to cmake and run
\lstinline!make ctest_coverage!.
\item[Stick to the coding style.] It is somewhat easier to read code
that has a uniform coding and indentation style. We don't have a
strict style, but it helps if your code looks similar to what is
already there.
\end{description}
\section{Program flow}
\label{sec:flow}
A run of the HEJ 2 program has three stages: initialisation,
event processing, and cleanup. The following sections outline these
stages and their relations to the various classes and functions in the
code. Unless denoted otherwise, all classes and functions are part of
the \lstinline!HEJ! namespace. The code for the HEJ 2 program is
in \texttt{src/bin/HEJ.cc}, all other code comprises the HEJ 2
library. Classes and free functions are usually implemented in header
and source files with a corresponding name, i.e. the code for
\lstinline!MyClass! can usually be found in
\texttt{include/HEJ/MyClass.hh} and \texttt{src/MyClass.cc}.
\subsection{Initialisation}
\label{sec:init}
The first step is to load and parse the \YAML configuration file. The
entry point for this is the \lstinline!load_config! function and the
related code can be found in \texttt{include/HEJ/YAMLreader.hh},
\texttt{include/HEJ/config.hh} and the corresponding \texttt{.cc} files
in the \texttt{src} directory. The implementation is based on the
\href{https://github.com/jbeder/yaml-cpp}{yaml-cpp} library.
The \lstinline!load_config! function returns a \lstinline!Config! object
containing all settings. To detect potential mistakes as early as
possible, we throw an exception whenever one of the following errors
occurs:
\begin{itemize}
\item There is an unknown option in the \YAML file.
\item A setting is invalid, for example a string is given where a number
would be expected.
\item An option value is not set.
\end{itemize}
The third rule is sometimes relaxed for ``advanced'' settings with an
obvious default, like for importing custom scales or analyses.
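As an illustration of this fail-early philosophy, the following stand-alone sketch reads a single setting with yaml-cpp and aborts with a clear message if it is missing or malformed; the checks performed by \lstinline!load_config! are far more extensive, and the code shown here is not part of \HEJ.
\begin{lstlisting}[language=C++,caption={}]
#include <cstdlib>
#include <iostream>
#include <stdexcept>
#include "yaml-cpp/yaml.h"

int main() {
  try {
    const YAML::Node config = YAML::LoadFile("config.yml");
    if(!config["trials"]) {
      throw std::invalid_argument{"option 'trials' is not set"};
    }
    // as<int>() throws if the value cannot be converted to a number
    const int trials = config["trials"].as<int>();
    std::cout << "resummation trials per event: " << trials << '\n';
  }
  catch(std::exception const & exc) {
    std::cerr << "config error: " << exc.what() << '\n';
    return EXIT_FAILURE;
  }
}
\end{lstlisting}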
The information stored in the \lstinline!Config! object is then used to
initialise various objects required for the event processing stage
described in section~\ref{sec:processing}. First, the
\lstinline!get_analysis! function creates an object that inherits from
the \lstinline!Analysis! interface.\footnote{In the context of C++ the
proper technical expression is ``pure abstract class''.} Using an
interface allows us to decide the concrete type of the analysis at run
time instead of having to make a compile-time decision. Depending on the
settings, \lstinline!get_analysis! creates either a user-defined
analysis loaded from an external library (see the user documentation
\url{https://hej.web.cern.ch/HEJ/doc/current/user/}) or the default \lstinline!EmptyAnalysis!, which does
nothing.
Together with a number of further objects, whose roles are described in
section~\ref{sec:processing}, we also initialise the global random
number generator. We again use an interface to defer deciding the
concrete type until the program is actually run. Currently, we support the
\href{https://mixmax.hepforge.org/}{MIXMAX}
(\texttt{include/HEJ/Mixmax.hh}) and Ranlux64
(\texttt{include/HEJ/Ranlux64.hh}) random number generators, both provided
by \href{http://proj-clhep.web.cern.ch/}{CLHEP}.
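A stripped-down sketch of such an interface is shown below; the names and signatures are merely illustrative and do not reproduce the actual \HEJ random number generator interface.
\begin{lstlisting}[language=C++,caption={}]
#include <memory>
#include <random>
#include <stdexcept>
#include <string>

// minimal stand-in for a random number generator interface
struct RNG {
  virtual double flat() = 0;   // uniform random number in [0, 1)
  virtual ~RNG() = default;
};

struct Ranlux : RNG {
  double flat() override {
    return std::uniform_real_distribution<double>{0., 1.}(gen);
  }
  std::ranlux48 gen;
};

// the concrete type is only chosen at run time, based on the settings
std::unique_ptr<RNG> make_rng(std::string const & name) {
  if(name == "ranlux64") return std::make_unique<Ranlux>();
  throw std::invalid_argument{"unknown random generator: " + name};
}
\end{lstlisting}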
We also set up a \lstinline!HEJ::EventReader! object for reading events
either in the Les Houches event file format~\cite{Alwall:2006yp} or
an \href{https://www.hdfgroup.org/}{HDF5}-based
format~\cite{Hoeche:2019rti}. To allow making the decision at run time,
\lstinline!HEJ::EventReader! is an abstract base class defined in
\texttt{include/HEJ/EventReader.hh} and the implementations of the
derived classes are in \texttt{include/HEJ/LesHouchesReader.hh},
\texttt{include/HEJ/HDF5Reader.hh} and the corresponding \texttt{.cc}
source files in the \texttt{src} directory. The
\lstinline!LesHouchesReader! leverages
\href{http://home.thep.lu.se/~leif/LHEF/}{\texttt{include/LHEF/LHEF.h}}. A
small wrapper around the
\href{https://www.boost.org/doc/libs/1_67_0/libs/iostreams/doc/index.html}{boost
iostreams} library allows us to also read event files compressed with
\href{https://www.gnu.org/software/gzip/}{gzip}. The wrapper code is in
\texttt{include/HEJ/stream.hh} and \texttt{src/stream.cc}.
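The core of the gzip support can be sketched as follows; the file name is made up and the actual wrapper is organised differently.
\begin{lstlisting}[language=C++,caption={}]
#include <fstream>
#include <iostream>
#include <string>
#include <boost/iostreams/filter/gzip.hpp>
#include <boost/iostreams/filtering_stream.hpp>

int main() {
  std::ifstream file{"events.lhe.gz", std::ios_base::binary};
  boost::iostreams::filtering_istream in;
  in.push(boost::iostreams::gzip_decompressor()); // transparently inflate
  in.push(file);                                  // read from the raw file
  std::string line;
  while(std::getline(in, line)) std::cout << line << '\n';
}
\end{lstlisting}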
If unweighting is enabled, we also initialise an unweighter as defined
in \texttt{include/HEJ/Unweighter.hh}. The unweighting strategies are
explained in section~\ref{sec:unweight}.
\subsection{Event processing}
\label{sec:processing}
In the second stage, events are continuously read from the event
file. After jet clustering, a number of corresponding resummation events
are generated for each input event and fed into the analysis and a
number of output files. The roles of various classes and functions are
illustrated in the following flow chart:
\begin{center}
\begin{tikzpicture}[node distance=2cm and 5mm]
\node (reader) [mynode]
{\lstinline!EventReader::read_event!\nodepart{second}{read event}};
\node
(data) [mynode,below=of reader]
{\lstinline!Event::EventData! constructor\nodepart{second}{convert to \HEJ object}};
\node
(cluster) [mynode,below=of data]
{\lstinline!Event::EventData::cluster!\nodepart{second}{cluster jets \&
classify \lstinline!EventType!}};
\node
(resum) [mynode,below=of cluster]
{\lstinline!EventReweighter::reweight!\nodepart{second}{perform resummation}};
\node
(cut) [mynode,below=of resum]
{\lstinline!Analysis::pass_cuts!\nodepart{second}{apply cuts}};
\node
(unweight) [mynode,below=of cut]
{\lstinline!Unweighter::unweight!\nodepart{second}{unweight (optional)}};
\node
(fill) [mynode,below left=of unweight]
{\lstinline!Analysis::fill!\nodepart{second}{analyse event}};
\node
(write) [mynode,below right=of unweight]
{\lstinline!CombinedEventWriter::write!\nodepart{second}{write out event}};
\node
(control) [below=of unweight] {};
\draw[-{Latex[length=3mm, width=1.5mm]}]
(reader.south) -- node[left] {\lstinline!LHEF::HEPEUP!} (data.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(data.south) -- node[left] {\lstinline!Event::EventData!} (cluster.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(cluster.south) -- node[left] {\lstinline!Event!} (resum.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(resum.south) -- (cut.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(resum.south)+(10mm, 0cm)$) -- ($(cut.north)+(10mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(resum.south)+(5mm, 0cm)$) -- ($(cut.north)+(5mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(resum.south)-(5mm, 0cm)$) -- ($(cut.north)-(5mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(resum.south)-(10mm, 0cm)$) -- node[left] {\lstinline!Event!} ($(cut.north)-(10mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(cut.south) -- (unweight.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(cut.south)+(7mm, 0cm)$) -- ($(unweight.north)+(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(cut.south)-(7mm, 0cm)$) -- node[left] {\lstinline!Event!} ($(unweight.north)-(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(unweight.south)-(3mm,0mm)$) .. controls ($(control)-(3mm,0mm)$) ..node[left] {\lstinline!Event!} (fill.east);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(unweight.south)-(3mm,0mm)$) .. controls ($(control)-(3mm,0mm)$) .. (write.west);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(unweight.south)+(3mm,0mm)$) .. controls ($(control)+(3mm,0mm)$) .. (fill.east);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(unweight.south)+(3mm,0mm)$) .. controls ($(control)+(3mm,0mm)$) ..node[right] {\lstinline!Event!} (write.west);
\end{tikzpicture}
\end{center}
\lstinline!EventData! is an intermediate container whose members are completely
accessible. In contrast, after jet clustering and classification the phase space
inside \lstinline!Event! can no longer be changed
(\href{https://wikipedia.org/wiki/Builder_pattern}{Builder design pattern}). The
resummation is performed by the \lstinline!EventReweighter! class, which is
described in more detail in section~\ref{sec:resum}. The
\lstinline!CombinedEventWriter! writes events to zero or more output files. To
this end, it contains a number of objects implementing the
\lstinline!EventWriter! interface. These event writers typically write the
events to a file in a given format. We currently have the
\lstinline!LesHouchesWriter! for event files in the Les Houches Event File
-format and the \lstinline!HepMC2Writer! or \lstinline!HepMC3Writer! for the
-\href{https://hepmc.web.cern.ch/hepmc/}{HepMC} format (Version 2 and 3).
+format, the \lstinline!HDF5Writer! for
+\href{https://www.hdfgroup.org/}{HDF5}~\cite{Hoeche:2019rti} and the
+\lstinline!HepMC2Writer! or \lstinline!HepMC3Writer! for the
+\href{https://hepmc.web.cern.ch/hepmc/}{HepMC} format (Version 2 and
+3).
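The composition of writers can be pictured with the following simplified sketch; the member function names and signatures are assumptions for illustration only and do not reproduce the actual class definitions.
\begin{lstlisting}[language=C++,caption={}]
#include <memory>
#include <utility>
#include <vector>

struct Event; // stand-in for HEJ::Event

// common interface implemented by all event writers
struct EventWriter {
  virtual void write(Event const & ev) = 0;
  virtual ~EventWriter() = default;
};

// forwards each event to zero or more concrete writers
class CombinedEventWriter : public EventWriter {
public:
  void add(std::unique_ptr<EventWriter> writer) {
    writers_.emplace_back(std::move(writer));
  }
  void write(Event const & ev) override {
    for(auto & writer: writers_) writer->write(ev);
  }
private:
  std::vector<std::unique_ptr<EventWriter>> writers_;
};
\end{lstlisting}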
\subsection{Resummation}
\label{sec:resum}
In the \lstinline!EventReweighter::reweight! member function, we first
classify the input fixed-order event (FKL, unordered, non-resummable, \dots)
and decide according to the user settings whether to discard, keep, or
resum the event. If we perform resummation for the given event, we
generate a number of trial \lstinline!PhaseSpacePoint! objects. Phase
space generation is discussed in more detail in
section~\ref{sec:pspgen}. We then perform jet clustering according to
the settings for the resummation jets on each
\lstinline!PhaseSpacePoint!, update the factorisation and
renormalisation scale in the resulting \lstinline!Event! and reweight it
according to the ratio of pdf factors and \HEJ matrix elements between
resummation and original fixed-order event:
\begin{center}
\begin{tikzpicture}[node distance=1.5cm and 5mm]
\node (in) {};
\node (treat) [diamond,draw,below=of in,minimum size=3.5cm,
label={[anchor=west, inner sep=8pt]west:discard},
label={[anchor=east, inner sep=14pt]east:keep},
label={[anchor=south, inner sep=20pt]south:reweight}
] {};
\draw (treat.north west) -- (treat.south east);
\draw (treat.north east) -- (treat.south west);
\node
(psp) [mynode,below=of treat]
{\lstinline!PhaseSpacePoint! constructor};
\node
(cluster) [mynode,below=of psp]
{\lstinline!Event::EventData::cluster!\nodepart{second}{cluster jets}};
\node
(colour) [mynode,below=of cluster]
{\lstinline!Event::generate_colours()!\nodepart{second}{generate particle colour}};
\node
(gen_scales) [mynode,below=of colour]
{\lstinline!ScaleGenerator::operator()!\nodepart{second}{update scales}};
\node
(rescale) [mynode,below=of gen_scales]
{\lstinline!PDF::pdfpt!,
\lstinline!MatrixElement!\nodepart{second}{reweight}};
\node (out) [below of=rescale] {};
\draw[-{Latex[length=3mm, width=1.5mm]}]
(in.south) -- node[left] {\lstinline!Event!} (treat.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(treat.south) -- node[left] {\lstinline!Event!} (psp.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(psp.south) -- (cluster.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(psp.south)+(7mm, 0cm)$) -- ($(cluster.north)+(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(psp.south)-(7mm, 0cm)$) -- node[left]
{\lstinline!PhaseSpacePoint!} ($(cluster.north)-(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(cluster.south) -- (colour.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(cluster.south)+(7mm, 0cm)$) -- ($(colour.north)+(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(cluster.south)-(7mm, 0cm)$) -- node[left]
{\lstinline!Event!} ($(colour.north)-(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(colour.south) -- (gen_scales.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(colour.south)+(7mm, 0cm)$) -- ($(gen_scales.north)+(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(colour.south)-(7mm, 0cm)$) -- node[left]
{\lstinline!Event!} ($(gen_scales.north)-(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(gen_scales.south) -- (rescale.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(gen_scales.south)+(7mm, 0cm)$) -- ($(rescale.north)+(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(gen_scales.south)-(7mm, 0cm)$) -- node[left]
{\lstinline!Event!} ($(rescale.north)-(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
(rescale.south) -- (out.north);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(rescale.south)+(7mm, 0cm)$) -- ($(out.north)+(7mm, 0cm)$);
\draw[-{Latex[length=3mm, width=1.5mm]}]
($(rescale.south)-(7mm, 0cm)$) -- node[left]
{\lstinline!Event!} ($(out.north)-(7mm, 0cm)$);
\node (helper) at ($(treat.east) + (15mm,0cm)$) {};
\draw[-{Latex[length=3mm, width=1.5mm]}]
(treat.east) -- ($(treat.east) + (15mm,0cm)$)
-- node[left] {\lstinline!Event!} (helper |- gen_scales.east) -- (gen_scales.east)
;
\end{tikzpicture}
\end{center}
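The net effect of the final reweighting step in this chart can be summarised by the following toy function; it only captures the pdf and matrix-element ratios described above, all other factors of the master formula in the next section are omitted, and the inputs are plain numbers rather than the actual \lstinline!PDF! and \lstinline!MatrixElement! objects.
\begin{lstlisting}[language=C++,caption={}]
// multiply the fixed-order weight by the ratio of pdf factors and of
// HEJ matrix elements between resummation and Born kinematics
double reweight_factor(
    double pdf_resum, double pdf_born,
    double me_hej_resum, double me_lo_hej_born
) {
  return (pdf_resum / pdf_born) * (me_hej_resum / me_lo_hej_born);
}
\end{lstlisting}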
\subsection{Phase space point generation}
\label{sec:pspgen}
The resummed and matched \HEJ cross section for pure jet production of
FKL configurations is given by (cf. eq. (3) of~\cite{Andersen:2018tnm})
\begin{align}
\label{eq:resumdijetFKLmatched2}
% \begin{split}
\sigma&_{2j}^\mathrm{resum, match}=\sum_{f_1, f_2}\ \sum_m
\prod_{j=1}^m\left(
\int_{p_{j\perp}^B=0}^{p_{j\perp}^B=\infty}
\frac{\mathrm{d}^2\mathbf{p}_{j\perp}^B}{(2\pi)^3}\ \int
\frac{\mathrm{d} y_j^B}{2} \right) \
(2\pi)^4\ \delta^{(2)}\!\!\left(\sum_{k=1}^{m}
\mathbf{p}_{k\perp}^B\right)\nonumber\\
&\times\ x_a^B\ f_{a, f_1}(x_a^B, Q_a^B)\ x_b^B\ f_{b, f_2}(x_b^B, Q_b^B)\
\frac{\overline{\left|\mathcal{M}_\text{LO}^{f_1f_2\to f_1g\cdots
gf_2}\big(\big\{p^B_j\big\}\big)\right|}^2}{(\hat {s}^B)^2}\nonumber\\
& \times (2\pi)^{-4+3m}\ 2^m \nonumber\\
&\times\ \sum_{n=2}^\infty\
\int_{p_{1\perp}=p_{\perp,\mathrm{min}} }^{p_{1\perp}=\infty}
\frac{\mathrm{d}^2\mathbf{p}_{1\perp}}{(2\pi)^3}\
\int_{p_{n\perp}=p_{\perp,\mathrm{min}}}^{p_{n\perp}=\infty}
\frac{\mathrm{d}^2\mathbf{p}_{n\perp}}{(2\pi)^3}\
\prod_{i=2}^{n-1}\int_{p_{i\perp}=\lambda}^{p_{i\perp}=\infty}
\frac{\mathrm{d}^2\mathbf{p}_{i\perp}}{(2\pi)^3}\ (2\pi)^4\ \delta^{(2)}\!\!\left(\sum_{k=1}^n
\mathbf{p}_{k\perp}\right )\\
&\times \ \mathbf{T}_y \prod_{i=1}^n
\left(\int \frac{\mathrm{d} y_i}{2}\right)\
\mathcal{O}_{mj}^e\
\left(\prod_{l=1}^{m-1}\delta^{(2)}(\mathbf{p}_{\mathcal{J}_{l}\perp}^B -
\mathbf{j}_{l\perp})\right)\
\left(\prod_{l=1}^m\delta(y^B_{\mathcal{J}_l}-y_{\mathcal{J}_l})\right)
\ \mathcal{O}_{2j}(\{p_i\})\nonumber\\
&\times \frac{(\hat{s}^B)^2}{\hat{s}^2}\ \frac{x_a f_{a,f_1}(x_a, Q_a)\ x_b f_{b,f_2}(x_b, Q_b)}{x_a^B\ f_{a,f_1}(x_a^B, Q_a^B)\ x_b^B\ f_{b,f_2}(x_b^B, Q_b^B)}\ \frac{\overline{\left|\mathcal{M}_{\mathrm{HEJ}}^{f_1 f_2\to f_1 g\cdots
gf_2}(\{ p_i\})\right|}^2}{\overline{\left|\mathcal{M}_\text{LO, HEJ}^{f_1f_2\to f_1g\cdots
gf_2}\big(\big\{p^B_j\big\}\big)\right|}^{2}} \,.\nonumber
% \end{split}
\end{align}
The first two lines correspond to the generation of the fixed-order
input events with incoming partons $f_1, f_2$ and outgoing momenta
$p_j^B$, where $\mathbf{p}_{j\perp}^B$ and $y_j^B$ denote the respective
transverse momentum and rapidity. Note that, at leading order, these
coincide with the fixed-order jet momenta $p_{\mathcal{J}_j}^B$.
$f_{a,f_1}(x_a, Q_a),f_{b,f_2}(x_b, Q_b)$ are the pdf factors for the incoming partons with
momentum fractions $x_a$ and $x_b$. The square of the partonic
centre-of-mass energy is denoted by $\hat{s}^B$ and
$\mathcal{M}_\text{LO}^{f_1f_2\to f_1g\cdots gf_2}$ is the
leading-order matrix element.
The third line is a factor accounting for the different multiplicities
between fixed-order and resummation events. Lines four and five are
the integration over the resummation phase space described in this
section. $p_i$ are the momenta of the outgoing partons in resummation
phase space. $\mathbf{T}_y$ denotes rapidity
ordering and $\mathcal{O}_{mj}^e$ projects out the exclusive $m$-jet
component. The relation between resummation and fixed-order momenta is
fixed by the $\delta$ functions. The first sets each transverse fixed-order jet
momentum to some function $\mathbf{j_{l\perp}}$ of the resummation
momenta. The exact form is described in section~\ref{sec:ptj_res}. The second
$\delta$ forces the rapidities of resummation and fixed-order jets to be
the same. Finally, the last line is the reweighting of pdf and matrix
element factors already shown in section~\ref{sec:resum}.
There are two kinds of cut-off in the integration over the resummation
partons. $\lambda$ is a technical cut-off connected to the cancellation
of infrared divergencies between real and virtual corrections. Its
numerical value is set in
\texttt{include/HEJ/Constants.h}. $p_{\perp,\mathrm{min}}$ regulates
an \emph{uncancelled} divergence in the extremal parton momenta. Its
size is set in the user configuration, see \url{https://hej.web.cern.ch/HEJ/doc/current/user/HEJ.html#settings}.
It is straightforward to generalise eq.~(\ref{eq:resumdijetFKLmatched2})
to unordered configurations and processes with additional colourless
emissions, for example a Higgs or electroweak boson. In the latter case only
the fixed-order integration and the matrix elements change.
\subsubsection{Gluon Multiplicity}
\label{sec:psp_ng}
The first step in evaluating the resummation phase space in
eq.~(\ref{eq:resumdijetFKLmatched2}) is to randomly pick terms in the
sum over the number of emissions. This sampling of the gluon
multiplicity is done in the \lstinline!PhaseSpacePoint::sample_ng!
function in \texttt{src/PhaseSpacePoint.cc}.
The typical number of extra emissions depends strongly on the rapidity
span of the underlying fixed-order event. Let us, for example, consider
a fixed-order FKL-type multi-jet configuration with rapidities
$y_{j_f},\,y_{j_b}$ of the most forward and backward jets,
respectively. By eq.~(\ref{eq:resumdijetFKLmatched2}), the jet
multiplicity and the rapidity of each jet are conserved when adding
resummation. This implies that additional hard radiation is restricted
to rapidities $y$ within a region $y_{j_b} \lesssim y \lesssim
y_{j_f}$. Within \HEJ, we require the most forward and most backward
emissions to be hard \todo{specify how hard} in order to avoid divergences, so this constraint
in fact applies to \emph{all} additional radiation.
To simplify the remaining discussion, let us remove the FKL rapidity
ordering
\begin{equation}
\label{eq:remove_y_order}
\mathbf{T}_y \prod_{i=1}^n\int \frac{\mathrm{d}y_i}{2} =
\frac{1}{n!}\prod_{i=1}^n\int
\frac{\mathrm{d}y_i}{2}\,,
\end{equation}
where all rapidity integrals now cover a region which is approximately
bounded by $y_{j_b}$ and $y_{j_f}$. Each of the $m$ jets has to contain at least
one parton; selecting random emissions we can rewrite the phase space
integrals as
\begin{equation}
\label{eq:select_jets}
\frac{1}{n!}\prod_{i=1}^n\int [\mathrm{d}p_i] =
\left(\prod_{i=1}^{m}\int [\mathrm{d}p_i]\ {\cal J}_i(p_i)\right)
\frac{1}{n_g!}\prod_{i=m+1}^{m+n_g}\int [\mathrm{d}p_i]
\end{equation}
with jet selection functions
\begin{equation}
\label{eq:def_jet_selection}
{\cal J}_i(p) =
\begin{cases}
1 &p\text{ clustered into jet }i\\
0 & \text{otherwise}
\end{cases}
\end{equation}
and $n_g \equiv n - m$. Here and in the following we use the short-hand
notation $[\mathrm{d}p_i]$ to denote the phase-space measure for parton
$i$. As is evident from eq.~\eqref{eq:select_jets}, adding an extra emission
$n_g+1$ introduces a suppression factor $\tfrac{1}{n_g+1}$. However, the
additional phase space integral also results in an enhancement proportional
to $\Delta y_{j_f j_b} = y_{j_f} - y_{j_b}$. This is a result of the
rapidity-independence of the MRK limit of the integrand, consisting of the
matrix elements divided by the flux factor. Indeed, we observe that the
typical number of gluon emissions is to a good approximation proportional to
the rapidity separation and the phase space integral is dominated by events
with $n_g \approx \Delta y_{j_f j_b}$.
For the actual phase space sampling, we assume a Poisson distribution.
We extract the mean number of gluon emissions in different rapidity
bins and fit the results to a linear function of $\Delta y_{j_f j_b}$,
finding a coefficient of $0.975$ for the inclusive production of a Higgs
boson with two jets. The following plot shows the observed and fitted average gluon
multiplicities as a function of $\Delta y_{j_f j_b}$:
\begin{center}
\includegraphics[width=.75\textwidth]{ng_mean}
\end{center}
As shown for two rapidity slices the assumption of a Poisson
distribution is also a good approximation:
\begin{center}
\includegraphics[width=.49\textwidth]{{ng_1.5}.pdf}\hfill
\includegraphics[width=.49\textwidth]{{ng_5.5}.pdf}
\end{center}
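A minimal sketch of this sampling step, assuming the fitted coefficient $0.975$ can be used as a plain constant (the actual \lstinline!PhaseSpacePoint::sample_ng! is more involved):
\begin{lstlisting}[language=C++,caption={}]
#include <random>

// draw the number of extra gluon emissions from a Poisson distribution
// whose mean grows linearly with the rapidity span of the extremal jets
int sample_ng_sketch(double delta_y_jets, std::mt19937 & gen) {
  const double mean_ng = 0.975 * delta_y_jets;
  std::poisson_distribution<int> n_gluons{mean_ng};
  return n_gluons(gen);
}
\end{lstlisting}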
\subsubsection{Number of Gluons inside Jets}
\label{sec:psp_ng_jet}
For each of the $n_g$ gluon emissions we can split the phase-space
integral into a (disconnected) region inside the jets and a remainder:
\begin{equation}
\label{eq:psp_split}
\int [\mathrm{d}p_i] = \int [\mathrm{d}p_i]\,
\theta\bigg(\sum_{j=1}^{m}{\cal J}_j(p_i)\bigg) + \int [\mathrm{d}p_i]\,
\bigg[1-\theta\bigg(\sum_{j=1}^{m}{\cal J}_j(p_i)\bigg)\bigg]\,.
\end{equation}
The next step is to decide how many of the gluons will form part of a
jet. This is done in the \lstinline!PhaseSpacePoint::sample_ng_jets!
function.
We choose an importance sampling which is flat in the plane
spanned by the azimuthal angle $\phi$ and the rapidity $y$. This is
observed in BFKL and valid in the limit of Multi-Regge-Kinematics
(MRK). Furthermore, we assume anti-$k_t$ jets, which cover an area of
$\pi R^2$.
In principle, the total accessible area in the $y$-$\phi$ plane is given
by $2\pi \Delta y_{fb}$, where $\Delta y_{fb}\geq \Delta y_{j_f j_b}$ is
the a priori unknown rapidity separation between the most forward and
backward partons. In most cases the extremal jets consist of single
partons, so that $\Delta y_{fb} = \Delta y_{j_f j_b}$. For the less common
case of two partons forming a jet we observe a maximum distance of $R$
between the constituents and the jet centre. In rare cases jets have
more than two constituents. Empirically, they are always within a
distance of $\tfrac{5}{3}R$ to the centre of the jet, so
$\Delta y_{fb} \leq \Delta y_{j_f j_b} + \tfrac{10}{3} R$. In practice, the
extremal partons are required to carry a large fraction of the jet
transverse momentum and will therefore be much closer to the jet axis.
In summary, for sufficiently large rapidity separations we can use the
approximation $\Delta y_{fb} \approx \Delta y_{j_f j_b}$. This scenario
is depicted here:
\begin{center}
\includegraphics[width=0.5\linewidth]{ps_large_y}
\end{center}
If there is no overlap between jets, the probability $p_{\cal J, >}$ for
an extra gluon to end up inside a jet is then given by
\begin{equation}
\label{eq:p_J_large}
p_{\cal J, >} = \frac{(m - 1)\*R^2}{2\Delta y_{j_f j_b}}\,.
\end{equation}
For a very small rapidity separation, eq.~\eqref{eq:p_J_large}
obviously overestimates the true probability. The maximum phase space
covered by jets in the limit of a vanishing rapidity distance between
all partons is $2mR \Delta y_{fb}$:
\begin{center}
\includegraphics[width=0.5\linewidth]{ps_small_y}
\end{center}
We therefore estimate the probability for a parton to end up inside a jet as
\begin{equation}
\label{eq:p_J}
p_{\cal J} = \min\bigg(\frac{(m - 1)\*R^2}{2\Delta y_{j_f j_b}}, \frac{mR}{\pi}\bigg)\,.
\end{equation}
Here we compare this estimate with the actually observed
fraction of additional emissions into jets as a function of the rapidity
separation:
\begin{center}
\includegraphics[width=0.75\linewidth]{pJ}
\end{center}
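Eq.~\eqref{eq:p_J} translates directly into a small helper function; the following stand-alone version is only meant to illustrate the interpolation between the two limits and is not taken from the \HEJ sources.
\begin{lstlisting}[language=C++,caption={}]
#include <algorithm>

// estimated probability for an additional gluon to end up inside
// one of the m jets, cf. eq. (p_J)
double prob_inside_jet(int m, double R, double delta_y_jets) {
  constexpr double pi = 3.141592653589793;
  const double p_large_dy = (m - 1)*R*R / (2.*delta_y_jets); // eq. (p_J_large)
  const double p_small_dy = m*R / pi; // limit of vanishing rapidity distance
  return std::min(p_large_dy, p_small_dy);
}
\end{lstlisting}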
\subsubsection{Gluons outside Jets}
\label{sec:gluons_nonjet}
Using our estimate for the probability of a gluon to be a jet
constituent, we choose a number $n_{g,{\cal J}}$ of gluons inside
jets, which also fixes the number $n_g - n_{g,{\cal J}}$ of gluons
outside jets. As explained later on, we need to generate the momenta of
the gluons outside jets first. This is done in
\lstinline!PhaseSpacePoint::gen_non_jet!.
The azimuthal angle $\phi$ is generated flat within $0\leq \phi \leq 2
\pi$. The allowed rapidity interval is set by the most forward and
backward partons, which are necessarily inside jets. Since these parton
rapidities are not known at this point, we also have to postpone the
rapidity generation for the gluons outside jets. For the scalar
transverse momentum $p_\perp = |\mathbf{p}_\perp|$ of a gluon outside
jets we use the parametrisation
\begin{equation}
\label{eq:p_nonjet}
p_\perp = \lambda + \tilde{p}_\perp\*\tan(\tau\*r)\,, \qquad
\tau = \arctan\bigg(\frac{p_{\perp{\cal J}_\text{min}} - \lambda}{\tilde{p}_\perp}\bigg)\,.
\end{equation}
For $r \in [0,1)$, $p_\perp$ is always less than the minimum momentum
$p_{\perp{\cal J}_\text{min}}$ required for a jet. $\tilde{p}_\perp$ is
a free parameter; a good empirical value is $\tilde{p}_\perp = [1.3 +
0.2\*(n_g - n_{g,\cal J})]\,$GeV.
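As an illustration, eq.~\eqref{eq:p_nonjet} corresponds to the following mapping from a uniform random number $r$ to the transverse momentum (not the actual implementation):
\begin{lstlisting}[language=C++,caption={}]
#include <cmath>

// transverse momentum of a parton outside jets, cf. eq. (p_nonjet);
// for r in [0,1) the result always stays below the jet threshold pt_J_min
double pt_outside_jet(double r, double lambda, double pt_tilde, double pt_J_min) {
  const double tau = std::atan((pt_J_min - lambda) / pt_tilde);
  return lambda + pt_tilde * std::tan(tau * r);
}
\end{lstlisting}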
\subsubsection{Resummation jet momenta}
\label{sec:ptj_res}
On the one hand, each jet momentum is given by the sum of its
constituent momenta. On the other hand, the resummation jet momenta are
fixed by the constraints in line five of the master
equation~\eqref{eq:resumdijetFKLmatched2}. We therefore have to
calculate the resummation jet momenta from these constraints before
generating the momenta of the gluons inside jets. This is done in
\lstinline!PhaseSpacePoint::reshuffle! and in the free
\lstinline!resummation_jet_momenta! function (declared in \texttt{resummation\_jet.hh}).
The resummation jet momenta are determined by the $\delta$ functions in
line five of eq.~(\ref{eq:resumdijetFKLmatched2}). The rapidities are
fixed to the rapidities of the jets in the input fixed-order events, so
that the FKL ordering is guaranteed to be preserved.
In traditional \HEJ reshuffling the transverse momenta are given by
\begin{equation}
\label{eq:ptreassign_old}
\mathbf{p}^B_{\mathcal{J}_{l\perp}} = \mathbf{j}_{l\perp} \equiv \mathbf{p}_{\mathcal{J}_{l}\perp}
+ \mathbf{q}_\perp \,\frac{|\mathbf{p}_{\mathcal{J}_{l}\perp}|}{P_\perp},
\end{equation}
where $\mathbf{q}_\perp = \sum_{i=1}^n \mathbf{p}_{i\perp}
\bigg[1-\theta\bigg(\sum_{j=1}^{m}{\cal J}_j(p_i)\bigg)\bigg] $ is the
total transverse momentum of all partons \emph{outside} jets and
$P_\perp = \sum_{j=1}^m |\mathbf{p}_{\mathcal{J}_{j}\perp}|$. Since the
total transverse momentum of an event vanishes, we can also use
$\mathbf{q}_\perp = - \sum_{j=1}^m
\mathbf{p}_{\mathcal{J}_{j}\perp}$. Eq.~(\ref{eq:ptreassign_old}) is a
non-linear system of equations in the resummation jet momenta
$\mathbf{p}_{\mathcal{J}_{l}\perp}$. Hence we would have to solve
\begin{equation}
\label{eq:ptreassign_eq}
\mathbf{p}_{\mathcal{J}_{l}\perp}=\mathbf{j}^B_{l\perp} \equiv\mathbf{j}_{l\perp}^{-1}
\left(\mathbf{p}^B_{\mathcal{J}_{l\perp}}\right)
\end{equation}
numerically.
Since solving such a system is computationally expensive, we instead
modify the reshuffling so that it is linear in the resummation jet
momenta. Hence~\eqref{eq:ptreassign_eq} is replaced by
\begin{equation}
\label{eq:ptreassign}
\mathbf{p}_{\mathcal{J}_{l\perp}} = \mathbf{j}^B_{l\perp} \equiv \mathbf{p}^B_{\mathcal{J}_{l}\perp}
- \mathbf{q}_\perp \,\frac{|\mathbf{p}^B_{\mathcal{J}_{l}\perp}|}{P^B_\perp},
\end{equation}
which is linear in the resummation momenta. Consequently, the equivalent
of~\eqref{eq:ptreassign_old} is non-linear in the Born momenta. However,
the exact form of~\eqref{eq:ptreassign_old} is not relevant for the resummation.
Both methods have been tested for two and three jets with the standard
\textsc{rivet} analysis \texttt{MC\_JETS}; they show no differences even
after $10^9$ events.
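The linear reshuffling~\eqref{eq:ptreassign} amounts to a simple loop over the Born jets; in the following illustrative sketch the two-component vector type and the function name are invented, the actual implementation is the free \lstinline!resummation_jet_momenta! function.
\begin{lstlisting}[language=C++,caption={}]
#include <array>
#include <cmath>
#include <vector>

using PtVec = std::array<double, 2>; // toy transverse-momentum 2-vector

// shift each Born jet momentum by a fraction of the total non-jet
// transverse momentum qperp, proportional to its share of the scalar
// sum of Born jet momenta, cf. eq. (ptreassign)
std::vector<PtVec> reshuffled_jets(
    std::vector<PtVec> const & born_jets, PtVec const & qperp
) {
  double sum_ptB = 0.;
  for(auto const & j: born_jets) sum_ptB += std::hypot(j[0], j[1]);
  std::vector<PtVec> jets;
  for(auto const & j: born_jets) {
    const double frac = std::hypot(j[0], j[1]) / sum_ptB;
    jets.push_back(PtVec{j[0] - frac*qperp[0], j[1] - frac*qperp[1]});
  }
  return jets;
}
\end{lstlisting}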
The reshuffling relation~\eqref{eq:ptreassign} allows the transverse
momenta $p^B_{\mathcal{J}_{l\perp}}$ of the fixed-order jets to be
somewhat below the minimum transverse momentum of resummation jets. It
is crucial that this difference does not become too large, as the
fixed-order cross section diverges for vanishing transverse momenta. In
the production of a Higgs boson with resummation jets above $30\,$GeV we observe
that the contribution from fixed-order events with jets softer than
about $20\,$GeV can be safely neglected. This is shown in the following
plot of the differential cross section over the transverse momentum of
the softest fixed-order jet:
\begin{center}
\includegraphics[width=.75\textwidth]{ptBMin}
\end{center}
Finally, we have to account for the fact that the reshuffling
relation~\eqref{eq:ptreassign} is non-linear in the Born momenta. To
arrive at the master formula~\eqref{eq:resumdijetFKLmatched2} for the
cross section, we have introduced unity in the form of an integral over
the Born momenta with $\delta$ functions in the integrand, that is
\begin{equation}
\label{eq:delta_intro}
1 = \int_{p_{j\perp}^B=0}^{p_{j\perp}^B=\infty}
\mathrm{d}^2\mathbf{p}_{j\perp}^B\delta^{(2)}(\mathbf{p}_{\mathcal{J}_{j\perp}}^B -
\mathbf{j}_{j\perp})\,.
\end{equation}
If the arguments of the $\delta$ functions are not linear in the Born
momenta, we have to compensate with additional Jacobians as
factors. Explicitly, for the reshuffling relation~\eqref{eq:ptreassign}
we have
\begin{equation}
\label{eq:delta_rewrite}
\prod_{l=1}^m \delta^{(2)}(\mathbf{p}_{\mathcal{J}_{l\perp}}^B -
\mathbf{j}_{l\perp}) = \Delta \prod_{l=1}^m \delta^{(2)}(\mathbf{p}_{\mathcal{J}_{l\perp}} -
\mathbf{j}_{l\perp}^B)\,,
\end{equation}
where $\mathbf{j}_{l\perp}^B$ is given by~\eqref{eq:ptreassign_eq} and only
depends on the Born momenta. We have extended the product to run to $m$
instead of $m-1$ by eliminating the last $\delta$ function
$\delta^{(2)}\!\!\left(\sum_{k=1}^n \mathbf{p}_{k\perp}\right )$.
The Jacobian $\Delta$ is the determinant of a $2m \times 2m$ matrix with $l, l' = 1,\dots,m$
and $X, X' = x,y$.
\begin{equation}
\label{eq:jacobian}
\Delta = \left|\frac{\partial\,\mathbf{j}^B_{l'\perp}}{\partial\, \mathbf{p}^B_{{\cal J}_l \perp}} \right|
= \left| \delta_{l l'} \delta_{X X'} - \frac{q_X\, p^B_{{\cal
J}_{l'}X'}}{\left|\mathbf{p}^B_{{\cal J}_{l'} \perp}\right| P^B_\perp}\left(\delta_{l l'}
- \frac{\left|\mathbf{p}^B_{{\cal J}_l \perp}\right|}{P^B_\perp}\right)\right|\,.
\end{equation}
The determinant is calculated in \lstinline!resummation_jet_weight!,
again coming from the \texttt{resummation\_jet.hh} header.
Having to introduce this Jacobian is not a disadvantage specific to the new
reshuffling. If we instead use the old reshuffling
relation~\eqref{eq:ptreassign_old} we \emph{also} have to introduce a
similar Jacobian since we actually want to integrate over the
resummation phase space and need to transform the argument of the
$\delta$ function to be linear in the resummation momenta for this.
\subsubsection{Gluons inside Jets}
\label{sec:gluons_jet}
After the steps outlined in section~\ref{sec:psp_ng_jet}, we have a
total number of $m + n_{g,{\cal J}}$ constituents. In
\lstinline!PhaseSpacePoint::distribute_jet_partons! we distribute them
randomly among the jets such that each jet has at least one
constituent. We then generate their momenta in
\lstinline!PhaseSpacePoint::split! using the \lstinline!Splitter! class.
The phase space integral for a jet ${\cal J}$ is given by
\begin{equation}
\label{eq:ps_jetparton} \prod_{i\text{ in }{\cal J}} \bigg(\int
\mathrm{d}\mathbf{p}_{i\perp}\ \int \mathrm{d} y_i
\bigg)\delta^{(2)}\Big(\sum_{i\text{ in }{\cal J}} \mathbf{p}_{i\perp} -
\mathbf{j}_{\perp}^B\Big)\delta(y_{\mathcal{J}}-y^B_{\mathcal{J}})\,.
\end{equation}
For jets with a single constituent, the parton momentum is obviously equal to the
jet momentum. In the case of two constituents, we observe that the
partons are always inside the jet cone with radius $R$ and often very
close to the jet centre. The following plots show the typical relative
distance $\Delta R/R$ for this scenario:
\begin{center}
\includegraphics[width=0.45\linewidth]{dR_2}
\includegraphics[width=0.45\linewidth]{dR_2_small}
\end{center}
According to this preference for small values of $\Delta R$, we
parametrise the $\Delta R$ integrals as
\begin{equation}
\label{eq:dR_sampling}
\frac{\Delta R}{R} =
\begin{cases}
0.25\,x_R & x_R < 0.4 \\
1.5\,x_R - 0.5 & x_R \geq 0.4
\end{cases}\,.
\end{equation}
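In code, this mapping is simply (shown only for illustration):
\begin{lstlisting}[language=C++,caption={}]
// piecewise-linear sampling of Delta R / R from a uniform x_R in [0,1),
// favouring small separations, cf. eq. (dR_sampling)
double delta_R_over_R(double x_R) {
  return x_R < 0.4 ? 0.25*x_R : 1.5*x_R - 0.5;
}
\end{lstlisting}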
Next, we generate $\Theta_1 \equiv \Theta$ and use the constraint $\Theta_2 = \Theta
\pm \pi$. The transverse momentum of the first parton is then given by
\begin{equation}
\label{eq:delta_constraints}
p_{1\perp} =
\frac{p_{\mathcal{J} y} - \tan(\phi_2) p_{\mathcal{J} x}}{\sin(\phi_1)
- \tan(\phi_2)\cos(\phi_1)}\,.
\end{equation}
We get $p_{2\perp}$ by exchanging $1 \leftrightarrow 2$ in the
indices. To obtain the Jacobian of the transformation, we start from the
single jet phase space eq.~(\ref{eq:ps_jetparton}) with the rapidity
delta function already rewritten to be linear in the rapidity of the
last parton, i.e.
\begin{equation}
\label{eq:jet_2p}
\prod_{i=1,2} \bigg(\int
\mathrm{d}\mathbf{p}_{i\perp}\ \int \mathrm{d} y_i
\bigg)\delta^{(2)}\Big(\mathbf{p}_{1\perp} + \mathbf{p}_{2\perp} -
\mathbf{j}_{\perp}^B\Big)\delta(y_2- \dots)\,.
\end{equation}
The integral over the second parton momentum is now trivial; we can just replace
the integral over $y_2$ with the equivalent constraint
\begin{equation}
\label{eq:R2}
\int \mathrm{d}R_2 \ \delta\bigg(R_2 - \bigg[\phi_{\cal J} - \arctan
\bigg(\frac{p_{{\cal J}y} - p_{1y}}{p_{{\cal J}x} -
p_{1x}}\bigg)\bigg]/\cos \Theta\bigg) \,.
\end{equation}
In order to fix the integral over $p_{1\perp}$ instead, we rewrite this
$\delta$ function. This introduces the Jacobian
\begin{equation}
\label{eq:jac_pt1}
\bigg|\frac{\partial p_{1\perp}}{\partial R_2} \bigg| =
\frac{\cos(\Theta)\mathbf{p}_{2\perp}^2}{p_{{\cal J}\perp}\sin(\phi_{\cal J}-\phi_1)}\,.
\end{equation}
The final form of the integral over the two parton momenta is then
\begin{equation}
\label{eq:ps_jet_2p}
\int \mathrm{d}R_1\ R_1 \int \mathrm{d}R_2 \int \mathrm{d}x_\Theta\ 2\pi \int
\mathrm{d}p_{1\perp}\ p_{1\perp} \int \mathrm{d}p_{2\perp}
\ \bigg|\frac{\partial p_{1\perp}}{\partial R_2} \bigg|\delta(p_{1\perp}
-\dots) \delta(p_{2\perp} - \dots)\,.
\end{equation}
As is evident from section~\ref{sec:psp_ng_jet}, jets with three or more
constituents are rare and an efficient phase-space sampling is less
important. For such jets, we exploit the observation that partons with a
distance larger than $R_{\text{max}} = \tfrac{5}{3} R$ to
the jet centre are never clustered into the jet. Assuming $N$
constituents, we generate all components
for the first $N-1$ partons and fix the remaining parton with the
$\delta$-functional. In order to end up inside the jet, we use the
parametrisation
\begin{align}
\label{eq:ps_jet_param}
\phi_i ={}& \phi_{\cal J} + \Delta \phi_i\,, & \Delta \phi_i ={}& \Delta
R_i
\cos(\Theta_i)\,, \\
y_i ={}& y_{\cal J} + \Delta y_i\,, & \Delta y_i ={}& \Delta
R_i
\sin(\Theta_i)\,,
\end{align}
and generate $\Theta_i$ and $\Delta R_i$ randomly with $\Delta R_i \leq
R_{\text{max}}$ and the empiric value $R_{\text{max}} = 5\*R/3$. We can
then write the phase space integral for a single parton as $(p_\perp = |\mathbf{p}_\perp|)$
\begin{equation}
\label{eq:ps_jetparton_x}
\int \mathrm{d}\mathbf{p}_{\perp}\ \int
\mathrm{d} y \approx \int_{\Box} \mathrm{d}x_{\perp}
\mathrm{d}x_{ R}
\mathrm{d}x_{\theta}\
2\*\pi\,\*R_{\text{max}}^2\,\*x_{R}\,\*p_{\perp}\,\*(p_{\perp,\text{max}}
- p_{\perp,\text{min}})
\end{equation}
with
\begin{align}
\label{eq:ps_jetparton_parameters}
\Delta \phi ={}& R_{\text{max}}\*x_{R}\*\cos(2\*\pi\*x_\theta)\,,&
\Delta y ={}& R_{\text{max}}\*x_{R}\*\sin(2\*\pi\*x_\theta)\,, \\
p_{\perp} ={}& (p_{\perp,\text{max}} - p_{\perp,\text{min}})\*x_\perp +
p_{\perp,\text{min}}\,.
\end{align}
$p_{\perp,\text{max}}$ is determined from the requirement that the total
contribution from the first $n-1$ partons --- i.e. the projection onto the
jet $p_{\perp}$ axis --- must never exceed the jet $p_\perp$. This gives
\todo{This bound is too high}
\begin{equation}
\label{eq:pt_max}
p_{i\perp,\text{max}} = \frac{p_{{\cal J}\perp} - \sum_{j<i} p_{j\perp}
\cos \Delta
\phi_j}{\cos \Delta
\phi_i}\,.
\end{equation}
The $x$ and $y$ components of the last parton follow immediately from
the first $\delta$ function. The last rapidity is fixed by the condition that
the jet rapidity is kept fixed by the reshuffling, i.e.
\begin{equation}
\label{eq:yJ_delta}
y^B_{\cal J} = y_{\cal J} = \frac 1 2 \ln \frac{\sum_{i=1}^n \left(E_i+ p_{iz}\right)}{\sum_{i=1}^n \left(E_i - p_{iz}\right)}\,.
\end{equation}
With $E_n \pm p_{nz} = p_{n\perp}\exp(\pm y_n)$ this can be rewritten to
\begin{equation}
\label{eq:yn_quad_eq}
\exp(2y_{\cal J}) = \frac{\sum_{i=1}^{n-1} \left(E_i+ p_{iz}\right)+p_{n\perp} \exp(y_n)}{\sum_{i=1}^{n-1} \left(E_i - p_{iz}\right)+p_{n\perp} \exp(-y_n)}\,,
\end{equation}
which is a quadratic equation in $\exp(y_n)$. The physical solution is
\begin{align}
\label{eq:yn}
y_n ={}& \log\Big(-b + \sqrt{b^2 + \exp(2y_{\cal J})}\,\Big)\,,\\
b ={}& \bigg(\sum_{i=1}^{n-1} \left(E_i + p_{iz}\right) - \exp(2y_{\cal J})
\sum_{i=1}^{n-1} \left(E_i - p_{iz}\right)\bigg)/(2 p_{n\perp})\,.
\end{align}
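A direct transcription of eq.~\eqref{eq:yn}, with the sums over the first $n-1$ constituents passed in as plain numbers (illustrative only):
\begin{lstlisting}[language=C++,caption={}]
#include <cmath>

// rapidity of the last jet constituent, fixed by the requirement that
// the jet rapidity stays at its Born value y_J, cf. eq. (yn)
double last_parton_rapidity(
    double y_J, double pt_n,
    double sum_E_plus_pz,   // sum of E_i + p_{iz} over the first n-1 partons
    double sum_E_minus_pz   // sum of E_i - p_{iz} over the first n-1 partons
) {
  const double b =
    (sum_E_plus_pz - std::exp(2.*y_J)*sum_E_minus_pz) / (2.*pt_n);
  return std::log(-b + std::sqrt(b*b + std::exp(2.*y_J)));
}
\end{lstlisting}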
\todo{what's wrong with the following?} To eliminate the remaining rapidity
integral, we transform the $\delta$ function to be linear in the
rapidity $y$ of the last parton. The corresponding Jacobian is
\begin{equation}
\label{eq:jacobian_y}
\bigg|\frac{\partial y_{\cal J}}{\partial y_n}\bigg|^{-1} = 2 \bigg( \frac{E_n +
p_{nz}}{E_{\cal J} + p_{{\cal J}z}} + \frac{E_n - p_{nz}}{E_{\cal J} -
p_{{\cal J}z}}\bigg)^{-1}\,.
\end{equation}
Finally, we check that all designated constituents are actually
clustered into the considered jet.
\subsubsection{Final steps}
\label{sec:final}
Knowing the rapidity span covered by the extremal partons, we can now
generate the rapidities for the partons outside jets. We perform jet
clustering on all partons and check in
\lstinline!PhaseSpacePoint::jets_ok! that all the following criteria are
fulfilled:
\begin{itemize}
\item The number of resummation jets must match the number of
fixed-order jets.
\item No partons designated to be outside jets may end up inside jets.
\item All other outgoing partons \emph{must} end up inside jets.
\item The extremal (in rapidity) partons must be inside the extremal
jets. If there is, for example, an unordered forward emission, the
most forward parton must end up inside the most forward jet and the
next parton must end up inside the second jet.
\item The rapidities of fixed-order and resummation jets must match.
\end{itemize}
After this, we adjust the phase-space normalisation according to the
third line of eq.~(\ref{eq:resumdijetFKLmatched2}), determine the
flavours of the outgoing partons, and adopt any additional colourless
bosons from the fixed-order input event. Finally, we use momentum
conservation to reconstruct the momenta of the incoming partons.
\subsection{Colour connection}
\label{sec:Colour}
\begin{figure}
\input{src/ColourConnect.tex}
\caption{Left: Non-crossing colour flow dominating in the MRK limit. The
crossing of the colour line connecting to particle 2 can be resolved by
drawing particle 2 on the left. Right: A colour flow with a (manifest)
colour crossing. The crossing can only be resolved by breaking the
rapidity ordering, e.g. by switching particles 2 and 3. From~\cite{Andersen:2017sht}.}
\label{fig:Colour_crossing}
\end{figure}
After the phase space for the resummation event is generated, we can construct
the colour flow for each particle. To generate the colours one has to call
\lstinline!Event::generate_colours! on any \HEJ configuration. For non-\HEJ
events we do not change the colours, but assume they are provided by the user (e.g.
through the LHE file input). The colour connection is constructed in the large-$N_c$
(infinite number of colours) limit with leading colour in
MRK~\cite{Andersen:2008ue, Andersen:2017sht}. The idea is to allow only
$t$-channel colour exchange, without any crossing colour lines. For example, the
colour crossing in the colour connection on the left of
figure~\ref{fig:Colour_crossing} can be resolved by switching \textit{particle
2} to the left.
We can write down the colour connections by following the colour flow from
\textit{gluon a} to \textit{gluon b} and back to \textit{gluon a}, e.g.
figure~\ref{fig:Colour_gright} corresponds to $a123ba$. In such an expression any
valid, non-crossing colour flow will connect all external legs while respecting
the rapidity ordering. Thus configurations like the left of
figure~\ref{fig:Colour_crossing} are allowed ($a134b2a$), but the right of the
same figure breaks the rapidity ordering between 2 and 3 ($a1324ba$). Note that
connections between $b$ and $a$ are in inverse order, e.g. $ab321a$ corresponds to~\ref{fig:Colour_gright} ($a123ba$) just with colour and anti-colour swapped.
\begin{figure}
\centering
\subcaptionbox{$a123ba$\label{fig:Colour_gright}}{
\includegraphics[height=0.25\textwidth]{figures/colour_gright.jpg}}
\subcaptionbox{$a13b2a$\label{fig:Colour_gleft}}{
\includegraphics[height=0.25\textwidth]{figures/colour_gleft.jpg}}
\subcaptionbox{$a\_123ba$\label{fig:Colour_qx}}{
\includegraphics[height=0.25\textwidth]{figures/colour_qx.jpg}}
\subcaptionbox{$a\_23b1a$\label{fig:Colour_uno}}{
\includegraphics[height=0.25\textwidth]{figures/colour_uno.jpg}}
\subcaptionbox{$a14b3\_2a$\label{fig:Colour_qqx}}{
\includegraphics[height=0.25\textwidth]{figures/colour_centralqqx.jpg}}
\caption{Different non-crossing colour connections. The incoming
particles are drawn at the top and bottom, the outgoing ones on the left and right.
The Feynman diagram is shown in black and the colour flow in blue.}
%TODO Maybe make these plots nicer (in Latex/asy)
\end{figure}
If we replace two gluons with a quark-antiquark pair, we break one of the
colour connections. The basic concept from before still holds; we just have to
treat the connection between two (anti-)quarks like an unmovable (anti-)colour.
We denote such a connection by an underscore (e.g. $1\_a$). For example, the
equivalent of~\ref{fig:Colour_gright} ($a123ba$) with an incoming antiquark
is~\ref{fig:Colour_qx} ($a\_123ba$). The same holds for other
subleading configurations like unordered emissions~\ref{fig:Colour_uno} or
central quark-antiquark pairs~\ref{fig:Colour_qqx}\footnote{Obviously this
cannot be guaranteed for non-\HEJ configurations, e.g. $qQ\to Qq$ requires a
$u$-channel exchange.}.
Some rapidity orderings allow multiple possible colour connections,
e.g.~\ref{fig:Colour_gright} and~\ref{fig:Colour_gleft}. This is always the case
if a gluon is radiated off a gluon line. In that case we randomly connect the gluon
to either the colour or the anti-colour line. During the generation we therefore keep track of
whether we are on a quark or a gluon line, and act accordingly.
\subsection{The matrix element }
\label{sec:ME}
The derivation of the \HEJ matrix element is explained in some detail
in~\cite{Andersen:2017kfc}, where also results for leading and
subleading matrix elements for pure multijet production and production
of a Higgs boson with at least two associated jets are listed. Matrix
elements for $Z/\gamma^*$ production together with jets are
given in~\cite{Andersen:2016vkp}, but not yet included.
A full list of all implemented currents is given in
section~\ref{sec:currents_impl}.
The matrix elements are implemented in the \lstinline!MatrixElement!
class. To discuss the structure, let us consider the squared matrix
element for FKL multijet production with $n$ final-state partons:
\begin{align}
\label{eq:ME}
\begin{split}
\overline{\left|\mathcal{M}_\text{HEJ}^{f_1 f_2 \to f_1
g\cdots g f_2}\right|}^2 = \ &\frac {(4\pi\alpha_s)^n} {4\ (N_c^2-1)}
\cdot\ \textcolor{blue}{\frac {K_{f_1}(p_1^-, p_a^-)} {t_1}\ \cdot\ \frac{K_{f_2}(p_n^+, p_b^+)}{t_{n-1}}\ \cdot\ \left\|S_{f_1 f_2\to f_1 f_2}\right\|^2}\\
& \cdot \prod_{i=1}^{n-2} \textcolor{gray}{\left( \frac{-C_A}{t_it_{i+1}}\
V^\mu(q_i,q_{i+1})V_\mu(q_i,q_{i+1}) \right)}\\
& \cdot \prod_{j=1}^{n-1} \textcolor{red}{\exp\left[\omega^0(q_{j\perp})(y_{j+1}-y_j)\right]}.
\end{split}
\end{align}
The structure and momentum assignment of the unsquared matrix element is
as illustrated here:
\begin{center}
\includegraphics{HEJ_amplitude}
\end{center}
The square
of the complete matrix element as given in eq.~\eqref{eq:ME} is
calculated by \lstinline!MatrixElement::operator()!. The \textcolor{red}{last line} of
eq.~\eqref{eq:ME} constitutes the all-order virtual correction,
implemented in
\lstinline!MatrixElement::virtual_corrections!.
$\omega^0$ is the
\textit{regularised Regge trajectory}
\begin{equation}
\label{eq:omega_0}
\omega^0(q_\perp) = - C_A \frac{\alpha_s}{\pi} \log \left(\frac{q_\perp^2}{\lambda^2}\right)\,,
\end{equation}
where $\lambda$ is the slicing parameter limiting the softness of real
gluon emissions, cf. eq.~\eqref{eq:resumdijetFKLmatched2}. $\lambda$ can be
changed at runtime by setting \lstinline!regulator parameter! in
\lstinline!config.yml!.
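As a minimal illustration (not the \HEJ implementation; all numerical values
are assumptions), the regularised Regge trajectory of eq.~\eqref{eq:omega_0}
and the resulting virtual correction factor for a single rapidity interval can
be evaluated as follows:
\begin{lstlisting}[language=C++,caption={}]
#include <cmath>
#include <iostream>

int main(){
  const double pi = std::acos(-1.);
  const double CA = 3.;          // number of colours
  const double alpha_s = 0.118;  // assumed fixed strong coupling
  const double lambda = 0.2;     // slicing parameter ("regulator parameter")
  const double qperp = 40.;      // |q_perp| of the t-channel momentum in GeV
  const double dy = 2.5;         // rapidity gap y_{j+1} - y_j

  // eq. (eq:omega_0)
  const double omega0 = -CA*alpha_s/pi*std::log(qperp*qperp/(lambda*lambda));
  std::cout << "omega^0 = " << omega0
            << ", virtual correction factor = " << std::exp(omega0*dy) << '\n';
}
\end{lstlisting}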
The remaining parts, which correspond to the square of the leading-order
HEJ matrix element $\overline{\left|\mathcal{M}_\text{LO,
HEJ}^{f_1f_2\to f_1g\cdots
gf_2}\big(\big\{p^B_j\big\}\big)\right|}^{2}$, are computed in
\lstinline!MatrixElement::tree!. We can further factor off the
scale-dependent ``parametric'' part
\lstinline!MatrixElement::tree_param! containing all factors of the
strong coupling $4\pi\alpha_s$. Using this function saves some CPU time
when adjusting the renormalisation scale, see
section~\ref{sec:resum}. The remaining ``kinematic'' factors are
calculated in \lstinline!MatrixElement::kin!.
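The benefit of this split can be illustrated with the following schematic
sketch (made-up numbers, not the actual \lstinline!MatrixElement! interface):
the kinematic factor is computed once, and only the parametric coupling factor
is recomputed for each renormalisation scale.
\begin{lstlisting}[language=C++,caption={}]
#include <cmath>
#include <iostream>
#include <vector>

int main(){
  const double pi = std::acos(-1.);
  const int n = 4;                 // number of final-state partons
  const double kin = 1.7e-3;       // stand-in for the "kinematic" factor
  // alpha_s evaluated at three renormalisation scales (made-up values)
  const std::vector<double> alpha_s{0.130, 0.118, 0.108};
  for(const double as: alpha_s){
    // only the parametric (4 pi alpha_s)^n factor changes with the scale
    const double param = std::pow(4.*pi*as, n);
    std::cout << "tree-level ME: " << param*kin << '\n';
  }
}
\end{lstlisting}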
\subsubsection{Matrix elements for Higgs plus dijet}
\label{sec:ME_h_jets}
In the production of a Higgs boson together with jets the parametric
parts and the virtual corrections only require minor changes in the
respective functions. However, in the ``kinematic'' parts we have to
distinguish between several cases, which is done in
\lstinline!MatrixElement::tree_kin_Higgs!. The Higgs boson can be
\emph{central}, i.e. inside the rapidity range spanned by the extremal
partons (\lstinline!MatrixElement::tree_kin_Higgs_central!) or
\emph{peripheral} and outside this range
(\lstinline!MatrixElement::tree_kin_Higgs_first! or
\lstinline!MatrixElement::tree_kin_Higgs_last!). Currently, the current for an
unordered emission with a Higgs boson on the same side is not implemented
\footnote{In principle emitting a Higgs boson \textit{on the other
side} of the unordered gluon is possible by contracting an unordered and
external Higgs current. Obviously this would not cover all possible
configurations, e.g. $qQ\to HgqQ$ requires contraction of the standard $Q\to Q$
current with an (unknown) $q\to Hgq$ one.}.
If a Higgs boson with momentum $p_H$ is emitted centrally, after parton
$j$ in rapidity, the matrix element reads
\begin{equation}
\label{eq:ME_h_jets_central}
\begin{split}
\overline{\left|\mathcal{M}_\text{HEJ}^{f_1 f_2 \to f_1 g\cdot H
\cdot g f_2}\right|}^2 = \ &\frac {\alpha_s^2 (4\pi\alpha_s)^n} {4\ (N_c^2-1)}
\cdot\ \textcolor{blue}{\frac {K_{f_1}(p_1^-, p_a^-)} {t_1}\
\cdot\ \frac{1}{t_j t_{j+1}} \cdot\ \frac{K_{f_2}(p_n^+, p_b^+)}{t_{n}}\ \cdot\ \left\|S_{f_1
f_2\to f_1 H f_2}\right\|^2}\\
& \cdot \prod_{\substack{i=1\\i \neq j}}^{n-1} \textcolor{gray}{\left( \frac{-C_A}{t_it_{i+1}}\
V^\mu(q_i,q_{i+1})V_\mu(q_i,q_{i+1}) \right)}\\
& \cdot \textcolor{red}{\prod_{i=1}^{n-1}
\exp\left[\omega^0(q_{i\perp})\Delta y_i\right]}
\end{split}
\end{equation}
with the momentum definitions
\begin{center}
\includegraphics{HEJ_central_Higgs_amplitude}
\end{center}
$q_i$ is the $i$th $t$-channel momentum and $\Delta y_i$ the rapidity
gap between outgoing \emph{particles} (not partons) $i$ and $i+1$ in
rapidity ordering.
For \emph{peripheral} emission in the backward direction
(\lstinline!MatrixElement::tree_kin_Higgs_first!) we first check whether
the most backward parton is a gluon or an (anti-)quark. In the latter
case the leading contribution to the matrix element arises through
emission off the $t$-channel gluons and we can use the same formula
eq.~(\ref{eq:ME_h_jets_central}) as for central emission. If the most
backward parton is a gluon, the square of the matrix element can be
written as
\begin{equation}
\label{eq:ME_h_jets_peripheral}
\begin{split}
\overline{\left|\mathcal{M}_\text{HEJ}^{g f_2 \to H g\cdot g f_2}\right|}^2 = \ &\frac {\alpha_s^2 (4\pi\alpha_s)^n} {\textcolor{blue}{4\ (N_c^2-1)}}
\textcolor{blue}{\cdot\ K_{H}\
\frac{K_{f_2}(p_n^+, p_b^+)}{t_{n-1}}\ \cdot\ \left\|S_{g
f_2\to H g f_2}\right\|^2}\\
& \cdot \prod_{\substack{i=1}}^{n-2} \textcolor{gray}{\left( \frac{-C_A}{t_it_{i+1}}\
V^\mu(q_i,q_{i+1})V_\mu(q_i,q_{i+1}) \right)}\\
& \cdot \textcolor{red}{\prod_{i=1}^{n-1}
\exp\left[\omega^0(q_{i\perp}) (y_{i+1} - y_i)\right]}
\end{split}
\end{equation}
with the momenta as follows:
\begin{center}
\includegraphics{HEJ_peripheral_Higgs_amplitude}
\end{center}
The \textcolor{blue}{blue part} is implemented in
\lstinline!MatrixElement::MH2_forwardH!. All other building blocks are
already available.\todo{Impact factors} The actual current contraction
is calculated in \lstinline!MH2gq_outsideH! inside
\lstinline!src/Hjets.cc!, which corresponds to $\tfrac{16 \pi^2}{t_1} \left\|S_{g
f_2\to H g f_2}\right\|^2$.\todo{Fix this insane normalisation}
The forward emission of a Higgs boson is completely analogous. We can
use the same function \lstinline!MatrixElement::MH2_forwardH!, swapping
$p_1 \leftrightarrow p_n,\,p_a \leftrightarrow p_b$.
\subsubsection{FKL ladder and Lipatov vertices}
\label{sec:FKL_ladder}
The ``FKL ladder'' is the product
\begin{equation}
\label{eq:FKL_ladder}
\prod_{i=1}^{n-2} \left( \frac{-C_A}{t_it_{i+1}}\
V^\mu(q_i,q_{i+1})V_\mu(q_i,q_{i+1}) \right)
\end{equation}
appearing in the square of the matrix element for $n$ parton production,
cf. eq.~(\ref{eq:ME}), and implemented in
\lstinline!MatrixElement::FKL_ladder_weight!. The Lipatov vertex contraction
$V^\mu(q_i,q_{i+1})V_\mu(q_i,q_{i+1})$ is implemented in \lstinline!C2Lipatovots!.
It is given by \todo{equation} \todo{mention difference between the two versions
of \lstinline!C2Lipatovots!, maybe even get rid of one}.
\subsubsection{Currents}
\label{sec:currents}
The current factors $\frac{K_{f_1}K_{f_2}}{t_1 t_{n-1}}\left\|S_{f_1
f_2\to f_1 f_2}\right\|^2$ and their extensions for unordered and Higgs
boson emissions are implemented in the \lstinline!jM2!$\dots$ functions
of \texttt{src/Hjets.cc}. \todo{Only $\|S\|^2$ should be in currents}
\footnote{The current implementation for
Higgs production in \texttt{src/Hjets.cc} includes the $1/4$ factor
inside $S$, in contrast to~\eqref{eq:ME}. Thus the overall normalisation is
unaffected.} The ``colour acceleration multiplier'' (CAM) $K_{f}$
for a parton $f\in\{g,q,\bar{q}\}$ is defined as
\begin{align}
\label{eq:K_g}
K_g(p_1^-, p_a^-) ={}& \frac{1}{2}\left(\frac{p_1^-}{p_a^-} + \frac{p_a^-}{p_1^-}\right)\left(C_A -
\frac{1}{C_A}\right)+\frac{1}{C_A}\\
\label{eq:K_q}
K_q(p_1^-, p_a^-) ={}&K_{\bar{q}}(p_1^-, p_a^-) = C_F\,.
\end{align}
The Higgs current CAM used in eq.~(\ref{eq:ME_h_jets_peripheral}) is
\begin{equation}
\label{eq:K_H}
K_H = C_A\,.
\end{equation}
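For illustration, eqs.~\eqref{eq:K_g}--\eqref{eq:K_H} can be transcribed
directly (a stand-alone sketch, not the implementation in \texttt{src/Hjets.cc}):
\begin{lstlisting}[language=C++,caption={}]
#include <iostream>

constexpr double CA = 3.;
constexpr double CF = 4./3.;

// eq. (eq:K_g)
double K_g(double p1minus, double paminus){
  return 0.5*(p1minus/paminus + paminus/p1minus)*(CA - 1./CA) + 1./CA;
}
// eq. (eq:K_q): independent of the momenta
double K_q(){ return CF; }
// eq. (eq:K_H)
double K_H(){ return CA; }

int main(){
  std::cout << K_g(100., 120.) << ' ' << K_q() << ' ' << K_H() << '\n';
}
\end{lstlisting}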
The current contractions are given by\todo{check all this
carefully!}
\begin{align}
\label{eq:S}
\left\|S_{f_1 f_2\to f_1 f_2}\right\|^2 ={}& \sum_{\substack{\lambda_a =
+,-\\\lambda_b = +,-}} \left|j^{\lambda_a}_\mu(p_1, p_a)\
j^{\lambda_b\,\mu}(p_n, p_b)\right|^2 = 2\sum_{\lambda =
+,-} \left|j^{-}_\mu(p_1, p_a)\ j^{\lambda\,\mu}(p_n, p_b)\right|^2\,,\\
\left\|S_{f_1 f_2\to f_1 H f_2}\right\|^2 ={}& \sum_{\substack{\lambda_a =
+,-\\\lambda_b = +,-}} \left|j^{\lambda_a}_\mu(p_1, p_a)V_H^{\mu\nu}(q_j, q_{j+1})\
j^{\lambda_b}_\nu(p_n, p_b)\right|^2\,,\\
\left\|S_{g f_2 \to H g f_2}\right\|^2 ={}& \sum_{
\substack{
\lambda_{a} = +,-\\
\lambda_{1} =+,-\\
\lambda_{b} = +,-
}}
\left|j^{\lambda_a\lambda_1}_{H\,\mu}(p_1, p_a, p_H)\ j^{\lambda_b\,\mu}(p_n, p_b)\right|^2\,.
\end{align}
The ``basic'' currents $j$ are independent of the parton flavour and read
\begin{equation}
\label{eq:j}
j^\pm_\mu(p, q) = u^{\pm,\dagger}(p)\ \sigma^\pm_\mu\ u^{\pm}(q)\,,
\end{equation}
where $\sigma_\mu^\pm = (1, \pm \sigma_i)$ and $\sigma_i$ are the Pauli
matrices
\begin{equation}
\label{eq:Pauli_matrices}
\sigma_1 =
\begin{pmatrix}
0 & 1\\ 1 & 0
\end{pmatrix}
\,,
\qquad \sigma_2 =
\begin{pmatrix}
0 & -i\\ i & 0
\end{pmatrix}
\,,
\qquad \sigma_3 =
\begin{pmatrix}
1 & 0\\ 0 & -1
\end{pmatrix}
\,.
\end{equation}
The two-component chiral spinors are given by
\begin{align}
\label{eq:u_plus}
u^+(p)={}& \left(\sqrt{p^+}, \sqrt{p^-} \hat{p}_\perp \right) \,,\\
\label{eq:u_minus}
u^-(p)={}& \left(\sqrt{p^-} \hat{p}^*_\perp, -\sqrt{p^+}\right)\,,
\end{align}
with $p^\pm = E\pm p_z,\, \hat{p}_\perp = \tfrac{p_\perp}{|p_\perp|},\,
p_\perp = p_x + i p_y$. The spinors for vanishing transverse momentum
are obtained by replacing $\hat{p}_\perp \to -1$.
Explicitly, the currents read
\begin{align}
\label{eq:j-_explicit}
j^-_\mu(p, q) ={}&
\begin{pmatrix}
\sqrt{p^+\,q^+} + \sqrt{p^-\,q^-} \hat{p}_{\perp} \hat{q}_{\perp}^*\\
\sqrt{p^-\,q^+}\, \hat{p}_{\perp} + \sqrt{p^+\,q^-}\,\hat{q}_{\perp}^*\\
-i \sqrt{p^-\,q^+}\, \hat{p}_{\perp} + i \sqrt{p^+\,q^-}\, \hat{q}_{\perp}^*\\
\sqrt{p^+\,q^+} - \sqrt{p^-\,q^-}\, \hat{p}_{\perp}\, \hat{q}_{\perp}^*
\end{pmatrix}\,,\\
j^+_\mu(p, q) ={}&\big(j^-_\mu(p, q)\big)^*\,,\\
j^\pm_\mu(q, p) ={}&\big(j^\pm_\mu(p, q)\big)^*\,.
\end{align}
If $q= p_{\text{in}}$ is the momentum of an incoming parton, we have
$\hat{p}_{\text{in} \perp} = -1$ and either $p_{\text{in}}^+ = 0$ or
$p_{\text{in}}^- = 0$. The current simplifies further:\todo{Helicities flipped w.r.t code}
\begin{align}
\label{eq:j_explicit}
j^-_\mu(p_{\text{out}}, p_{\text{in}}) ={}&
\begin{pmatrix}
\sqrt{p_{\text{in}}^+\,p_{\text{out}}^+}\\
\sqrt{p_{\text{in}}^+\,p_{\text{out}}^-} \ \hat{p}_{\text{out}\,\perp}\\
-i\,j^-_1\\
j^-_0
\end{pmatrix}
& p_{\text{in}\,z} > 0\,,\\
j^-_\mu(p_{\text{out}}, p_{\text{in}}) ={}&
\begin{pmatrix}
-\sqrt{p_{\text{in}}^-\,p_{\text{out}}^{-\phantom{+}}} \ \hat{p}_{\text{out}\,\perp}\\
- \sqrt{p_{\text{in}}^-\,p_{\text{out}}^+}\\
i\,j^-_1\\
-j^-_0
\end{pmatrix} & p_{\text{in}\,z} < 0\,.
\end{align}
We also employ the usual short-hand notation
\begin{align}
\label{eq:angle_product}
\spa i.j ={}& {\big(u^-(p_i)\big)}^\dagger u^+(p_j) =
\sqrt{p_i^-p_j^+}\hat{p}_{i,\perp} - \sqrt{p_i^+p_j^-}\hat{p}_{j,\perp}\,,\\
\label{eq:square_product}
\spb i.j ={}& {\big(u^+(p_i)\big)}^\dagger u^-(p_j) = -\spa i.j ^*\,.
\end{align}
For the gluon polarisation vectors with gluon momentum $p_g$ and auxiliary
reference vector $p_r$ we use
\begin{equation}
\label{eq:pol_vector}
\epsilon_\mu^+(p_g, p_r) = \frac{j_\mu^+(p_r, p_g)}{\sqrt{2}\spb g.r}\,,\qquad\epsilon_\mu^-(p_g, p_r) = \frac{j_\mu^-(p_r, p_g)}{\sqrt{2}\spa g.r}\,.
\end{equation}
\subsection{Unweighting}
\label{sec:unweight}
Straightforward event generation tends to produce many events with small
weights. Those events have a negligible contribution to the final
observables, but can take up considerable storage space and CPU time in
later processing stages. This problem can be addressed by unweighting.
For naive unweighting, one would determine the maximum weight
$w_\text{max}$ of all events, discard each event with weight $w$ with a
probability $p=w/w_\text{max}$, and set the weights of all remaining
events to $w_\text{max}$. The downside to this procedure is that it also
eliminates a sizeable fraction of events with moderate weight, so that
the statistical convergence deteriorates. Naive unweighting can be
performed by using the \lstinline!set_cut_to_maxwt! member function of the
\lstinline!Unweighter! on the events and then calling the
\lstinline!unweight! member function. It can be enabled for the
resummation events as explained in the user documentation.
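Schematically, naive unweighting amounts to the following sketch (using a
stand-alone random number generator and made-up weights rather than the
\lstinline!Unweighter! interface):
\begin{lstlisting}[language=C++,caption={}]
// Keep each event with probability w/w_max and assign weight w_max to survivors.
#include <algorithm>
#include <iostream>
#include <random>
#include <vector>

int main(){
  const std::vector<double> weights{0.1, 2.3, 0.7, 5.0, 0.01};
  const double w_max = *std::max_element(weights.begin(), weights.end());

  std::mt19937 rng{1};
  std::uniform_real_distribution<double> uniform{0., 1.};

  std::vector<double> unweighted;
  for(const double w: weights){
    if(uniform(rng) < w/w_max) unweighted.push_back(w_max);
  }
  std::cout << "kept " << unweighted.size() << " of " << weights.size()
            << " events\n";
}
\end{lstlisting}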
To ameliorate the problem of naive unweighting, we also implement
partial unweighting. That is, we perform unweighting only for events with
sufficiently small weights. When using the \lstinline!Unweighter! member
function \lstinline!set_cut_to_peakwt! we estimate the
mean and width of the weight-weight distribution from a sample of
events. We use these estimates to determine the maximum weight below
which unweighting is performed. The actual unweighting is again done in
the \lstinline!Unweighter::unweight! function.
\section{The fixed-order generator}
\label{sec:HEJFOG}
Even at leading order, standard fixed-order generators can only generate
events with a limited number of final-state particles within reasonable
CPU time. The purpose of the fixed-order generator is to supplement this
with high-multiplicity input events according to the first two lines of
eq.~\eqref{eq:resumdijetFKLmatched2} with the \HEJ approximation
$\mathcal{M}_\text{LO, HEJ}^{f_1f_2\to f_1g\cdots gf_2}$ instead of the
full fixed-order matrix element $\mathcal{M}_\text{LO}^{f_1f_2\to
f_1g\cdots gf_2}$. Its usage is described in the user
documentation \url{https://hej.web.cern.ch/HEJ/doc/current/user/HEJFOG.html}.
\subsection{File structure}
\label{sec:HEJFOG_structure}
The code for the fixed-order generator is in the \texttt{FixedOrderGen}
directory, which contains the following:
\begin{description}
\item[include:] Contains the C++ header files.
\item[src:] Contains the C++ source files.
\item[t:] Contains the source code for the automated tests.
\item[CMakeLists.txt:] Configuration file for the \cmake build system.
\item[configFO.yml:] Sample configuration file for the fixed-order generator.
\end{description}
The code is generally in the \lstinline!HEJFOG! namespace. Functions and
classes \lstinline!MyClass! are usually declared in
\texttt{include/MyClass.hh} and implemented in \texttt{src/MyClass.cc}.
\subsection{Program flow}
\label{sec:prog_flow}
A single run of the fixed-order generator consists of three or four
stages.
First, we perform initialisation similar to HEJ 2, see
section~\ref{sec:init}. Since there is a lot of overlap we frequently
reuse classes and functions from HEJ 2, i.e. from the
\lstinline!HEJ! namespace. The code for parsing the configuration file
is in \texttt{include/config.hh} and implemented in
\texttt{src/config.cc}.
If partial unweighting is requested in the user settings \url{https://hej.web.cern.ch/HEJ/doc/current/user/HEJFOG.html#settings},
the initialisation is followed by a calibration phase. We use an
\lstinline!EventGenerator! to produce a number of trial
events. We use these to calibrate the \lstinline!Unweighter! in
its constructor and produce a first batch of partially unweighted
events. This also allows us to estimate our unweighting efficiency.
In the next step, we continue to generate events and potentially
unweight them. Once the user-defined target number of events is reached,
we adjust their weights according to the number of required trials. As
in HEJ 2 (see section~\ref{sec:processing}), we pass the final
events to a \lstinline!HEJ::Analysis! and a
\lstinline!HEJ::CombinedEventWriter!.
\subsection{Event generation}
\label{sec:evgen}
Event generation is performed by the
\lstinline!EventGenerator::gen_event! member function. We begin by generating a
\lstinline!PhaseSpacePoint!. This is not to be confused with
the resummation phase space points represented by
\lstinline!HEJ::PhaseSpacePoint!! After jet clustering, we compute the
leading-order matrix element (see section~\ref{sec:ME}) and pdf factors.
The phase space point generation is performed in the
\lstinline!PhaseSpacePoint! constructor. We first construct the
user-defined number $n_p$ of partons (by default gluons) in
\lstinline!PhaseSpacePoint::gen_LO_partons!. We use flat sampling in
rapidity and azimuthal angle. For the scalar transverse momenta, we
distinguish between two cases. By default, they are generated based on a
random variable $x_{p_\perp}$ according to
\begin{equation}
\label{eq:pt_sampling}
p_\perp = p_{\perp,\text{min}} +
\begin{cases}
p_{\perp,\text{par}}
\tan\left(
x_{p_\perp}
\arctan\left(
\frac{p_{\perp,\text{max}} - p_{\perp,\text{min}}}{p_{\perp,\text{par}}}
\right)
\right)
& y < y_\text{cut}
\\
- \tilde{p}_{\perp,\text{par}}\log\left(1 - x_{p_\perp}\left[1 -
\exp\left(\frac{p_{\perp,\text{min}} -
p_{\perp,\text{max}}}{\tilde{p}_{\perp,\text{par}}}\right)\right]\right)
& y \geq y_\text{cut}
\end{cases}\,,
\end{equation}
where $p_{\perp,\text{min}}$ is the minimum jet transverse momentum,
$p_{\perp,\text{max}}$ is the maximum transverse parton momentum,
tentatively set to the beam energy, and $y_\text{cut}$, $p_{\perp,\text{par}}$
and $\tilde{p}_{\perp,\text{par}}$ are generation parameters set to
heuristically determined values of
\begin{align}
y_\text{cut}&=3,\\
p_{\perp,\text{par}}&=p_{\perp,\min}+\frac{n_p}{5}, \\
\tilde{p}_{\perp,\text{par}}&=\frac{p_{\perp,\text{par}}}{1 +
5(y-y_\text{cut})}.
\end{align}
The problem with this generation is that the transverse momenta peak at
the minimum transverse momentum required for fixed-order jets. However,
if we use the generated events as input for \HEJ resummation, events
with such soft transverse momenta hardly contribute, see
section~\ref{sec:ptj_res}. To generate efficient input for resummation,
there is the user option \texttt{peak pt}, which specifies the
dominant transverse momentum for resummation jets. If this option is
set, most jets will be generated as above, but with
$p_{\perp,\text{min}}$ set to the peak transverse momentum $p_{\perp,
\text{peak}}$. In addition, there is a small chance of around $2\%$ of
generating softer jets. The heuristic ansatz for the transverse momentum
distribution in the ``soft'' region is
\begin{equation}
\label{FO_pt_soft}
\frac{\partial \sigma}{\partial p_\perp} \propto e^{n_p\frac{p_\perp- p_{\perp,
\text{peak}}}{\bar{p}_\perp}}\,,
\end{equation}
where $n_p$ is the number of partons and $\bar{p}_\perp \approx
4\,$GeV. To achieve this distribution, we use
\begin{equation}
\label{eq:FO_pt_soft_sampling}
p_\perp = p_{\perp, \text{peak}} + \bar{p}_\perp \frac{\log x_{p_\perp}}{n_p}
\end{equation}
and discard the phase space point if the parton is too soft, i.e. below the threshold for
fixed-order jets.
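A corresponding minimal sketch for the soft region,
eq.~\eqref{eq:FO_pt_soft_sampling}, again with assumed numerical inputs:
\begin{lstlisting}[language=C++,caption={}]
// Sample a soft transverse momentum below the peak and reject the point if it
// falls below the fixed-order jet threshold, cf. eq. (eq:FO_pt_soft_sampling).
#include <cmath>
#include <iostream>
#include <random>

int main(){
  const double pt_peak = 50.;   // "peak pt" user setting (assumed value)
  const double pt_min = 30.;    // fixed-order jet threshold
  const double pt_bar = 4.;     // width parameter, roughly 4 GeV
  const int np = 4;             // number of partons

  std::mt19937 rng{1};
  std::uniform_real_distribution<double> uniform{0., 1.};

  const double x = uniform(rng);
  const double pt = pt_peak + pt_bar*std::log(x)/np;
  if(pt < pt_min) std::cout << "discard phase space point\n";
  else std::cout << "sampled soft pt = " << pt << " GeV\n";
}
\end{lstlisting}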
After ensuring that all partons form separate jets, we generate any
potential colourless emissions. We then determine the incoming momenta
and flavours in \lstinline!PhaseSpacePoint::reconstruct_incoming! and
adjust the outgoing flavours to ensure an FKL configuration. Finally, we
may reassign outgoing flavours to generate suppressed (for example
unordered) configurations.
\input{currents}
\input{tensor}
\appendix
\section{Continuous Integration}
\label{sec:CI}
Whenever you implement something new or fix a bug, please also add a
test for the new behaviour to \texttt{t/CMakeLists.txt} via
\lstinline!add_test!. These tests can be triggered by running
\lstinline!make test! or \lstinline!ctest! after compiling. A typical test
should take at most a few seconds, so that it can potentially be run on each
commit by each developer. If you require a longer, more careful test, preferably
on top of a small one, surround it with
\begin{lstlisting}[caption={}]
if(${TEST_ALL})
add_test(
NAME t_feature
COMMAND really_long_test
)
endif()
\end{lstlisting}
Afterwards you can execute the longer tests with\footnote{No recompiling is
needed, as long as only the \lstinline!add_test! command is guarded, not the
compile commands themselves.}
\begin{lstlisting}[language=sh,caption={}]
cmake base/directory -DTEST_ALL=TRUE
make test
\end{lstlisting}
On top of that you should add
\href{https://en.cppreference.com/w/cpp/error/assert}{\lstinline!assert!s} in
the code itself. They are only executed when compiled with
\lstinline!CMAKE_BUILD_TYPE=Debug!, without slowing down release code. So you
can use them everywhere to test \textit{expected} or \textit{assumed} behaviour,
e.g. requiring a Higgs boson or relying on rapidity ordering.
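For example (a hypothetical check, not taken from the code base):
\begin{lstlisting}[language=C++,caption={}]
#include <algorithm>
#include <cassert>
#include <vector>

// Hypothetical usage: document the assumption that the outgoing partons are
// sorted in rapidity. The check disappears in release builds.
void process(std::vector<double> const & rapidities){
  assert(std::is_sorted(rapidities.begin(), rapidities.end()));
  // ... the rest of the function relies on the rapidity ordering ...
}

int main(){
  process({-2.1, 0.3, 1.7});
}
\end{lstlisting}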
GitLab provides ways to directly test code via \textit{Continuous Integration} (CI).
The CI is controlled by \texttt{.gitlab-ci.yml}. For all options for the YAML
file see \href{https://docs.gitlab.com/ee/ci/yaml/}{docs.gitlab.com/ee/ci/yaml/}.
GitLab also provides a small tool to check that YAML syntax is correct under
\lstinline!CI/CD > Pipelines > CI Lint! or
\href{https://gitlab.dur.scotgrid.ac.uk/hej/HEJ/-/ci/lint}{gitlab.dur.scotgrid.ac.uk/hej/HEJ/-/ci/lint}.
Currently the CI is configured to trigger a \textit{Pipeline} on each
\lstinline!git push!. The corresponding \textit{GitLab runners} are configured
under \lstinline!CI/CD Settings>Runners! in the GitLab UI. All runners use a
\href{https://www.docker.com/}{Docker} image as a virtual environment\footnote{To
use only Docker runners set the \lstinline!docker! tag in
\texttt{.gitlab-ci.yml}.}. The specific Docker images are maintained separately. If
you add a new dependency, please also provide a Docker image for the CI. The
goal is to be able to test \HEJ with all possible configurations.
Each pipeline contains multiple stages (see \lstinline!stages! in
\texttt{.gitlab-ci.yml}) which are executed in order from top to bottom.
Additionally each stage contains multiple jobs. For example the stage
\lstinline!build! contains the jobs \lstinline!build:basic!,
\lstinline!build:qcdloop!, \lstinline!build:rivet!, etc., which compile \HEJ for
different environments and dependencies by using different Docker images. Jobs
starting with a dot are ignored by the runner, e.g. \lstinline!.HEJ_build! is
only used as a template, but never executed directly. The next stage starts only
after all jobs of the previous stage have finished without errors.
To pass information between multiple stages we use \lstinline!artifacts!. The
runner will automatically load all artifacts from all \lstinline!dependencies!
for each job\footnote{If no dependencies are defined, \textit{all} artifacts from
all previous jobs are downloaded. Thus please specify an empty dependency list if you
do not want to load any artifacts.}. For example the compiled \HEJ code from
\lstinline!build:basic! gets loaded in \lstinline!test:basic! and
\lstinline!FOG:build:basic!, without recompiling \HEJ again. Additionally
artifacts can be downloaded from the GitLab web page, which could be handy for
debugging.
We also trigger some jobs \lstinline!only! on specific events. For example we
only push the code to
\href{https://phab.hepforge.org/source/hej/repository/v2.0/}{HepForge} on
release branches (e.g. v2.0). We also execute the \textit{long} tests only for
merge requests, on pushes to any release or the \lstinline!master! branch, or
when triggered manually from the GitLab web page.
The actual commands are given in the \lstinline!before_script!,
\lstinline!script! and \lstinline!after_script!
\footnote{\lstinline!after_script! is always executed} sections, and are
standard Linux shell commands (depending on the Docker image). Any failed
command, i.e. any command returning a non-zero exit code, stops the job and makes the pipeline fail
entirely. Most tests are just running \lstinline!make test! or are based on it.
Thus, to emphasise it again, write tests for your code in \lstinline!cmake!. The
CI is only intended to make automated testing in different environments easier.
\section{Monte Carlo uncertainty}
\label{sec:MC_err}
Since \HEJ reweights each fixed-order point with multiple resummation
events, the Monte Carlo uncertainty of \HEJ is a little more complicated
than usual. We start by defining the \HEJ cross section after $N$ FO points
\begin{align}
\sigma_N:=\sum_{i}^N x_i \sum_{j}^{M_i} y_{i,j}=:\sum_i^N\sum_j^{M_i} w_{i,j},
\end{align}
where $x_i$ are the FO weights\footnote{In this definition $x_i$ can be zero,
see the discussion in the next section.}, $y_{i,j}$ are the reweighting
weights, and $M_i$ is the number of resummation points. We can set $M=M_i\ \forall i$ by
potentially adding some points with $y_{i,j}=0$, i.e. $M$ corresponds to the
\lstinline!trials! in \lstinline!EventReweighter!. $w_{i,j}$ are the weights as
written out by \HEJ. The expectation value of $\sigma$ is then
\begin{align}
\ev{\sigma_N}= \sum_i \ev{x_i}\sum_j\ev{y_{i,j}}=M \mu_x\sum_i\mu_{y_i},\label{eq:true_sigma}
\end{align}
with $\mu_{x/y}$ being the (true) mean value of $x$ or $y$, i.e.
\begin{align}
\mu_{x}:=\ev{\bar{x}}=\ev{\frac{\sum_i x_i}{N}}=\ev{x}.
\end{align}
The true underlying standard deviation of $\sigma_N$, assuming that $\delta_{x}$
and $\delta_{y_i}$ are the standard deviations of $x$ and $y_i$, is
\begin{align}
\delta_{\sigma_N}^2&=M^2 \delta_{x}^2 \sum_i \mu_{y_i}^2
+M \mu_x^2 \sum_i \delta_{y_i}^2. \label{eq:true_err}
\end{align}
Notice that each point $i$ can have a different expectation value for $y_i$.
Since we do not know the true distributions of $x$ and $y$, we need to estimate
them. We use the standard deviations
\begin{align}
\tilde{\delta}_{x_i}^2&:=\left(x_i-\bar x\right)^2
=\left(\frac{N-1}{N} x_i - \frac{\sum_{j\neq i} x_j}{N}\right)^2
\label{eq:err_x}\\
\tilde{\delta}_{y_{i,j}}^2&:=\left(y_{i,j}-\bar y_i\right)^2 \label{eq:err_y},
\end{align}
and the mean values $\bar x$ and $\bar y$, to get an estimator for
$\delta_{\sigma_N}$
\begin{align}
\tilde\delta_{\sigma_N}^2&=M^2 \sum_i \tilde\delta_{x_i}^2 \bar{y_i}^2
+\sum_{i,j} x_i^2\tilde\delta_{y_{i,j}}^2. \label{eq:esti_err}
\end{align}
Through error propagation we can connect the estimated uncertainties back to the
fundamental ones
\begin{align}
\delta_{\tilde{\delta}_{x_i}}^2=\frac{N-1}{N} \delta_x^2.
\end{align}
Together with $\delta_x^2=\ev{x^2}-\ev{x}^2$ and $\ev{\tilde\delta}=0$ this
leads to
\begin{align}
\ev{\tilde{\delta}_{x_i}^2 \bar y_i^2}&=\ev{\tilde{\delta}_{x_i} \bar y_i}^2
+\delta_{\tilde{\delta}_{x_i}}^2 \mu_{y_i}^2
+\delta_{y_i}^2 \mu_{\tilde\delta}^2 \\
&=\frac{N-1}{N} \delta_x^2\mu_{y_i}^2,
\end{align}
and a similar result for $y$. Therefore
\begin{align}
\ev{\tilde\delta_{\sigma_N}^2}=\frac{N-1}{N} M^2 \delta_{x}^2 \sum_i \mu_{y_i}^2
+\frac{M-1}{M} M \mu_x^2 \sum_i \delta_{y_i}^2,
\end{align}
where we can compensate for the additional factors compared to~\eqref{eq:true_err} by replacing
\begin{align}
\tilde\delta_x&\to\frac{N}{N-1}\tilde\delta_x \label{eq:xcom_bias}\\
\tilde\delta_{y_i}&\to\frac{M}{M-1}\tilde\delta_{y_i}. \label{eq:ycom_bias}
\end{align}
Thus, after the replacements~\eqref{eq:xcom_bias} and~\eqref{eq:ycom_bias}, \eqref{eq:esti_err} is an unbiased estimator of $\delta_{\sigma_N}$.
\subsection{Number of events vs. number of trials}
Even though the above calculation is completely valid, it is impractical. Both
$x_i$ and $y_{ij}$ could be zero, but zero-weight events are typically not
written out. In that sense $N$ and $M$ are the \textit{number of trials} it took
to generate $N'$ and $M'$ (non-zero) events. We cannot naively replace all $N$
and $M$ with $N'$ and $M'$ in the above equations, since this would also change
the definition of the averages $\bar x$ and $\bar y$.
For illustration let us consider unweighted events, with all weights equal to
$x'$, without changing the cross section $\sum_i^N x_i=\sum_i^{N'} x'_i=N' x'$.
Then the average trial weight is unequal to the average event weight
\begin{align}
\bar x = \frac{\sum_i^{N} x_i}{N} = \frac{\sum_i^{N'} x'}{N}=x'\frac{N'}{N}
\neq x'=\frac{\sum_i^{N'} x'}{N'}.
\end{align}
$N=N'$ would correspond to a $100\%$ efficient unweighting, i.e. a perfect
sampling, where we know the analytical result. In particular, using $N'$ instead
of $N$ in the standard deviation gives
\begin{align}
\sum_i^{N'} \left(x_i-\frac{\sum_j^{N} x_j}{N'}\right)^2=\sum_i^{N'} \left(x'-x'\, \frac{N'}{N'}\right)^2=0,
\end{align}
which is obviously not true in general for $\tilde\delta^2_x$.
Hence we would have to use the number of trials $N$ everywhere. This would
require an additional parameter to be passed with each event, which is not
always available in practice\footnote{\texttt{Sherpa} gives the number of
trials as an \lstinline!attribute::trials! of \lstinline!HEPEUP! in the
\texttt{LHE} file, or similarly as a data member in the HDF5 format
\cite{Hoeche:2019rti}. The \texttt{LHE} standard itself provides the
variable \lstinline!ntries! per event (see
\href{https://phystev.cnrs.fr/wiki/2017:groups:tools:lhe}{this proposal}),
though we have not seen this used anywhere.}. Instead we use
\begin{align}
\tilde\delta_{x}'^2:=\sum_i^{N} x_i^2\geq\tilde\delta_x^2, \label{eq:err_prac}
\end{align}
where the bias of $\tilde\delta_x'^2$ vanishes for large $N$. Thus we can use the sum
of weight squares~\eqref{eq:err_prac} instead of~\eqref{eq:err_x}
and~\eqref{eq:err_y}, without worrying about the difference between trials and
generated events. The total error~\eqref{eq:esti_err} becomes
\begin{align}
\tilde\delta_{\sigma_N}^2=\sum_i \left(\sum_j w_{i,j}\right)^2+\sum_{i,j} \left(w_{i,j}\right)^2,
\end{align}
which (conveniently) depends only on the \HEJ weights $w_{i,j}$.
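In code, this estimate can be accumulated directly from the \HEJ output
weights, grouping the resummation weights $w_{i,j}$ by their fixed-order event
$i$ (a sketch with made-up numbers, not the \HEJ implementation):
\begin{lstlisting}[language=C++,caption={}]
// Cross section and Monte Carlo error from HEJ weights w_{i,j}:
// sigma  = sum_{i,j} w_{i,j},
// delta^2 = sum_i (sum_j w_{i,j})^2 + sum_{i,j} w_{i,j}^2.
#include <cmath>
#include <iostream>
#include <vector>

int main(){
  // resummation weights grouped by fixed-order event (made-up numbers)
  const std::vector<std::vector<double>> w = {
    {0.4, 0.1, 0.0}, {1.2, -0.3}, {0.05, 0.07, 0.02}
  };

  double sigma = 0., err2 = 0.;
  for(auto const & group: w){
    double group_sum = 0.;
    for(const double wij: group){
      group_sum += wij;
      err2 += wij*wij;              // second term
    }
    sigma += group_sum;
    err2 += group_sum*group_sum;    // first term
  }
  std::cout << "sigma = " << sigma << " +- " << std::sqrt(err2) << '\n';
}
\end{lstlisting}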
\bibliographystyle{JHEP}
\bibliography{biblio}
\end{document}
diff --git a/doc/doxygen/mainpage.dox b/doc/doxygen/mainpage.dox
index ce7ce18..91e4744 100644
--- a/doc/doxygen/mainpage.dox
+++ b/doc/doxygen/mainpage.dox
@@ -1,224 +1,225 @@
namespace HEJ { // so that doxygen links names in this namespace
/**
* @mainpage
*
* @section intro Introduction
*
* HEJ 2 is a library for all-order resummation of high-energy
* logarithms. It includes a program to add resummation to fixed-order
* events. User documentation for the program can be found <a
* href="https://hej.web.cern.ch/HEJ/doc/2.0/user/">here</a>. This
* documentation is instead aimed at users of the library itself.
*
* @section overview Overview
*
* The main functionality is contained in the HEJ namespace. Particles are
* defined via the Particle struct, which consists of the particle
* four-momentum, its identifier according to the <a
* href="http://pdg.lbl.gov/2017/reviews/rpp2017-rev-monte-carlo-numbering.pdf">
* PDG Monte Carlo numbering scheme </a> and an optional Colour charge. Given a
* number of incoming and outgoing particles, the square of the resummation
* matrix element can be calculated with the help of the MatrixElement class.
*
* The EventReweighter class adds resummation to existing fixed-order
* events. Both fixed-order and resummation events are objects of the
* Event class, which are created from EventData objects with the
* help of a <a
* href="http://fastjet.fr/repo/doxygen-3.3.1/classfastjet_1_1JetDefinition.html">jet
* definition according to the fastjet</a> library. EventData
* objects can be assembled manually or converted from input events in
* the LesHouches standard, read from file with a EventReader (e.g.
* LesHouchesReader or HDF5Reader).
*
* Events can be saved with one of the EventWriter classes. Currently,
* there is support for the Les Houches event file format with the
* LesHouchesWriter class. If HEJ 2 was installed with HepMC 2 or 3
* support, the respective format is available through the HepMC2Writer
- * or HepMC3Writer class.
+ * or HepMC3Writer class. The HDF5Writer class can be used if HEJ 2 was
+ * compiled with HDF5 support.
*
* Further classes of interest are the interfaces to the Mixmax and
* Ranlux64 random number generators, the PDF class to interact with <a
* href="https://lhapdf.hepforge.org/"> LHAPDF </a> and the ScaleGenerator
* and ScaleConfig classes to calculate renormalisation and factorisation
* scales for a given Event.
*
* @section example Example
*
* As an example, we show a toy program that computes the square of a
* matrix element in the HEJ approximation for a single event. First, we
* include the necessary header files:
* @code{.cpp}
* #include "HEJ/Event.hh"
* #include "HEJ/MatrixElement.hh"
* @endcode
* We then specify the incoming and outgoing particles. A particle
* has a type, a four-momentum \f$(p_x, p_y, p_z, E)\f$ and optionally a colour
* charge. For instance, an incoming gluon could be defined as
* @code{.cpp}
* fastjet::PseudoJet momentum{0, 0, 308., 308.};
* HEJ::Colour colours{501,502};
* HEJ::Particle gluon_in{HEJ::ParticleID::gluon, momentum, colours};
* @endcode
* We collect all incoming and outgoing particles in a partonic event. Here
* is an example for a partonic \f$gu \to gghu\f$ event (omitting colours):
* @code{.cpp}
* HEJ::Event::EventData partonic_event;
*
* // incoming particles
* partonic_event.incoming[0] = {
* HEJ::ParticleID::gluon,
* { 0., 0., 308., 308.}
* };
* partonic_event.incoming[1] = {
* HEJ::ParticleID::up,
* { 0., 0.,-164., 164.}
* };
* // outgoing particles
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::higgs,
* { 98., 82., 14., 180.}
* });
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::up,
* { 68.,-54., 36., 94.}
* });
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::gluon,
* {-72., 9., 48., 87.}
* });
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::gluon,
* {-94.,-37., 46., 111.}
* });
* @endcode
* Alternatively, we could read the event from e.g. a Les Houches event file,
* possibly compressed with gzip. For this, the additional header file
* @c HEJ/EventReader.hh has to be included.
* @code{.cpp}
* auto reader = HEJ::make_reader("events.lhe.gz");
* reader->read_event();
* HEJ::Event::EventData partonic_event{reader->hepeup()};
* @endcode
*
* In this specific example we will later choose a constant value for the
* strong coupling, so that the HEJ matrix element does not depend on the
* renormalisation scale. However, in a more general scenario, we will want
* to set a central scale:
* @code{.cpp}
* partonic_event.parameters.central.mur = 50.;
* @endcode
* It is possible to add more scales in order to perform scale variation:
* @code{.cpp}
* partonic_event.parameters.variations.resize(2);
* partonic_event.parameters.variations[0].mur = 25.;
* partonic_event.parameters.variations[1].mur = 100.;
* @endcode
*
* In the next step, we leverage FastJet to construct an event with
* clustered jets. Here, we use antikt jets with R=0.4 and transverse
* momenta of at least 30 GeV.
* @code{.cpp}
* const fastjet::JetDefinition jet_def{
* fastjet::JetAlgorithm::antikt_algorithm, 0.4
* };
* const double min_jet_pt = 30.;
* HEJ::Event event{partonic_event.cluster(jet_def, min_jet_pt)};
* @endcode
* In order to calculate the matrix element, we now have to fix the physics
* parameters. For the sake of simplicity, we assume an effective coupling
* of the Higgs boson to gluons in the limit of an infinite top-quark mass
* and a fixed value of \f$\alpha_s = 0.118\f$ for the strong coupling.
* @code{.cpp}
* const auto alpha_s = [](double /* mu_r */) { return 0.118; };
* HEJ::MatrixElementConfig ME_config;
* // whether to include corrections from the
* // evolution of \alpha_s in virtual corrections
* ME_config.log_correction = false;
* HEJ::MatrixElement ME{alpha_s, ME_config};
* @endcode
* If QCDLoop is installed, we can also take into account the full loop
* effects with finite top and bottom quark masses:
* @code{.cpp}
* HEJ::MatrixElementConfig ME_config;
* ME_config.Higgs_coupling.use_impact_factors = false;
* ME_config.Higgs_coupling.mt = 163;
* ME_config.Higgs_coupling.include_bottom = true;
* ME_config.Higgs_coupling.mb = 2.8;
* @endcode
* Finally, we can compute and print the square of the matrix element with
* @code{.cpp}
* std::cout << "HEJ ME: " << ME(event).central << '\n';
* @endcode
* In the case of scale variation, the weight associated with the scale
* @c event.variations[i].mur is @c ME(event).variations[i].
*
* Collecting the above pieces, we have the following program:
* @code{.cpp}
* #include "HEJ/Event.hh"
* #include "HEJ/MatrixElement.hh"
*
* int main(){
* HEJ::Event::EventData partonic_event;
* // incoming particles
* partonic_event.incoming[0] = {
* HEJ::ParticleID::gluon,
* { 0., 0., 308., 308.}
* };
* partonic_event.incoming[1] = {
* HEJ::ParticleID::up,
* { 0., 0.,-164., 164.}
* };
* // outgoing particles
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::higgs,
* { 98., 82., 14., 180.}
* });
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::up,
* { 68.,-54., 36., 94.}
* });
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::gluon,
* {-72., 9., 48., 87.}
* });
* partonic_event.outgoing.push_back({
* HEJ::ParticleID::gluon,
* {-94.,-37., 46., 111.}
* });
*
* const fastjet::JetDefinition jet_def{
* fastjet::JetAlgorithm::antikt_algorithm, 0.4
* };
* const double min_jet_pt = 30.;
* HEJ::Event event{partonic_event.cluster(jet_def, min_jet_pt)};
* const auto alpha_s = [](double /* mu_r */) { return 0.118; };
* HEJ::MatrixElementConfig ME_config;
* // whether to include corrections from the
* // evolution of \alpha_s in virtual corrections
* ME_config.log_correction = false;
* HEJ::MatrixElement ME{alpha_s, ME_config};
*
* std::cout
* << "HEJ ME: " << ME(event).central
* << " = tree * virtual = " << ME.tree(event).central
* << " * " << ME.virtual_corrections(event).central
* << '\n';
* }
* @endcode
* After saving the above code to a file @c matrix_element.cc, it
* can be compiled into an executable @c matrix_element with a
* suitable compiler. For example, with @c g++ this can be done
* with the command
* @code{.sh}
* g++ -o matrix_element matrix_element.cc -lHEJ -lfastjet
* @endcode
* If HEJ or any of the required libraries was installed to a
* non-standard location, it may be necessary to explicitly specify the
* paths to the required header and library files. This can be done with
* the @c HEJ-config executable and similar programs for the
* other dependencies:
* @code{.sh}
* g++ $(fastjet-config --cxxflags) $(HEJ-config --cxxflags) -o matrix_element matrix_element.cc $(HEJ-config --libs) $(fastjet-config --libs)
* @endcode
*/
}
diff --git a/doc/sphinx/HEJ.rst b/doc/sphinx/HEJ.rst
index f1fa90e..a263722 100644
--- a/doc/sphinx/HEJ.rst
+++ b/doc/sphinx/HEJ.rst
@@ -1,414 +1,416 @@
.. _`Running HEJ 2`:
Running HEJ 2
=============
Quick start
-----------
In order to run HEJ 2, you need a configuration file and a file
containing fixed-order events. A sample configuration is given by the
:file:`config.yml` file distributed together with HEJ 2. Events in the
Les Houches Event File format can be generated with standard Monte Carlo
generators like `MadGraph5_aMC@NLO <https://launchpad.net/mg5amcnlo>`_
or `Sherpa <https://sherpa.hepforge.org/trac/wiki>`_. If HEJ 2 was
compiled with `HDF5 <https://www.hdfgroup.org/>`_ support, it can also
-read event files in the format suggested in
+read and write event files in the format suggested in
`arXiv:1905.05120 <https://arxiv.org/abs/1905.05120>`_.
HEJ 2 assumes that the cross section is given by the sum of the event
weights. Depending on the fixed-order generator it may be necessary to
adjust the weights in the Les Houches Event File accordingly.
The processes supported by HEJ 2 are
- Pure multijet production
- Production of a Higgs boson with jets
- Production of a W boson with jets
..
- *TODO* Production of a Z boson or photon with jets
where at least two jets are required in each case. For the time being,
only leading-order events are supported.
After generating an event file :file:`events.lhe` adjust the parameters
under the `fixed order jets`_ setting in :file:`config.yml` to the
settings in the fixed-order generation. Resummation can then be added by
running::
HEJ config.yml events.lhe
Using the default settings, this will produce an output event file
:file:`HEJ.lhe` with events including high-energy resummation.
When using the `Docker image <https://hub.docker.com/r/hejdock/hej>`_,
HEJ can be run with
.. code-block:: bash
docker run -v $PWD:$PWD -w $PWD hejdock/hej HEJ config.yml events.lhe
.. _`HEJ 2 settings`:
Settings
--------
HEJ 2 configuration files follow the `YAML <http://yaml.org/>`_
format. The following configuration parameters are supported:
.. _`trials`:
**trials**
High-energy resummation is performed by generating a number of
resummation phase space configurations corresponding to an input
fixed-order event. This parameter specifies how many such
configurations HEJ 2 should try to generate for each input
event. Typical values vary between 10 and 100.
.. _`max ext soft pt fraction`:
**max ext soft pt fraction**
Specifies the maximum fraction that soft radiation can contribute to the
transverse momentum of each the most forward and the most backward jet. This
setting is needed to regulate an otherwise uncancelled divergence. Values
between around 0.05 and 0.1 are recommended.
.. _`fixed order jets`:
**fixed order jets**
This tag collects a number of settings specifying the jet definition
in the event input. The settings should correspond to the ones used in
the fixed-order Monte Carlo that generated the input events.
.. _`fixed order jets: min pt`:
**min pt**
Minimum transverse momentum in GeV of fixed-order jets.
.. _`fixed order jets: algorithm`:
**algorithm**
The algorithm used to define jets. Allowed settings are
:code:`kt`, :code:`cambridge`, :code:`antikt`,
:code:`cambridge for passive`. See the `FastJet
<http://fastjet.fr/>`_ documentation for a description of these
algorithms.
.. _`fixed order jets: R`:
**R**
The R parameter used in the jet algorithm, roughly corresponding
to the jet radius in the plane spanned by the rapidity and the
azimuthal angle.
.. _`resummation jets`:
**resummation jets**
This tag collects a number of settings specifying the jet definition
in the observed, i.e. resummed events. These settings are optional, by
default the same values as for the `fixed order jets`_ are assumed.
.. _`resummation jets: min pt`:
**min pt**
Minimum transverse momentum in GeV of resummation jets. This
should be between 25% and 50% larger than the minimum transverse
momentum of fixed order jets set by `fixed order jets: min pt`_.
.. _`resummation jets: algorithm`:
**algorithm**
The algorithm used to define jets. The HEJ 2 approach to
resummation relies on properties of :code:`antikt` jets, so this
value is strongly recommended. For a list of possible other
values, see the `fixed order jets: algorithm`_ setting.
.. _`resummation jets: R`:
**R**
The R parameter used in the jet algorithm.
.. _`event treatment`:
**event treatment**
Specify how to treat different event types. The different event types
contribute to different orders in the high-energy limit. The possible values
are :code:`reweight` to enable resummation, :code:`keep` to keep the events as
they are up to a possible change of renormalisation and factorisation scale,
and :code:`discard` to discard these events.
.. _`FKL`:
**FKL**
Specifies how to treat events respecting FKL rapidity ordering. These
configurations are dominant in the high-energy limit.
.. _`unordered`:
**unordered**
Specifies how to treat events with one emission that does not respect FKL
ordering, e.g. :code:`u d => g u d`. In the high-energy limit, such
configurations are logarithmically suppressed compared to FKL
configurations.
.. _`extremal qqx`:
**extremal qqx**
Specifies how to treat events with a quark-antiquark pair as extremal
partons in rapidity, e.g. :code:`g d => u u_bar d`. In the high-energy
limit, such configurations are logarithmically suppressed compared to FKL
configurations. :code:`reweight` is currently only supported for W boson
plus jets production.
.. _`central qqx`:
**central qqx**
Specifies how to treat events with a quark-antiquark pair central in
rapidity, e.g. :code:`g g => g u u_bar g`. In the high-energy limit, such
configurations are logarithmically suppressed compared to FKL
configurations. :code:`reweight` is currently only supported for W boson
plus jets production.
.. _`non-resummable`:
**non-resummable**
Specifies how to treat events where no resummation is possible. Only
:code:`keep` or :code:`discard` are valid options, *not* :code:`reweight`
for obvious reasons.
.. _`scales`:
**scales**
Specifies the renormalisation and factorisation scales for the output
events. This can either be a single entry or a list :code:`[scale1,
scale2, ...]`. For the case of a list the first entry defines the
central scale. Possible values are fixed numbers to set the scale in
GeV or the following:
- :code:`H_T`: The sum of the scalar transverse momenta of all
final-state particles
- :code:`max jet pperp`: The maximum transverse momentum of all jets
- :code:`jet invariant mass`: Sum of the invariant masses of all jets
- :code:`m_j1j2`: Invariant mass between the two hardest jets.
Scales can be multiplied or divided by overall factors, e.g. :code:`H_T/2`.
It is also possible to import scales from an external library, see
:ref:`Custom scales`
.. _`scale factors`:
**scale factors**
A list of numeric factors by which each of the `scales`_ should be
multiplied. Renormalisation and factorisation scales are varied
independently. For example, a list with entries :code:`[0.5, 2]`
would give the four scale choices (0.5μ\ :sub:`r`, 0.5μ\ :sub:`f`);
(0.5μ\ :sub:`r`, 2μ\ :sub:`f`); (2μ\ :sub:`r`, 0.5μ\ :sub:`f`); (2μ\
:sub:`r`, 2μ\ :sub:`f`) in this order. The ordering corresponds to
the order of the final event weights.
.. _`max scale ratio`:
**max scale ratio**
Specifies the maximum factor by which renormalisation and
factorisation scales may differ. For a value of :code:`2` and the
example given for the `scale factors`_ the scale choices
(0.5μ\ :sub:`r`, 2μ\ :sub:`f`) and (2μ\ :sub:`r`, 0.5μ\ :sub:`f`)
will be discarded.
.. _`log correction`:
**log correction**
Whether to include corrections due to the evolution of the strong
coupling constant in the virtual corrections. Allowed values are
:code:`true` and :code:`false`.
.. _`unweight`:
**unweight**
Settings for unweighting events. Unweighting can greatly reduce the
number of resummation events, speeding up analyses and shrinking
event file sizes.
.. _`type`:
**type**
How to unweight events. The supported settings are
- :code:`weighted`: Generate weighted events. This is the default if nothing
else is specified.
- :code:`resummation`: Unweight only resummation events. Each set
of resummation events coming from *a single fixed order event*
is unweighted separately according to the largest weight in the
current chunk of events.
- :code:`partial`: Unweight only resummation events with weights
below a certain threshold. The weight threshold is determined
automatically in a calibration run prior to the usual event
generation.
.. _`unweight: trials`:
**trials**
Maximum number of trial resummation events generated in the
calibration run for partial unweighting. This option should only
be set for partial unweighting.
If possible, each trial is generated from a different input
fixed-order event. If there are not sufficiently many input
events, more than one trial event may be generated for each of
them and the actual number of trial events may be smaller than
requested.
Increasing the number of trials generally leads to better
unweighting calibration but increases the run time. Between 1000
and 10000 trials are usually sufficient.
.. _`unweight: max deviation`:
**max deviation**
Controls the range of events to which unweighting is
applied. This option should only be set for partial unweighting.
A larger value means that a larger fraction of events are
unweighted. Typical values are between -1 and 1.
.. _`event output`:
**event output**
Specifies the name of a single event output file or a list of such
files. The file format is either specified explicitly or derived from
the suffix. For example, :code:`events.lhe` or, equivalently
:code:`Les Houches: events.lhe` generates an output event file
:code:`events.lhe` in the Les Houches format. The supported formats
are
- :code:`file.lhe` or :code:`Les Houches: file`: The Les Houches
event file format.
- :code:`file.hepmc2` or :code:`HepMC2: file`: HepMC format version 2.
- :code:`file.hepmc3` or :code:`HepMC3: file`: HepMC format version 3.
- :code:`file.hepmc` or :code:`HepMC: file`: The latest supported
version of the HepMC format, currently version 3.
+ - :code:`file.hdf5` or :code:`HDF5: file`: The HDF5-based format of
+ `arXiv:1905.05120 <https://arxiv.org/abs/1905.05120>`_.
.. _`random generator`:
**random generator**
Sets parameters for random number generation.
.. _`random generator: name`:
**name**
Which random number generator to use. Currently, :code:`mixmax`
and :code:`ranlux64` are supported. Mixmax is recommended. See
the `CLHEP documentation
<http://proj-clhep.web.cern.ch/proj-clhep/index.html#docu>`_ for
details on the generators.
.. _`random generator: seed`:
**seed**
The seed for random generation. This should be a single number for
:code:`mixmax` and the name of a state file for :code:`ranlux64`.
.. _`analysis`:
**analysis**
Name and settings for the event analyses; either a custom
analysis plugin or Rivet. For the first the :code:`plugin` sub-entry
should be set to the analysis file path. All further entries are passed on
to the analysis. To use Rivet, a list of Rivet analyses has to be
given in :code:`rivet` and a prefix for the yoda files has to be set
through :code:`output`. See :ref:`Writing custom analyses` for details.
.. _`vev`:
**vev**
Higgs vacuum expectation value in GeV. All electro-weak constants are derived
from this together with the `particle properties`_.
.. _`particle properties`:
**particle properties**
Specifies various properties of the different particles (Higgs, W or Z). All
electro-weak constants are derived from these together with the :ref:`vacuum
expectation value<vev>`.
.. _`particle properties: particle`:
**Higgs, W or Z**
The particle (Higgs, |W+| or |W-|, Z) for which the following properties
are defined.
.. |W+| replace:: W\ :sup:`+`
.. |W-| replace:: W\ :sup:`-`
.. _`particle properties: particle: mass`:
**mass**
The mass of the particle in GeV.
.. _`particle properties: particle: width`:
**width**
The total decay width of the particle in GeV.
.. _`Higgs coupling`:
**Higgs coupling**
This collects a number of settings concerning the effective coupling
of the Higgs boson to gluons. This is only relevant for the
production process of a Higgs boson with jets and only supported if
HEJ 2 was compiled with `QCDLoop
<https://github.com/scarrazza/qcdloop>`_ support.
.. _`Higgs coupling: use impact factors`:
**use impact factors**
Whether to use impact factors for the coupling to the most forward
and most backward partons. Impact factors imply the infinite
top-quark mass limit.
.. _`Higgs coupling: mt`:
**mt**
The value of the top-quark mass in GeV. If this is not specified,
the limit of an infinite mass is taken.
.. _`Higgs coupling: include bottom`:
**include bottom**
Whether to include the Higgs coupling to bottom quarks.
.. _`Higgs coupling: mb`:
**mb**
The value of the bottom-quark mass in GeV. Only used for the Higgs
coupling, external bottom-quarks are always assumed to be massless.
Advanced Settings
~~~~~~~~~~~~~~~~~
All of the following settings are optional. Please **do not set** any of the
following options, unless you know exactly what you are doing. The default
behaviour gives the most reliable results for a wide range of observables.
.. _`min extparton pt`:
**min extparton pt**
Specifies the minimum transverse momentum in GeV of the most forward and the
most backward parton. Its value should be slightly below the minimum
transverse momentum of jets specified by `resummation jets: min pt`_. This
setting got superseded by `max ext soft pt fraction`_ and will be removed in
future versions.
.. _`max events`:
**max events**
Maximum number of (input) fixed-order events. HEJ will stop after processing
`max events` events. By default all events are processed.
.. _`regulator parameter`:
**regulator parameter**
Slicing parameter to regularise the subtraction term, called :math:`\lambda`
in `arxiv:1706.01002 <https://arxiv.org/abs/1706.01002>`_. Default is 0.2
diff --git a/doc/sphinx/installation.rst b/doc/sphinx/installation.rst
index 24c5f27..349082c 100644
--- a/doc/sphinx/installation.rst
+++ b/doc/sphinx/installation.rst
@@ -1,97 +1,97 @@
.. _Installation:
Installation
============
Download
--------
A tar archive of the HEJ 2 source code can be downloaded and
decompressed with the command::
curl https://hej.web.cern.ch/HEJ/downloads/HEJ_2.0.tar.gz | tar -xz
To obtain the latest stable HEJ version, `HEJ_2.0.tar.gz` should be
replaced by `HEJ.tar.gz`.
Alternatively, the HEJ source code can be obtained by installing the
`git version control system <https://git-scm.com/>`_ and running::
git clone https://phab.hepforge.org/source/hej.git
We also provide a `Docker image <https://hub.docker.com/r/hejdock/hej>`_
containing a HEJ 2 installation. This image can be pulled with::
docker pull hejdock/hej
When using the Docker image the remaining installation steps can be
skipped.
Prerequisites
-------------
Before installing HEJ 2, you need the following programs and
libraries:
- `CMake <https://cmake.org/>`_ version 3.1
- A compiler supporting the C++14 standard, for example
`gcc <https://gcc.gnu.org/>`_ 5 or later
- `FastJet <http://fastjet.fr/>`_
- `CLHEP <https://gitlab.cern.ch/CLHEP/CLHEP>`_
- `LHAPDF <https://lhapdf.hepforge.org/>`_
- The `IOStreams` and `uBLAS` `boost <https://www.boost.org>`_ libraries
- `yaml-cpp <https://github.com/jbeder/yaml-cpp>`_
In addition, some optional features have additional dependencies:
- `Version 2 of QCDLoop <https://github.com/scarrazza/qcdloop>`_ is
required to include finite top mass corrections in Higgs boson + jets
production.
- `HepMC versions 2 and 3 <https://hepmc.web.cern.ch/hepmc/>`_ enable
event output in the respective format.
- `Rivet <https://rivet.hepforge.org/>`_ together with HepMC 2 allow
using Rivet analyses.
- `HighFive <https://github.com/BlueBrain/HighFive>`_ has to be
- installed in order to read event files in the
+ installed in order to read and write event files in the
`HDF5 <https://www.hdfgroup.org/>`_-based format suggested in
`arXiv:1905.05120 <https://arxiv.org/abs/1905.05120>`_.
Compilation
-----------
To compile and install HEJ 2 run::
cmake source/directory -DCMAKE_INSTALL_PREFIX=target/directory
make install
:file:`source/directory` is the directory containing the file
:file:`CMakeLists.txt`. If you omit
:code:`-DCMAKE_INSTALL_PREFIX=target/directory` HEJ 2 will be
installed to some default location.
In case some of the aforementioned prerequisites are not found by
:code:`cmake` you can give a hint by adding an additional argument
:code:`-Dlibname_ROOT_DIR=/directory/with/library`, where
:code:`libname` should be replaced by the name of the library in
question.
To not include specific packages one can add
:code:`-DEXCLUDE_packagename=TRUE` to :code:`cmake`, e.g. by
setting :code:`-DEXCLUDE_rivet=TRUE` HEJ 2 will not be interfaced
to `rivet` even if rivet is available on the system.
Testing
-------
To test your installation, download the NNPDF 2.3 PDF set with::
lhapdf install NNPDF23_nlo_as_0119
and run::
make test
The test data of HEJ are stored in the
`Git Large File Storage <https://git-lfs.github.com/>`_ format.
:code:`git clone` therefore requires :code:`git-lfs` to download the data
correctly.
diff --git a/include/HEJ/HDF5Writer.hh b/include/HEJ/HDF5Writer.hh
new file mode 100644
index 0000000..01103bf
--- /dev/null
+++ b/include/HEJ/HDF5Writer.hh
@@ -0,0 +1,55 @@
+/** \file
+ * \brief Contains the EventWriter for HDF5 Output.
+ *
+ * The output format is specified in arXiv:1905.05120.
+ *
+ * \authors The HEJ collaboration (see AUTHORS for details)
+ * \date 2019
+ * \copyright GPLv2 or later
+ */
+#pragma once
+
+#include <memory>
+#include <string>
+
+#include "HEJ/EventWriter.hh"
+
+namespace LHEF {
+ class HEPRUP;
+}
+
+namespace HEJ{
+ class Event;
+
+ //! This is an event writer specifically for HDF5 output.
+ /**
+ * \internal Implementation note: This uses the pimpl ("pointer to
+ * implementation") idiom. HDF5 support is optional. Without pimpl,
+ * we would have to specify whether HDF5 is available via the
+ * preprocessor whenever this header is included. We don't want to
+ * burden users of the HEJ library (for example the HEJ fixed-order
+ * generator) with those details.
+ */
+ class HDF5Writer: public EventWriter{
+ public:
+ //! Constructor
+ /**
+ * @param file name of the output file
+ * @param heprup general process information
+ */
+ HDF5Writer(std::string const & file, LHEF::HEPRUP heprup);
+ ~HDF5Writer() override = default;
+
+ //! Write an event to the output file
+ void write(Event const & ev) override;
+
+ private:
+ struct HDF5WriterImpl;
+ struct HDF5WriterImplDeleter {
+ void operator()(HDF5WriterImpl* p);
+ };
+
+ std::unique_ptr<HDF5WriterImpl, HDF5WriterImplDeleter> impl_;
+ };
+
+}
diff --git a/include/HEJ/output_formats.hh b/include/HEJ/output_formats.hh
index ef2a471..d1c08bd 100644
--- a/include/HEJ/output_formats.hh
+++ b/include/HEJ/output_formats.hh
@@ -1,40 +1,42 @@
/** \file
* \brief Defines formats for output to event files
*
* \authors The HEJ collaboration (see AUTHORS for details)
* \date 2019
* \copyright GPLv2 or later
*/
#pragma once
#include <stdexcept>
#include <string>
namespace HEJ{
//! Supported event file formats
enum class FileFormat{
Les_Houches, /*!< Les Houches Output */
HepMC3, /*!< HepMC3 Output */
HepMC2, /*!< HepMC2 Output */
+ HDF5, /*!< HDF5 Output */
HepMC=HepMC3 /*!< HepMC3 Output */
};
//! Convert a file format to a string
inline std::string to_string(FileFormat f){
switch(f){
case FileFormat::Les_Houches: return "Les Houches";
case FileFormat::HepMC2: return "HepMC2";
case FileFormat::HepMC3: return "HepMC3";
+ case FileFormat::HDF5: return "HDF5";
default:
throw std::logic_error("unhandled file format");
}
}
//! Output file specification
struct OutputFile{
std::string name; /**< Output File Name */
FileFormat format; /**< Output File Format */
};
}
diff --git a/src/Event.cc b/src/Event.cc
index 0a9544b..8d04a70 100644
--- a/src/Event.cc
+++ b/src/Event.cc
@@ -1,942 +1,941 @@
/**
* \authors The HEJ collaboration (see AUTHORS for details)
* \date 2019
* \copyright GPLv2 or later
*/
#include "HEJ/Event.hh"
#include <algorithm>
#include <assert.h>
#include <numeric>
#include <unordered_set>
#include <utility>
#include "LHEF/LHEF.h"
#include "fastjet/JetDefinition.hh"
#include "HEJ/Constants.hh"
#include "HEJ/exceptions.hh"
#include "HEJ/PDG_codes.hh"
namespace HEJ{
namespace {
constexpr int status_in = -1;
constexpr int status_decayed = 2;
constexpr int status_out = 1;
//! true if leptonic W decay
bool valid_W_decay( int const w_type, // sign of W
std::vector<Particle> const & decays
){
if(decays.size() != 2) // no 1->2 decay
return false;
const int pidsum = decays[0].type + decays[1].type;
if( std::abs(pidsum) != 1 || pidsum != w_type ) // correct charge
return false;
// leptonic decay (only check first, second follows from pidsum)
if( w_type == 1 ) // W+
return is_antilepton(decays[0]) || is_neutrino(decays[0]);
// W-
return is_lepton(decays[0]) || is_antineutrino(decays[0]);
}
/// @name helper functions to determine event type
//@{
/**
* \brief check if final state valid for HEJ
*
* check if there is at most one photon, W, H, Z in the final state
* and all the rest are quarks or gluons
*/
bool final_state_ok(Event const & ev){
std::vector<Particle> const & outgoing = ev.outgoing();
if(ev.decays().size() > 1) // at most one decay
return false;
bool has_AWZH_boson = false;
for( size_t i=0; i<outgoing.size(); ++i ){
auto const & out{ outgoing[i] };
if(is_AWZH_boson(out.type)){
// at most one boson
if(has_AWZH_boson) return false;
has_AWZH_boson = true;
// valid decay for W
if(std::abs(out.type) == ParticleID::Wp){
// exactly 1 decay of W
if( ev.decays().size() != 1 || ev.decays().cbegin()->first != i )
return false;
if( !valid_W_decay(out.type>0?+1:-1, ev.decays().cbegin()->second) )
return false;
}
}
else if(! is_parton(out.type)) return false;
}
return true;
}
/**
* returns all EventTypes implemented in HEJ
*/
size_t implemented_types(std::vector<Particle> const & bosons){
using namespace event_type;
if(bosons.empty()) return FKL | unob | unof; // pure jets
if(bosons.size()>1) return non_resummable; // multi boson
switch (bosons[0].type) {
case ParticleID::Wp:
case ParticleID::Wm:
return FKL | unob | unof | qqxexb | qqxexf | qqxmid;
case ParticleID::h:
return FKL | unob | unof;
default:
return non_resummable;
}
}
/**
* \brief function which determines if type change is consistent with Wp emission.
* @param in incoming Particle id
* @param out outgoing Particle id
* @param qqx Current both incoming/both outgoing?
*
* \see is_Wm_Change
*/
bool is_Wp_Change(ParticleID in, ParticleID out, bool qqx){
if(!qqx && (in==-1 || in== 2 || in==-3 || in== 4)) return out== (in-1);
if( qqx && (in== 1 || in==-2 || in== 3 || in==-4)) return out==-(in+1);
return false;
}
/**
* \brief function which determines if type change is consistent with Wm emission.
* @param in incoming Particle id
* @param out outgoing Particle id
* @param qqx Current both incoming/both outgoing?
*
* Ensures that the flavour change of the quark line is possible via a
* flavour-changing Wm emission. Also allows checking of qqx currents.
*/
bool is_Wm_Change(ParticleID in, ParticleID out, bool qqx){
if(!qqx && (in== 1 || in==-2 || in== 3 || in==-4)) return out== (in+1);
if( qqx && (in==-1 || in== 2 || in==-3 || in== 4)) return out==-(in-1);
return false;
}
/**
* \brief checks if particle type remains same from incoming to outgoing
* @param in incoming Particle
* @param out outgoing Particle
* @param qqx Current both incoming/outgoing?
*/
bool no_flavour_change(ParticleID in, ParticleID out, bool qqx){
const int qqxCurrent = qqx?-1:1;
if(abs(in)<=6 || in==pid::gluon) return (in==out*qqxCurrent);
else return false;
}
bool has_2_jets(Event const & event){
return event.jets().size() >= 2;
}
/**
* \brief check if we have a valid Impact factor
* @param in incoming Particle
* @param out outgoing Particle
* @param qqx Current both incoming/outgoing?
* @param W_change incremented by +1 for a Wp change, by -1 for a Wm change, else unchanged
*/
bool is_valid_impact_factor(
ParticleID in, ParticleID out, bool qqx, int & W_change
){
if( no_flavour_change(in, out, qqx) ){
return true;
}
if( is_Wp_Change(in, out, qqx) ) {
W_change+=1;
return true;
}
if( is_Wm_Change(in, out, qqx) ) {
W_change-=1;
return true;
}
return false;
}
//! Returns all possible classifications from the impact factors
// the beginning points are changed s.t. after the classification they
// point to the beginning of the (potential) FKL chain
// sets W_change: + if Wp change
// 0 if no change
// - if Wm change
// This function can be used with forward & backwards iterators
template<class OutIterator>
size_t possible_impact_factors(
ParticleID incoming_id, // incoming
OutIterator & begin_out, OutIterator const & end_out, // outgoing
int & W_change, std::vector<Particle> const & boson,
bool const backward // backward?
){
using namespace event_type;
assert(boson.size() < 2);
// keep track of all states that we don't test
size_t not_tested = qqxmid;
if(backward)
not_tested |= unof | qqxexf;
else
not_tested |= unob | qqxexb;
// Is this LL current?
if( is_valid_impact_factor(incoming_id, begin_out->type, false, W_change) ){
++begin_out;
return not_tested | FKL;
}
// or NLL current?
// -> needs two partons in two different jets
if( std::distance(begin_out, end_out)>=2
){
// Is this an unordered emission?
if( incoming_id!=pid::gluon && begin_out->type==pid::gluon ){
if( is_valid_impact_factor(
incoming_id, (begin_out+1)->type, false, W_change )
){
// veto Higgs inside uno
assert((begin_out+1)<end_out);
if( !boson.empty() && boson.front().type == ParticleID::h
){
if( (backward && boson.front().rapidity() < (begin_out+1)->rapidity())
||(!backward && boson.front().rapidity() > (begin_out+1)->rapidity()))
return non_resummable;
}
begin_out+=2;
return not_tested | (backward?unob:unof);
}
}
// Is this QQbar?
else if( incoming_id==pid::gluon ){
if( is_valid_impact_factor(
begin_out->type, (begin_out+1)->type, true, W_change )
){
// veto Higgs inside qqx
assert((begin_out+1)<end_out);
if( !boson.empty() && boson.front().type == ParticleID::h
){
if( (backward && boson.front().rapidity() < (begin_out+1)->rapidity())
||(!backward && boson.front().rapidity() > (begin_out+1)->rapidity()))
return non_resummable;
}
begin_out+=2;
return not_tested | (backward?qqxexb:qqxexf);
}
}
}
return non_resummable;
}
//! Returns all possible classifications from central emissions
// the beginning points are changed s.t. after the classification they
// point to the end of the emission chain
// sets W_change: + if Wp change
// 0 if no change
// - if Wm change
template<class OutIterator>
size_t possible_central(
OutIterator & begin_out, OutIterator const & end_out,
int & W_change, std::vector<Particle> const & boson,
OutIterator & qqx_pos
){
using namespace event_type;
assert(boson.size() < 2);
// if we already passed the central chain,
// then it is not a valid all-order state
if(std::distance(begin_out, end_out) < 0) return non_resummable;
// keep track of all states that we don't test
size_t possible = unob | unof
| qqxexb | qqxexf;
// Find the first non-gluon/non-FKL
while( (begin_out->type==pid::gluon) && (begin_out<end_out) ){
++begin_out;
}
// end of chain -> FKL
if( begin_out==end_out ){
return possible | FKL;
}
// is this a qqbar-pair?
// needs two partons in two separate jets
if( is_valid_impact_factor(
begin_out->type, (begin_out+1)->type, true, W_change )
){
// veto Higgs inside qqx
if( !boson.empty() && boson.front().type == ParticleID::h
&& boson.front().rapidity() > begin_out->rapidity()
&& boson.front().rapidity() < (begin_out+1)->rapidity()
){
return non_resummable;
}
qqx_pos=begin_out;
begin_out+=2;
// remaining chain should be pure gluon/FKL
for(; begin_out<end_out; ++begin_out){
if(begin_out->type != pid::gluon) return non_resummable;
}
return possible | qqxmid;
}
return non_resummable;
}
bool invalid_jet(std::unordered_set<int> & other, int const idx){
if(idx<0) return true;
if(other.find(idx) != other.cend()) return true;
other.insert(idx);
return false;
}
bool jets_ok( size_t const final_type,
std::vector<int> const & jet_idx, size_t const qqx_pos
){
using namespace event_type;
std::unordered_set<int> other;
auto idx_begin{jet_idx.cbegin()};
auto idx_end{jet_idx.crbegin()};
// always separate extremal jets
if(invalid_jet(other, *idx_begin)) return false;
if(invalid_jet(other, *idx_end)) return false;
// unob/qqxexb -> second parton in its own jet (unof/qqxexf analogously from the back)
if( (final_type & (unob | qqxexb))
&& invalid_jet(other, *(idx_begin+1)) ) return false;
if( (final_type & (unof | qqxexf))
&& invalid_jet(other, *(idx_end+1)) ) return false;
assert( !(final_type & qqxmid) || jet_idx.size()>qqx_pos+1 );
if( (final_type & qqxmid)
&& ( invalid_jet(other, *(idx_begin+qqx_pos))
|| invalid_jet(other, *(idx_begin+qqx_pos+1)) ) ) return false;
return true;
}
/**
* \brief Checks for all event types
* @param ev Event
* @returns Event Type
*
*/
event_type::EventType classify(Event const & ev){
using namespace event_type;
if(! has_2_jets(ev))
return no_2_jets;
// currently we can't handle multiple boson states in the ME. So they are
// considered "bad_final_state" even though the "classify" could work with
// them.
if(! final_state_ok(ev))
return bad_final_state;
// initialise variables
auto const & in = ev.incoming();
auto const & out = filter_partons(ev.outgoing());
assert(std::distance(begin(in), end(in)) == 2);
assert(out.size() >= 2);
assert(std::distance(begin(out), end(out)) >= 2);
assert(std::is_sorted(begin(out), end(out), rapidity_less{}));
auto const boson{ filter_AWZH_bosons(ev.outgoing()) };
// we only allow one boson through final_state_ok
assert(boson.size()<=1);
// keep track of potential W couplings, at the end the sum should be 0
int remaining_Wp = 0;
int remaining_Wm = 0;
if(!boson.empty() && abs(boson.front().type) == ParticleID::Wp ){
if(boson.front().type>0) ++remaining_Wp;
else ++remaining_Wm;
}
int W_change = 0;
// range for current checks
auto begin_out{out.cbegin()};
auto end_out{out.crbegin()};
size_t final_type = ~(no_2_jets | bad_final_state);
// check backward impact factor
final_type &= possible_impact_factors(
in.front().type,
begin_out, end_out.base(),
W_change, boson, true );
if( final_type == non_resummable )
return non_resummable;
if(W_change>0) remaining_Wp-=W_change;
else if(W_change<0) remaining_Wm+=W_change;
W_change = 0;
// check forward impact factor
final_type &= possible_impact_factors(
in.back().type,
end_out, std::make_reverse_iterator(begin_out),
W_change, boson, false );
if( final_type == non_resummable )
return non_resummable;
if(W_change>0) remaining_Wp-=W_change;
else if(W_change<0) remaining_Wm+=W_change;
W_change = 0;
// check central emissions
auto qqx_pos{out.cend()};
final_type &= possible_central(
begin_out, end_out.base(), W_change, boson, qqx_pos );
if( final_type == non_resummable )
return non_resummable;
assert( !(final_type&qqxmid) || qqx_pos != out.cend() );
if(W_change>0) remaining_Wp-=W_change;
else if(W_change<0) remaining_Wm+=W_change;
// Check whether the right number of Ws are present
if( remaining_Wp != 0 || remaining_Wm != 0 ) return non_resummable;
// result has to be unique
if( (final_type & (final_type-1)) != 0) return non_resummable;
// check jet configurations
if(!jets_ok( final_type,
ev.particle_jet_indices( ev.jets() ),
std::distance( out.cbegin(), qqx_pos) ))
return non_resummable;
// check that each subprocess is implemented
// (has to be done at the end)
if( (final_type & ~implemented_types(boson)) != 0 )
return non_resummable;
return static_cast<EventType>(final_type);
}
//@}
Particle extract_particle(LHEF::HEPEUP const & hepeup, int i){
const ParticleID id = static_cast<ParticleID>(hepeup.IDUP[i]);
const fastjet::PseudoJet momentum{
hepeup.PUP[i][0], hepeup.PUP[i][1],
hepeup.PUP[i][2], hepeup.PUP[i][3]
};
if(is_parton(id))
return Particle{ id, std::move(momentum), hepeup.ICOLUP[i] };
return Particle{ id, std::move(momentum), {} };
}
bool is_decay_product(std::pair<int, int> const & mothers){
if(mothers.first == 0) return false;
return mothers.second == 0 || mothers.first == mothers.second;
}
} // namespace anonymous
Event::EventData::EventData(LHEF::HEPEUP const & hepeup){
parameters.central = EventParameters{
hepeup.scales.mur, hepeup.scales.muf, hepeup.weight()
};
size_t in_idx = 0;
for (int i = 0; i < hepeup.NUP; ++i) {
// skip decay products
// we will add them later on, but we have to ensure that
// the decayed particle is added first
if(is_decay_product(hepeup.MOTHUP[i])) continue;
auto particle = extract_particle(hepeup, i);
// needed to identify mother particles for decay products
particle.p.set_user_index(i+1);
if(hepeup.ISTUP[i] == status_in){
if(in_idx >= incoming.size()) {
throw std::invalid_argument{
"Event has too many incoming particles"
};
}
incoming[in_idx++] = std::move(particle);
}
else outgoing.emplace_back(std::move(particle));
}
// add decay products
for (int i = 0; i < hepeup.NUP; ++i) {
if(!is_decay_product(hepeup.MOTHUP[i])) continue;
const int mother_id = hepeup.MOTHUP[i].first;
const auto mother = std::find_if(
begin(outgoing), end(outgoing),
[mother_id](Particle const & particle){
return particle.p.user_index() == mother_id;
}
);
if(mother == end(outgoing)){
throw std::invalid_argument{"invalid decay product parent"};
}
const int mother_idx = std::distance(begin(outgoing), mother);
assert(mother_idx >= 0);
decays[mother_idx].emplace_back(extract_particle(hepeup, i));
}
}
Event::Event(
UnclusteredEvent const & ev,
fastjet::JetDefinition const & jet_def, double const min_jet_pt
):
Event( Event::EventData{
ev.incoming, ev.outgoing, ev.decays,
Parameters<EventParameters>{ev.central, ev.variations}
}.cluster(jet_def, min_jet_pt) )
{}
//! @TODO remove in HEJ 2.2.0
UnclusteredEvent::UnclusteredEvent(LHEF::HEPEUP const & hepeup){
Event::EventData const evData{hepeup};
incoming = evData.incoming;
outgoing = evData.outgoing;
decays = evData.decays;
central = evData.parameters.central;
variations = evData.parameters.variations;
}
void Event::EventData::sort(){
// sort particles
std::sort(
begin(incoming), end(incoming),
[](Particle o1, Particle o2){return o1.p.pz()<o2.p.pz();}
);
auto old_outgoing = std::move(outgoing);
std::vector<size_t> idx(old_outgoing.size());
std::iota(idx.begin(), idx.end(), 0);
std::sort(idx.begin(), idx.end(), [&old_outgoing](size_t i, size_t j){
return old_outgoing[i].rapidity() < old_outgoing[j].rapidity();
});
outgoing.clear();
outgoing.reserve(old_outgoing.size());
for(size_t i: idx) {
outgoing.emplace_back(std::move(old_outgoing[i]));
}
// find decays again
if(!decays.empty()){
auto old_decays = std::move(decays);
decays.clear();
for(size_t i=0; i<idx.size(); ++i) {
auto decay = old_decays.find(idx[i]);
if(decay != old_decays.end())
decays.emplace(i, std::move(decay->second));
}
assert(old_decays.size() == decays.size());
}
}
namespace {
Particle reconstruct_boson(std::vector<Particle> const & leptons) {
Particle decayed_boson;
decayed_boson.p = leptons[0].p + leptons[1].p;
const int pidsum = leptons[0].type + leptons[1].type;
if(pidsum == +1) {
assert(is_antilepton(leptons[0]));
if(is_antineutrino(leptons[0])) {
throw not_implemented{"lepton-flavour violating final state"};
}
assert(is_neutrino(leptons[1]));
// charged antilepton + neutrino means we had a W+
decayed_boson.type = pid::Wp;
}
else if(pidsum == -1) {
assert(is_antilepton(leptons[0]));
if(is_neutrino(leptons[1])) {
throw not_implemented{"lepton-flavour violating final state"};
}
assert(is_antineutrino(leptons[0]));
// charged lepton + antineutrino means we had a W-
decayed_boson.type = pid::Wm;
}
else {
throw not_implemented{
"final state with leptons "
+ name(leptons[0].type)
+ " and "
+ name(leptons[1].type)
};
}
return decayed_boson;
}
}
void Event::EventData::reconstruct_intermediate() {
const auto begin_leptons = std::partition(
begin(outgoing), end(outgoing),
[](Particle const & p) {return !is_anylepton(p);}
);
if(begin_leptons == end(outgoing)) return;
assert(is_anylepton(*begin_leptons));
std::vector<Particle> leptons(begin_leptons, end(outgoing));
outgoing.erase(begin_leptons, end(outgoing));
if(leptons.size() != 2) {
throw not_implemented{"Final states with one or more than two leptons"};
}
std::sort(
begin(leptons), end(leptons),
[](Particle const & p0, Particle const & p1) {
return p0.type < p1.type;
}
);
outgoing.emplace_back(reconstruct_boson(leptons));
decays.emplace(outgoing.size()-1, std::move(leptons));
}
Event Event::EventData::cluster(
fastjet::JetDefinition const & jet_def, double const min_jet_pt
){
sort();
Event ev{ std::move(incoming), std::move(outgoing), std::move(decays),
std::move(parameters),
jet_def, min_jet_pt
};
assert(std::is_sorted(begin(ev.outgoing_), end(ev.outgoing_),
rapidity_less{}));
ev.type_ = classify(ev);
return ev;
}
Event::Event(
std::array<Particle, 2> && incoming,
std::vector<Particle> && outgoing,
std::unordered_map<size_t, std::vector<Particle>> && decays,
Parameters<EventParameters> && parameters,
fastjet::JetDefinition const & jet_def,
double const min_jet_pt
): incoming_{std::move(incoming)},
outgoing_{std::move(outgoing)},
decays_{std::move(decays)},
parameters_{std::move(parameters)},
cs_{ to_PseudoJet( filter_partons(outgoing_) ), jet_def },
min_jet_pt_{min_jet_pt}
{
jets_ = sorted_by_rapidity(cs_.inclusive_jets(min_jet_pt_));
}
namespace {
// check that Particles have a reasonable colour
bool correct_colour(Particle const & part){
ParticleID id{ part.type };
if(!is_parton(id))
return !part.colour;
if(!part.colour)
return false;
Colour const & col{ *part.colour };
if(is_quark(id))
return col.first != 0 && col.second == 0;
if(is_antiquark(id))
return col.first == 0 && col.second != 0;
assert(id==ParticleID::gluon);
return col.first != 0 && col.second != 0 && col.first != col.second;
}
}
bool Event::is_leading_colour() const {
if( !correct_colour(incoming()[0]) || !correct_colour(incoming()[1]) )
return false;
Colour line_colour = *incoming()[0].colour;
std::swap(line_colour.first, line_colour.second);
for(auto const & part: outgoing()){
// reasonable colour
if(!correct_colour(part))
return false;
if(!is_parton(part)) // skip colour neutral particles
continue;
// if possible connect to line
if( line_colour.first == part.colour->second )
line_colour.first = part.colour->first;
else if( line_colour.second == part.colour->first )
line_colour.second = part.colour->second;
else
return false;
// no colour singlet exchange/disconnected diagram
if(line_colour.first == line_colour.second)
return false;
}
return (incoming()[1].colour->first == line_colour.first)
&& (incoming()[1].colour->second == line_colour.second);
}
namespace {
void connect_incoming(Particle & in, int & colour, int & anti_colour){
in.colour = std::make_pair(anti_colour, colour);
// gluon
if(in.type == pid::gluon)
return;
if(in.type > 0){
// quark
assert(is_quark(in));
in.colour->second = 0;
colour*=-1;
return;
}
// anti-quark
assert(is_antiquark(in));
in.colour->first = 0;
anti_colour*=-1;
return;
}
}
bool Event::generate_colours(RNG & ran){
// generate only for HEJ events
if(!event_type::is_resummable(type()))
return false;
assert(std::is_sorted(
begin(outgoing()), end(outgoing()), rapidity_less{}));
assert(incoming()[0].pz() < incoming()[1].pz());
// positive (anti-)colour -> can connect
// negative (anti-)colour -> not available/used up by (anti-)quark
int colour = COLOUR_OFFSET;
int anti_colour = colour+1;
// initialise first
connect_incoming(incoming_[0], colour, anti_colour);
for(auto & part: outgoing_){
assert(colour>0 || anti_colour>0);
if(part.type == ParticleID::gluon){
// gluon
if(colour>0 && anti_colour>0){
// on g line => connect to colour OR anti-colour (random)
if(ran.flat() < 0.5){
part.colour = std::make_pair(colour+2,colour);
colour+=2;
} else {
part.colour = std::make_pair(anti_colour, anti_colour+2);
anti_colour+=2;
}
} else if(colour > 0){
// on q line => connect to available colour
part.colour = std::make_pair(colour+2, colour);
colour+=2;
} else {
assert(colour<0 && anti_colour>0);
// on qx line => connect to available anti-colour
part.colour = std::make_pair(anti_colour, anti_colour+2);
anti_colour+=2;
}
} else if(is_quark(part)) {
// quark
assert(anti_colour>0);
if(colour>0){
// on g line => connect and remove anti-colour
part.colour = std::make_pair(anti_colour, 0);
anti_colour+=2;
anti_colour*=-1;
} else {
// on qx line => new colour
colour*=-1;
part.colour = std::make_pair(colour, 0);
}
} else if(is_antiquark(part)) {
// anti-quark
assert(colour>0);
if(anti_colour>0){
// on g line => connect and remove colour
part.colour = std::make_pair(0, colour);
colour+=2;
colour*=-1;
} else {
// on q line => new anti-colour
anti_colour*=-1;
part.colour = std::make_pair(0, anti_colour);
}
} else { // not a parton
assert(!is_parton(part));
part.colour = {};
}
}
// Connect last
connect_incoming(incoming_[1], anti_colour, colour);
assert(is_leading_colour());
return true;
} // generate_colours
Event::ConstPartonIterator Event::begin_partons() const {
return cbegin_partons();
};
Event::ConstPartonIterator Event::cbegin_partons() const {
return boost::make_filter_iterator(
static_cast<bool (*)(Particle const &)>(is_parton),
cbegin(outgoing()),
cend(outgoing())
);
};
Event::ConstPartonIterator Event::end_partons() const {
return cend_partons();
};
Event::ConstPartonIterator Event::cend_partons() const {
return boost::make_filter_iterator(
static_cast<bool (*)(Particle const &)>(is_parton),
cend(outgoing()),
cend(outgoing())
);
};
namespace {
void print_momentum(std::ostream & os, fastjet::PseudoJet const & part){
const std::streamsize orig_prec = os.precision();
os <<std::scientific<<std::setprecision(6) << "["
<<std::setw(13)<<std::right<< part.px() << ", "
<<std::setw(13)<<std::right<< part.py() << ", "
<<std::setw(13)<<std::right<< part.pz() << ", "
<<std::setw(13)<<std::right<< part.E() << "]"<< std::fixed;
os.precision(orig_prec);
}
void print_colour(std::ostream & os, optional<Colour> const & col){
if(!col)
os << "(no color)"; // American spelling for better alignment
else
os << "(" <<std::setw(3)<<std::right<< col->first
<< ", " <<std::setw(3)<<std::right<< col->second << ")";
}
}
std::ostream& operator<<(std::ostream & os, Event const & ev){
const std::streamsize orig_prec = os.precision();
os <<std::setprecision(4)<<std::fixed;
os << "########## " << event_type::name(ev.type()) << " ##########" << std::endl;
os << "Incoming particles:\n";
for(auto const & in: ev.incoming()){
os <<std::setw(3)<< in.type << ": ";
print_colour(os, in.colour);
os << " ";
print_momentum(os, in.p);
os << std::endl;
}
os << "\nOutgoing particles: " << ev.outgoing().size() << "\n";
for(auto const & out: ev.outgoing()){
os <<std::setw(3)<< out.type << ": ";
print_colour(os, out.colour);
os << " ";
print_momentum(os, out.p);
os << " => rapidity="
<<std::setw(7)<<std::right<< out.rapidity() << std::endl;
}
os << "\nForming Jets: " << ev.jets().size() << "\n";
for(auto const & jet: ev.jets()){
print_momentum(os, jet);
os << " => rapidity="
<<std::setw(7)<<std::right<< jet.rapidity() << std::endl;
}
if(ev.decays().size() > 0 ){
os << "\nDecays: " << ev.decays().size() << "\n";
for(auto const & decay: ev.decays()){
os <<std::setw(3)<< ev.outgoing()[decay.first].type
<< " (" << decay.first << ") to:\n";
for(auto const & out: decay.second){
os <<" "<<std::setw(3)<< out.type << ": ";
print_momentum(os, out.p);
os << " => rapidity="
<<std::setw(7)<<std::right<< out.rapidity() << std::endl;
}
}
}
os << std::defaultfloat;
os.precision(orig_prec);
return os;
}
double shat(Event const & ev){
return (ev.incoming()[0].p + ev.incoming()[1].p).m2();
}
LHEF::HEPEUP to_HEPEUP(Event const & event, LHEF::HEPRUP * heprup){
LHEF::HEPEUP result;
result.heprup = heprup;
result.weights = {{event.central().weight, nullptr}};
for(auto const & var: event.variations()){
result.weights.emplace_back(var.weight, nullptr);
}
size_t num_particles = event.incoming().size() + event.outgoing().size();
for(auto const & decay: event.decays()) num_particles += decay.second.size();
result.NUP = num_particles;
// the following entries are pretty much meaningless
result.IDPRUP = event.type(); // event type
result.AQEDUP = 1./128.; // alpha_EW
//result.AQCDUP = 0.118 // alpha_QCD
// end meaningless part
result.XWGTUP = event.central().weight;
result.SCALUP = event.central().muf;
result.scales.muf = event.central().muf;
result.scales.mur = event.central().mur;
result.scales.SCALUP = event.central().muf;
result.pdfinfo.p1 = event.incoming().front().type;
result.pdfinfo.p2 = event.incoming().back().type;
result.pdfinfo.scale = event.central().muf;
result.IDUP.reserve(num_particles); // PID
result.ISTUP.reserve(num_particles); // status (in, out, decay)
result.PUP.reserve(num_particles); // momentum
result.MOTHUP.reserve(num_particles); // index mother particle
result.ICOLUP.reserve(num_particles); // colour
// incoming
std::array<Particle, 2> incoming{ event.incoming() };
// The first incoming particle should have positive pz according to the LHE standard
// (at least most generators do it this way, and Pythia assumes it)
if(incoming[0].pz() < incoming[1].pz())
std::swap(incoming[0], incoming[1]);
for(Particle const & in: incoming){
result.IDUP.emplace_back(in.type);
result.ISTUP.emplace_back(status_in);
result.PUP.push_back({in.p[0], in.p[1], in.p[2], in.p[3], in.p.m()});
result.MOTHUP.emplace_back(0, 0);
assert(in.colour);
result.ICOLUP.emplace_back(*in.colour);
}
// outgoing
for(size_t i = 0; i < event.outgoing().size(); ++i){
Particle const & out = event.outgoing()[i];
result.IDUP.emplace_back(out.type);
const int status = event.decays().count(i)?status_decayed:status_out;
result.ISTUP.emplace_back(status);
result.PUP.push_back({out.p[0], out.p[1], out.p[2], out.p[3], out.p.m()});
result.MOTHUP.emplace_back(1, 2);
if(out.colour)
result.ICOLUP.emplace_back(*out.colour);
else{
- assert(is_AWZH_boson(out));
result.ICOLUP.emplace_back(std::make_pair(0,0));
}
}
// decays
for(auto const & decay: event.decays()){
for(auto const out: decay.second){
result.IDUP.emplace_back(out.type);
result.ISTUP.emplace_back(status_out);
result.PUP.push_back({out.p[0], out.p[1], out.p[2], out.p[3], out.p.m()});
const size_t mother_idx = 1 + event.incoming().size() + decay.first;
result.MOTHUP.emplace_back(mother_idx, mother_idx);
result.ICOLUP.emplace_back(0,0);
}
}
assert(result.ICOLUP.size() == num_particles);
static constexpr double unknown_spin = 9.; //per Les Houches accord
result.VTIMUP = std::vector<double>(num_particles, unknown_spin);
result.SPINUP = result.VTIMUP;
return result;
}
}
diff --git a/src/HDF5Writer.cc b/src/HDF5Writer.cc
new file mode 100644
index 0000000..c61d1e0
--- /dev/null
+++ b/src/HDF5Writer.cc
@@ -0,0 +1,386 @@
+/**
+ * \authors The HEJ collaboration (see AUTHORS for details)
+ * \date 2019
+ * \copyright GPLv2 or later
+ */
+#include "HEJ/HDF5Writer.hh"
+
+#include <cassert>
+#include <cmath>
+#include <stdexcept>
+
+#include "LHEF/LHEF.h"
+
+#ifdef HEJ_BUILD_WITH_HDF5
+
+#include <type_traits>
+
+#include "HEJ/event_types.hh"
+#include "HEJ/Event.hh"
+
+#include "highfive/H5File.hpp"
+
+namespace HEJ{
+
+ using HighFive::File;
+ using HighFive::DataSpace;
+
+ namespace{
+ constexpr std::size_t chunk_size = 1000;
+ constexpr unsigned compression_level = 3;
+
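+ // event types are single-bit flags; map them to consecutive indices:
+ // 0 -> 0, 1 -> 1, 2 -> 2, 4 -> 3, 8 -> 4, ...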
+ size_t to_index(event_type::EventType const type){
+ return type==0?0:floor(log2(type))+1;
+ }
+
+ template<typename T>
+ void write_dataset(HighFive::Group & group, std::string const & name, T val) {
+ using data_t = std::decay_t<T>;
+ group.createDataSet<data_t>(name, DataSpace::From(val)).write(val);
+ }
+
+ template<typename T>
+ void write_dataset(
+ HighFive::Group & group, std::string const & name,
+ std::vector<T> const & val
+ ) {
+ using data_t = std::decay_t<T>;
+ group.createDataSet<data_t>(name, DataSpace::From(val)).write(val);
+ }
+
+ struct Cache {
+ explicit Cache(size_t capacity):
+ capacity{capacity}
+ {
+ nparticles.reserve(capacity);
+ start.reserve(capacity);
+ pid.reserve(capacity);
+ weight.reserve(capacity);
+ scale.reserve(capacity);
+ fscale.reserve(capacity);
+ rscale.reserve(capacity);
+ aqed.reserve(capacity);
+ aqcd.reserve(capacity);
+ trials.reserve(capacity);
+ }
+
+ void fill(HEJ::Event ev) {
+ const auto hepeup = to_HEPEUP(ev, nullptr);
+
+ fill_event_params(hepeup);
+ fill_event_particles(hepeup);
+ }
+
+ void fill_event_params(LHEF::HEPEUP const & ev) {
+ nparticles.emplace_back(ev.NUP);
+ start.emplace_back(particle_pos);
+ pid.emplace_back(ev.IDPRUP);
+ weight.emplace_back(ev.XWGTUP);
+ scale.emplace_back(ev.SCALUP);
+ fscale.emplace_back(ev.scales.muf);
+ rscale.emplace_back(ev.scales.mur);
+ aqed.emplace_back(ev.AQEDUP);
+ aqcd.emplace_back(ev.AQCDUP);
+ // set first trial=1 for first event
+ // -> sum(trials) = 1 -> xs=sum(weights)/sum(trials) as in Sherpa
+ if(particle_pos == 0){
+ trials.emplace_back(1.);
+ } else {
+ trials.emplace_back(0.);
+ }
+ particle_pos += ev.NUP;
+ }
+
+ void fill_event_particles(LHEF::HEPEUP const & ev) {
+ id.insert(end(id), begin(ev.IDUP), end(ev.IDUP));
+ status.insert(end(status), begin(ev.ISTUP), end(ev.ISTUP));
+ lifetime.insert(end(lifetime), begin(ev.VTIMUP), end(ev.VTIMUP));
+ spin.insert(end(spin), begin(ev.SPINUP), end(ev.SPINUP));
+ for(int i = 0; i < ev.NUP; ++i) {
+ mother1.emplace_back(ev.MOTHUP[i].first);
+ mother2.emplace_back(ev.MOTHUP[i].second);
+ color1.emplace_back(ev.ICOLUP[i].first);
+ color2.emplace_back(ev.ICOLUP[i].second);
+ px.emplace_back(ev.PUP[i][0]);
+ py.emplace_back(ev.PUP[i][1]);
+ pz.emplace_back(ev.PUP[i][2]);
+ e.emplace_back(ev.PUP[i][3]);
+ m.emplace_back(ev.PUP[i][4]);
+ }
+ }
+
+ bool is_full() const {
+ return nparticles.size() >= capacity;
+ }
+
+ void clear() {
+ nparticles.clear();
+ start.clear();
+ pid.clear();
+ id.clear();
+ status.clear();
+ mother1.clear();
+ mother2.clear();
+ color1.clear();
+ color2.clear();
+ weight.clear();
+ scale.clear();
+ fscale.clear();
+ rscale.clear();
+ aqed.clear();
+ aqcd.clear();
+ trials.clear();
+ px.clear();
+ py.clear();
+ pz.clear();
+ e.clear();
+ m.clear();
+ lifetime.clear();
+ spin.clear();
+ }
+
+ size_t capacity;
+ std::vector<int> nparticles, start, pid, id, status,
+ mother1, mother2, color1, color2;
+ std::vector<double> weight, scale, fscale, rscale, aqed,
+ aqcd, trials, px, py, pz, e, m, lifetime, spin;
+
+ private:
+ size_t particle_pos = 0;
+ };
+
+ }
+
+ struct HDF5Writer::HDF5WriterImpl{
+ File file;
+ LHEF::HEPRUP heprup;
+ Cache cache{chunk_size};
+ size_t event_idx = 0;
+ size_t particle_idx = 0;
+
+ HDF5WriterImpl(std::string const & filename, LHEF::HEPRUP && hepr):
+ file{filename, File::ReadWrite | File::Create | File::Truncate},
+ heprup{std::move(hepr)}
+ {
+ // TODO: code duplication with Les Houches Writer
+ const int max_number_types = to_index(event_type::last_type)+1;
+ heprup.NPRUP = max_number_types;
+ // ids of event types
+ heprup.LPRUP.clear();
+ heprup.LPRUP.reserve(max_number_types);
+ heprup.LPRUP.emplace_back(0);
+ for(size_t i=event_type::first_type+1; i<=event_type::last_type; i*=2) {
+ heprup.LPRUP.emplace_back(i);
+ }
+
+ heprup.XSECUP = std::vector<double>(max_number_types, 0.);
+ heprup.XERRUP = std::vector<double>(max_number_types, 0.);
+ heprup.XMAXUP = std::vector<double>(max_number_types, 0.);
+
+ write_init();
+ create_event_group();
+ create_particle_group();
+ }
+
+ void write_init() {
+ auto init = file.createGroup("init");
+
+ write_dataset(init, "PDFgroupA" , heprup.PDFGUP.first);
+ write_dataset(init, "PDFgroupB" , heprup.PDFGUP.second);
+ write_dataset(init, "PDFsetA" , heprup.PDFSUP.first);
+ write_dataset(init, "PDFsetB" , heprup.PDFSUP.second);
+ write_dataset(init, "beamA" , heprup.IDBMUP.first);
+ write_dataset(init, "beamB" , heprup.IDBMUP.second);
+ write_dataset(init, "energyA" , heprup.EBMUP.first);
+ write_dataset(init, "energyB" , heprup.EBMUP.second);
+ write_dataset(init, "numProcesses" , heprup.NPRUP);
+ write_dataset(init, "weightingStrategy", heprup.IDWTUP);
+
+ auto proc_info = file.createGroup("procInfo");
+ write_dataset(proc_info, "procId", heprup.LPRUP);
+ }
+
+ static HighFive::DataSetCreateProps const & hdf5_chunk() {
+ static const auto props = [](){
+ HighFive::DataSetCreateProps props;
+ props.add(HighFive::Chunking({chunk_size}));
+ props.add(HighFive::Deflate(compression_level));
+ return props;
+ }();
+ return props;
+ }
+
+ void create_event_group() {
+ static const auto dim = DataSpace({0}, {DataSpace::UNLIMITED});
+ auto events = file.createGroup("event");
+ events.createDataSet<int>("nparticles", dim, hdf5_chunk());
+ events.createDataSet<int>("start", dim, hdf5_chunk());
+ events.createDataSet<int>("pid", dim, hdf5_chunk());
+ events.createDataSet<double>("weight", dim, hdf5_chunk());
+ events.createDataSet<double>("scale", dim, hdf5_chunk());
+ events.createDataSet<double>("fscale", dim, hdf5_chunk());
+ events.createDataSet<double>("rscale", dim, hdf5_chunk());
+ events.createDataSet<double>("aqed", dim, hdf5_chunk());
+ events.createDataSet<double>("aqcd", dim, hdf5_chunk());
+ events.createDataSet<double>("trials", dim, hdf5_chunk());
+ }
+
+ void resize_event_group(size_t new_size) {
+ auto events = file.getGroup("event");
+ events.getDataSet("nparticles").resize({new_size});
+ events.getDataSet("start").resize({new_size});
+ events.getDataSet("pid").resize({new_size});
+ events.getDataSet("weight").resize({new_size});
+ events.getDataSet("scale").resize({new_size});
+ events.getDataSet("fscale").resize({new_size});
+ events.getDataSet("rscale").resize({new_size});
+ events.getDataSet("aqed").resize({new_size});
+ events.getDataSet("aqcd").resize({new_size});
+ events.getDataSet("trials").resize({new_size});
+ }
+
+ void create_particle_group() {
+ static const auto dim = DataSpace({0}, {DataSpace::UNLIMITED});
+ auto particles = file.createGroup("particle");
+ particles.createDataSet<int>("id", dim, hdf5_chunk());
+ particles.createDataSet<int>("status", dim, hdf5_chunk());
+ particles.createDataSet<int>("mother1", dim, hdf5_chunk());
+ particles.createDataSet<int>("mother2", dim, hdf5_chunk());
+ particles.createDataSet<int>("color1", dim, hdf5_chunk());
+ particles.createDataSet<int>("color2", dim, hdf5_chunk());
+ particles.createDataSet<double>("px", dim, hdf5_chunk());
+ particles.createDataSet<double>("py", dim, hdf5_chunk());
+ particles.createDataSet<double>("pz", dim, hdf5_chunk());
+ particles.createDataSet<double>("e", dim, hdf5_chunk());
+ particles.createDataSet<double>("m", dim, hdf5_chunk());
+ particles.createDataSet<double>("lifetime", dim, hdf5_chunk());
+ particles.createDataSet<double>("spin", dim, hdf5_chunk());
+ }
+
+ void resize_particle_group(size_t new_size) {
+ auto particles = file.getGroup("particle");
+ particles.getDataSet("id").resize({new_size});
+ particles.getDataSet("status").resize({new_size});
+ particles.getDataSet("mother1").resize({new_size});
+ particles.getDataSet("mother2").resize({new_size});
+ particles.getDataSet("color1").resize({new_size});
+ particles.getDataSet("color2").resize({new_size});
+ particles.getDataSet("px").resize({new_size});
+ particles.getDataSet("py").resize({new_size});
+ particles.getDataSet("pz").resize({new_size});
+ particles.getDataSet("e").resize({new_size});
+ particles.getDataSet("m").resize({new_size});
+ particles.getDataSet("lifetime").resize({new_size});
+ particles.getDataSet("spin").resize({new_size});
+ }
+
+ void write(Event const & ev){
+ cache.fill(ev);
+ if(cache.is_full()) {
+ dump_cache();
+ }
+ const double wt = ev.central().weight;
+ const size_t idx = to_index(ev.type());
+ heprup.XSECUP[idx] += wt;
+ heprup.XERRUP[idx] += wt*wt;
+ if(wt > heprup.XMAXUP[idx]){
+ heprup.XMAXUP[idx] = wt;
+ }
+ }
+
+ void dump_cache() {
+ write_event_params();
+ write_event_particles();
+ cache.clear();
+ }
+
+ void write_event_params() {
+ auto events = file.getGroup("event");
+ // choose arbitrary dataset to find size
+ const auto dataset = events.getDataSet("nparticles");
+ const size_t size = dataset.getSpace().getDimensions().front();
+ resize_event_group(size + cache.nparticles.size());
+
+#define WRITE_FROM_CACHE(GROUP, PROPERTY) \
+ GROUP.getDataSet(#PROPERTY).select({size}, {cache.PROPERTY.size()}).write(cache.PROPERTY)
+
+ WRITE_FROM_CACHE(events, nparticles);
+ WRITE_FROM_CACHE(events, start);
+ WRITE_FROM_CACHE(events, pid);
+ WRITE_FROM_CACHE(events, weight);
+ WRITE_FROM_CACHE(events, scale);
+ WRITE_FROM_CACHE(events, fscale);
+ WRITE_FROM_CACHE(events, rscale);
+ WRITE_FROM_CACHE(events, aqed);
+ WRITE_FROM_CACHE(events, aqcd);
+ WRITE_FROM_CACHE(events, trials);
+ }
+
+ void write_event_particles() {
+ auto particles = file.getGroup("particle");
+ // choose arbitrary dataset to find size
+ const auto dataset = particles.getDataSet("id");
+ const size_t size = dataset.getSpace().getDimensions().front();
+ resize_particle_group(size + cache.id.size());
+ WRITE_FROM_CACHE(particles, id);
+ WRITE_FROM_CACHE(particles, status);
+ WRITE_FROM_CACHE(particles, lifetime);
+ WRITE_FROM_CACHE(particles, spin);
+ WRITE_FROM_CACHE(particles, mother1);
+ WRITE_FROM_CACHE(particles, mother2);
+ WRITE_FROM_CACHE(particles, color1);
+ WRITE_FROM_CACHE(particles, color2);
+ WRITE_FROM_CACHE(particles, px);
+ WRITE_FROM_CACHE(particles, py);
+ WRITE_FROM_CACHE(particles, pz);
+ WRITE_FROM_CACHE(particles, e);
+ WRITE_FROM_CACHE(particles, m);
+ }
+#undef WRITE_FROM_CACHE
+
+ ~HDF5WriterImpl(){
+ dump_cache();
+ auto proc_info = file.getGroup("procInfo");
+ write_dataset(proc_info, "xSection", heprup.XSECUP);
+ write_dataset(proc_info, "error", heprup.XERRUP);
+ write_dataset(proc_info, "unitWeight", heprup.XMAXUP);
+ }
+
+ };
+
+ HDF5Writer::HDF5Writer(std::string const & filename, LHEF::HEPRUP heprup):
+ impl_{
+ new HDF5Writer::HDF5WriterImpl{filename, std::move(heprup)},
+ HDF5Writer::HDF5WriterImplDeleter{}
+ }
+ {}
+
+ void HDF5Writer::write(Event const & ev){
+ impl_->write(ev);
+ }
+}
+
+#else // no HDF5 support
+
+namespace HEJ{
+
+ class HDF5Writer::HDF5WriterImpl{};
+
+ HDF5Writer::HDF5Writer(std::string const &, LHEF::HEPRUP){
+ throw std::invalid_argument{
+ "Failed to create HDF5 writer: "
+ "HEJ 2 was built without HDF5 support"
+ };
+ }
+
+ void HDF5Writer::write(Event const &){
+ assert(false);
+ }
+
+}
+
+#endif
+
+namespace HEJ {
+ void HDF5Writer::HDF5WriterImplDeleter::operator()(HDF5WriterImpl* p) {
+ delete p;
+ }
+}
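As a quick check of the resulting file layout, the per-event datasets
created above can be read back with HighFive. The group and dataset names
are the ones written in this file; the file name and the rest of the
snippet are illustrative only.

#include <iostream>
#include <vector>

#include "highfive/H5File.hpp"

int main(){
  HighFive::File file{"HEJ.hdf5", HighFive::File::ReadOnly};
  // per-event weights, as filled in write_event_params()
  std::vector<double> weights;
  file.getGroup("event").getDataSet("weight").read(weights);
  double sum = 0.;
  for(double w: weights) sum += w;
  std::cout << weights.size() << " events, summed weight " << sum << '\n';
  return 0;
}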
diff --git a/src/YAMLreader.cc b/src/YAMLreader.cc
index 720e528..943c4f0 100644
--- a/src/YAMLreader.cc
+++ b/src/YAMLreader.cc
@@ -1,553 +1,555 @@
/**
* \authors The HEJ collaboration (see AUTHORS for details)
* \date 2019
* \copyright GPLv2 or later
*/
#include "HEJ/YAMLreader.hh"
#include <algorithm>
#include <iostream>
#include <limits>
#include <map>
#include <string>
#include <unordered_map>
#include <vector>
#include <dlfcn.h>
#include "HEJ/ScaleFunction.hh"
#include "HEJ/event_types.hh"
#include "HEJ/output_formats.hh"
#include "HEJ/Constants.hh"
namespace HEJ{
class Event;
namespace{
//! Get YAML tree of supported options
/**
* The configuration file is checked against this tree of options
* in assert_all_options_known.
*/
YAML::Node const & get_supported_options(){
const static YAML::Node supported = [](){
YAML::Node supported;
static const auto opts = {
"trials", "min extparton pt", "max ext soft pt fraction",
"scales", "scale factors", "max scale ratio", "import scales",
"log correction", "event output", "analysis", "vev",
"regulator parameter", "max events"
};
// add subnodes to "supported" - the assigned value is irrelevant
for(auto && opt: opts) supported[opt] = "";
for(auto && jet_opt: {"min pt", "algorithm", "R"}){
supported["resummation jets"][jet_opt] = "";
supported["fixed order jets"][jet_opt] = "";
}
for(auto && opt: {"mt", "use impact factors", "include bottom", "mb"}){
supported["Higgs coupling"][opt] = "";
}
for(auto && opt: {"name", "seed"}){
supported["random generator"][opt] = "";
}
for(auto && opt: {"FKL", "unordered", "extremal qqx", "central qqx", "non-resummable"}){
supported["event treatment"][opt] = "";
}
for(auto && particle_type: {"Higgs", "W", "Z"}){
for(auto && particle_opt: {"mass", "width"}){
supported["particle properties"][particle_type][particle_opt] = "";
}
}
for(auto && opt: {"type", "trials", "max deviation"}){
supported["unweight"][opt] = "";
}
return supported;
}();
return supported;
}
fastjet::JetAlgorithm to_JetAlgorithm(std::string const & algo){
using namespace fastjet;
static const std::map<std::string, fastjet::JetAlgorithm> known = {
{"kt", kt_algorithm},
{"cambridge", cambridge_algorithm},
{"antikt", antikt_algorithm},
{"cambridge for passive", cambridge_for_passive_algorithm},
{"plugin", plugin_algorithm}
};
const auto res = known.find(algo);
if(res == known.end()){
throw std::invalid_argument("Unknown jet algorithm \"" + algo + "\"");
}
return res->second;
}
EventTreatment to_EventTreatment(std::string const & name){
static const std::map<std::string, EventTreatment> known = {
{"reweight", EventTreatment::reweight},
{"keep", EventTreatment::keep},
{"discard", EventTreatment::discard}
};
const auto res = known.find(name);
if(res == known.end()){
throw std::invalid_argument("Unknown event treatment \"" + name + "\"");
}
return res->second;
}
WeightType to_weight_type(std::string const & setting){
if(setting == "weighted")
return WeightType::weighted;
if(setting =="resummation")
return WeightType::unweighted_resum;
if(setting =="partial")
return WeightType::partially_unweighted;
throw std::invalid_argument{"Unknown weight type \"" + setting + "\""};
}
} // namespace anonymous
namespace detail{
void set_from_yaml(fastjet::JetAlgorithm & setting, YAML::Node const & yaml){
setting = to_JetAlgorithm(yaml.as<std::string>());
}
void set_from_yaml(EventTreatment & setting, YAML::Node const & yaml){
setting = to_EventTreatment(yaml.as<std::string>());
}
void set_from_yaml(ParticleID & setting, YAML::Node const & yaml){
setting = to_ParticleID(yaml.as<std::string>());
}
void set_from_yaml(WeightType & setting, YAML::Node const & yaml){
setting = to_weight_type(yaml.as<std::string>());
}
} // namespace detail
JetParameters get_jet_parameters(
YAML::Node const & node,
std::string const & entry
){
assert(node);
JetParameters result;
fastjet::JetAlgorithm jet_algo = fastjet::antikt_algorithm;
double R;
set_from_yaml_if_defined(jet_algo, node, entry, "algorithm");
set_from_yaml(R, node, entry, "R");
result.def = fastjet::JetDefinition{jet_algo, R};
set_from_yaml(result.min_pt, node, entry, "min pt");
return result;
}
RNGConfig to_RNGConfig(
YAML::Node const & node,
std::string const & entry
){
assert(node);
RNGConfig result;
set_from_yaml(result.name, node, entry, "name");
set_from_yaml_if_defined(result.seed, node, entry, "seed");
return result;
}
ParticleProperties get_particle_properties(
YAML::Node const & node, std::string const & entry,
std::string const & boson
){
ParticleProperties result;
set_from_yaml(result.mass, node, entry, boson, "mass");
set_from_yaml(result.width, node, entry, boson, "width");
return result;
}
EWConstants get_ew_parameters(YAML::Node const & node){
EWConstants result;
double vev;
set_from_yaml(vev, node, "vev");
result.set_vevWZH(vev,
get_particle_properties(node, "particle properties", "W"),
get_particle_properties(node, "particle properties", "Z"),
get_particle_properties(node, "particle properties", "Higgs")
);
return result;
}
HiggsCouplingSettings get_Higgs_coupling(
YAML::Node const & node,
std::string const & entry
){
assert(node);
static constexpr double mt_max = 2e4;
#ifndef HEJ_BUILD_WITH_QCDLOOP
if(node[entry]){
throw std::invalid_argument{
"Higgs coupling settings require building HEJ 2 "
"with QCDloop support"
};
}
#endif
HiggsCouplingSettings settings;
set_from_yaml_if_defined(settings.mt, node, entry, "mt");
set_from_yaml_if_defined(settings.mb, node, entry, "mb");
set_from_yaml_if_defined(settings.include_bottom, node, entry, "include bottom");
set_from_yaml_if_defined(settings.use_impact_factors, node, entry, "use impact factors");
if(settings.use_impact_factors){
if(settings.mt != std::numeric_limits<double>::infinity()){
throw std::invalid_argument{
"Conflicting settings: "
"impact factors may only be used in the infinite top mass limit"
};
}
}
else{
// huge values of the top mass are numerically unstable
settings.mt = std::min(settings.mt, mt_max);
}
return settings;
}
FileFormat to_FileFormat(std::string const & name){
static const std::map<std::string, FileFormat> known = {
{"Les Houches", FileFormat::Les_Houches},
{"HepMC", FileFormat::HepMC},
{"HepMC2", FileFormat::HepMC2},
- {"HepMC3", FileFormat::HepMC3}
+ {"HepMC3", FileFormat::HepMC3},
+ {"HDF5", FileFormat::HDF5}
};
const auto res = known.find(name);
if(res == known.end()){
throw std::invalid_argument("Unknown file format \"" + name + "\"");
}
return res->second;
}
std::string extract_suffix(std::string const & filename){
size_t separator = filename.rfind('.');
if(separator == filename.npos) return {};
return filename.substr(separator + 1);
}
FileFormat format_from_suffix(std::string const & filename){
const std::string suffix = extract_suffix(filename);
if(suffix == "lhe") return FileFormat::Les_Houches;
if(suffix == "hepmc") return FileFormat::HepMC;
if(suffix == "hepmc3") return FileFormat::HepMC3;
if(suffix == "hepmc2") return FileFormat::HepMC2;
+ if(suffix == "hdf5") return FileFormat::HDF5;
throw std::invalid_argument{
"Can't determine format for output file \"" + filename + "\""
};
}
void assert_all_options_known(
YAML::Node const & conf, YAML::Node const & supported
){
if(!conf.IsMap()) return;
if(!supported.IsMap()) throw invalid_type{"must not have sub-entries"};
for(auto const & entry: conf){
const auto name = entry.first.as<std::string>();
if(! supported[name]) throw unknown_option{name};
/* check sub-options, e.g. 'resummation jets: min pt'
* we don't check analysis sub-options
* those depend on the analysis being used and should be checked there
* similar for "import scales"
*/
if(name != "analysis" && name != "import scales"){
try{
assert_all_options_known(conf[name], supported[name]);
}
catch(unknown_option const & ex){
throw unknown_option{name + ": " + ex.what()};
}
catch(invalid_type const & ex){
throw invalid_type{name + ": " + ex.what()};
}
}
}
}
} // namespace HEJ
namespace YAML {
Node convert<HEJ::OutputFile>::encode(HEJ::OutputFile const & outfile) {
Node node;
node[to_string(outfile.format)] = outfile.name;
return node;
};
bool convert<HEJ::OutputFile>::decode(Node const & node, HEJ::OutputFile & out) {
switch(node.Type()){
case NodeType::Map: {
YAML::const_iterator it = node.begin();
out.format = HEJ::to_FileFormat(it->first.as<std::string>());
out.name = it->second.as<std::string>();
return true;
}
case NodeType::Scalar:
out.name = node.as<std::string>();
out.format = HEJ::format_from_suffix(out.name);
return true;
default:
return false;
}
}
} // namespace YAML
namespace HEJ{
namespace detail{
void set_from_yaml(OutputFile & setting, YAML::Node const & yaml){
setting = yaml.as<OutputFile>();
}
}
namespace{
void update_fixed_order_jet_parameters(
JetParameters & fixed_order_jets, YAML::Node const & yaml
){
if(!yaml["fixed order jets"]) return;
set_from_yaml_if_defined(
fixed_order_jets.min_pt, yaml, "fixed order jets", "min pt"
);
fastjet::JetAlgorithm algo = fixed_order_jets.def.jet_algorithm();
set_from_yaml_if_defined(algo, yaml, "fixed order jets", "algorithm");
double R = fixed_order_jets.def.R();
set_from_yaml_if_defined(R, yaml, "fixed order jets", "R");
fixed_order_jets.def = fastjet::JetDefinition{algo, R};
}
// like std::stod, but throws unless the whole string can be converted
double to_double(std::string const & str){
std::size_t pos;
const double result = std::stod(str, &pos);
if(pos < str.size()){
throw std::invalid_argument(str + " is not a valid double value");
}
return result;
}
using EventScale = double (*)(Event const &);
void import_scale_functions(
std::string const & file,
std::vector<std::string> const & scale_names,
std::unordered_map<std::string, EventScale> & known
) {
auto handle = dlopen(file.c_str(), RTLD_NOW);
char * error = dlerror();
if(error != nullptr) throw std::runtime_error{error};
for(auto const & scale: scale_names) {
void * sym = dlsym(handle, scale.c_str());
error = dlerror();
if(error != nullptr) throw std::runtime_error{error};
known.emplace(scale, reinterpret_cast<EventScale>(sym));
}
}
auto get_scale_map(
YAML::Node const & yaml
) {
std::unordered_map<std::string, EventScale> scale_map;
scale_map.emplace("H_T", H_T);
scale_map.emplace("max jet pperp", max_jet_pt);
scale_map.emplace("jet invariant mass", jet_invariant_mass);
scale_map.emplace("m_j1j2", m_j1j2);
if(yaml["import scales"]) {
if(! yaml["import scales"].IsMap()) {
throw invalid_type{"Entry 'import scales' is not a map"};
}
for(auto const & import: yaml["import scales"]) {
const auto file = import.first.as<std::string>();
const auto scale_names =
import.second.IsSequence()
?import.second.as<std::vector<std::string>>()
:std::vector<std::string>{import.second.as<std::string>()};
import_scale_functions(file, scale_names, scale_map);
}
}
return scale_map;
}
// simple (as in non-composite) scale functions
/**
* An example of a simple scale function would be H_T;
* H_T/2 is then composite (take H_T, then divide by 2)
*/
ScaleFunction parse_simple_ScaleFunction(
std::string const & scale_fun,
std::unordered_map<std::string, EventScale> const & known
) {
assert(
scale_fun.empty() ||
(!std::isspace(scale_fun.front()) && !std::isspace(scale_fun.back()))
);
const auto it = known.find(scale_fun);
if(it != end(known)) return {it->first, it->second};
try{
const double scale = to_double(scale_fun);
return {scale_fun, FixedScale{scale}};
} catch(std::invalid_argument const &){}
throw std::invalid_argument{"Unknown scale choice: \"" + scale_fun + "\""};
}
std::string trim_front(std::string const & str){
const auto new_begin = std::find_if(
begin(str), end(str), [](char c){ return ! std::isspace(c); }
);
return std::string(new_begin, end(str));
}
std::string trim_back(std::string str){
size_t pos = str.size() - 1;
// use guaranteed wrap-around behaviour to check whether we have
// traversed the whole string
for(; pos < str.size() && std::isspace(str[pos]); --pos) {}
str.resize(pos + 1); // note that pos + 1 can be 0
return str;
}
ScaleFunction parse_ScaleFunction(
std::string const & scale_fun,
std::unordered_map<std::string, EventScale> const & known
){
assert(
scale_fun.empty() ||
(!std::isspace(scale_fun.front()) && !std::isspace(scale_fun.back()))
);
// parse from right to left => a/b/c gives (a/b)/c
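// e.g. "2*H_T/4": the last '*' or '/' is the '/', so this becomes
// parse_ScaleFunction("2*H_T") / parse_ScaleFunction("4"),
// and "2*H_T" in turn splits into FixedScale{2} * H_T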
const size_t delim = scale_fun.find_last_of("*/");
if(delim == scale_fun.npos){
return parse_simple_ScaleFunction(scale_fun, known);
}
const std::string first = trim_back(std::string{scale_fun, 0, delim});
const std::string second = trim_front(std::string{scale_fun, delim+1});
if(scale_fun[delim] == '/'){
return parse_ScaleFunction(first, known)
/ parse_ScaleFunction(second, known);
}
else{
assert(scale_fun[delim] == '*');
return parse_ScaleFunction(first, known)
* parse_ScaleFunction(second, known);
}
}
EventTreatMap get_event_treatment(
YAML::Node const & node, std::string const & entry
){
using namespace event_type;
EventTreatMap treat {
{no_2_jets, EventTreatment::discard},
{bad_final_state, EventTreatment::discard},
{FKL, EventTreatment::discard},
{unob, EventTreatment::discard},
{unof, EventTreatment::discard},
{qqxexb, EventTreatment::discard},
{qqxexf, EventTreatment::discard},
{qqxmid, EventTreatment::discard},
{non_resummable, EventTreatment::discard}
};
set_from_yaml(treat.at(FKL), node, entry, "FKL");
set_from_yaml(treat.at(unob), node, entry, "unordered");
treat.at(unof) = treat.at(unob);
set_from_yaml(treat.at(qqxexb), node, entry, "extremal qqx");
treat.at(qqxexf) = treat.at(qqxexb);
set_from_yaml(treat.at(qqxmid), node, entry, "central qqx");
set_from_yaml(treat.at(non_resummable), node, entry, "non-resummable");
if(treat[non_resummable] == EventTreatment::reweight){
throw std::invalid_argument{"Cannot reweight Fixed Order events"};
}
return treat;
}
Config to_Config(YAML::Node const & yaml){
try{
assert_all_options_known(yaml, get_supported_options());
}
catch(unknown_option const & ex){
throw unknown_option{std::string{"Unknown option '"} + ex.what() + "'"};
}
Config config;
config.resummation_jets = get_jet_parameters(yaml, "resummation jets");
config.fixed_order_jets = config.resummation_jets;
update_fixed_order_jet_parameters(config.fixed_order_jets, yaml);
set_from_yaml_if_defined(config.min_extparton_pt, yaml, "min extparton pt");
if(config.min_extparton_pt!=0)
std::cerr << "WARNING: \"min extparton pt\" is deprecated."
<< " Please use \"max ext soft pt fraction\" instead.\n";
set_from_yaml(
config.max_ext_soft_pt_fraction, yaml, "max ext soft pt fraction"
);
// Set the default value, then override it if defined in the config
config.regulator_lambda=CLAMBDA;
set_from_yaml_if_defined(config.regulator_lambda, yaml, "regulator parameter");
set_from_yaml_if_defined(config.max_events, yaml, "max events");
set_from_yaml(config.trials, yaml, "trials");
config.weight_type = WeightType::weighted;
set_from_yaml_if_defined(config.weight_type, yaml, "unweight", "type");
if(config.weight_type == WeightType::partially_unweighted) {
config.unweight_config = PartialUnweightConfig{};
set_from_yaml(
config.unweight_config->trials, yaml,
"unweight", "trials"
);
set_from_yaml(
config.unweight_config->max_dev, yaml,
"unweight", "max deviation"
);
}
else if(yaml["unweight"]) {
for(auto && opt: {"trials", "max deviation"}) {
if(yaml["unweight"][opt]) {
throw std::invalid_argument{
"'unweight: " + std::string{opt} + "' "
"is only supported if 'unweight: type' is set to 'partial'"
};
}
}
}
set_from_yaml(config.log_correction, yaml, "log correction");
config.treat = get_event_treatment(yaml, "event treatment");
set_from_yaml_if_defined(config.output, yaml, "event output");
config.rng = to_RNGConfig(yaml, "random generator");
set_from_yaml_if_defined(config.analysis_parameters, yaml, "analysis");
config.scales = to_ScaleConfig(yaml);
config.ew_parameters = get_ew_parameters(yaml);
config.Higgs_coupling = get_Higgs_coupling(yaml, "Higgs coupling");
return config;
}
} // namespace anonymous
ScaleConfig to_ScaleConfig(YAML::Node const & yaml){
ScaleConfig config;
auto scale_funs = get_scale_map(yaml);
std::vector<std::string> scales;
set_from_yaml(scales, yaml, "scales");
config.base.reserve(scales.size());
std::transform(
begin(scales), end(scales), std::back_inserter(config.base),
[scale_funs](auto const & entry){
return parse_ScaleFunction(entry, scale_funs);
}
);
set_from_yaml_if_defined(config.factors, yaml, "scale factors");
config.max_ratio = std::numeric_limits<double>::infinity();
set_from_yaml_if_defined(config.max_ratio, yaml, "max scale ratio");
return config;
}
Config load_config(std::string const & config_file){
try{
return to_Config(YAML::LoadFile(config_file));
}
catch(...){
std::cerr << "Error reading " << config_file << ":\n ";
throw;
}
}
} // namespace HEJ
diff --git a/src/make_writer.cc b/src/make_writer.cc
index 5f87f01..10a71b0 100644
--- a/src/make_writer.cc
+++ b/src/make_writer.cc
@@ -1,36 +1,41 @@
/**
* \authors The HEJ collaboration (see AUTHORS for details)
* \date 2019
* \copyright GPLv2 or later
*/
#include "HEJ/make_writer.hh"
#include "HEJ/exceptions.hh"
#include "HEJ/HepMC2Writer.hh"
#include "HEJ/HepMC3Writer.hh"
+#include "HEJ/HDF5Writer.hh"
#include "HEJ/LesHouchesWriter.hh"
namespace HEJ{
std::unique_ptr<EventWriter> make_format_writer(
FileFormat format, std::string const & outfile,
LHEF::HEPRUP const & heprup
){
switch(format){
case FileFormat::Les_Houches:
return std::unique_ptr<EventWriter>{
new LesHouchesWriter{outfile, heprup}
};
case FileFormat::HepMC2:
return std::unique_ptr<EventWriter>{
new HepMC2Writer{outfile, heprup}
};
case FileFormat::HepMC3:
return std::unique_ptr<EventWriter>{
new HepMC3Writer{outfile, heprup}
};
+ case FileFormat::HDF5:
+ return std::unique_ptr<EventWriter>{
+ new HDF5Writer{outfile, heprup}
+ };
default:
throw std::logic_error("unhandled file format");
}
}
}
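A short usage sketch (not part of the patch) selecting the new HDF5 output
through the factory; the events and run information are assumed to be
provided by the caller.

#include <memory>
#include <vector>

#include "HEJ/Event.hh"
#include "HEJ/EventWriter.hh"
#include "HEJ/make_writer.hh"
#include "LHEF/LHEF.h"

// hypothetical helper: stream events to an HDF5 file via make_format_writer
void write_hdf5(
    std::vector<HEJ::Event> const & events, LHEF::HEPRUP const & heprup
){
  const std::unique_ptr<HEJ::EventWriter> writer = HEJ::make_format_writer(
      HEJ::FileFormat::HDF5, "HEJ_events.hdf5", heprup
  );
  for(auto const & ev: events) writer->write(ev);
}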
diff --git a/t/CMakeLists.txt b/t/CMakeLists.txt
index e704bef..15da670 100644
--- a/t/CMakeLists.txt
+++ b/t/CMakeLists.txt
@@ -1,289 +1,299 @@
set(tst_dir "${CMAKE_CURRENT_SOURCE_DIR}")
set(tst_ME_data_dir "${tst_dir}/ME_data")
# test event classification
add_executable(test_classify ${tst_dir}/test_classify.cc)
target_link_libraries(test_classify HEJ)
add_test(
NAME t_classify
COMMAND test_classify
)
add_executable(test_classify_ref ${tst_dir}/test_classify_ref.cc)
target_link_libraries(test_classify_ref HEJ)
add_test(
NAME t_classify_ref
COMMAND test_classify_ref ${tst_dir}/classify_ref ${tst_dir}/classify.lhe.gz
)
add_test(
NAME t_classify_ref_4j
COMMAND test_classify_ref ${tst_dir}/classify_ref_4j ${tst_dir}/4j.lhe.gz
)
add_test(
NAME t_classify_ref_W4j
COMMAND test_classify_ref ${tst_dir}/classify_ref_W4j ${tst_dir}/MGemnubar4j_unweighted.lhe.gz
)
# test for valid W decays
add_executable(test_decay ${tst_dir}/test_decay.cc)
target_link_libraries(test_decay HEJ)
add_test(
NAME t_valid_decay
COMMAND test_decay
)
# test phase space point
add_executable(test_psp ${tst_dir}/test_psp.cc)
target_link_libraries(test_psp HEJ)
add_test(
NAME t_psp
COMMAND test_psp ${tst_dir}/psp_gen.lhe.gz
)
# test importing scales
add_library(scales SHARED ${tst_dir}/scales.cc)
target_link_libraries(scales HEJ)
add_executable(test_scale_import ${tst_dir}/test_scale_import.cc)
target_link_libraries(test_scale_import HEJ)
add_test(
NAME t_scale_import
COMMAND test_scale_import ${tst_dir}/jet_config_with_import.yml
)
# test scale arithmetic (e.g. 2*H_T/4)
add_executable(test_scale_arithmetics ${tst_dir}/test_scale_arithmetics.cc)
target_link_libraries(test_scale_arithmetics HEJ)
add_test(
NAME t_scale_arithmetics
COMMAND test_scale_arithmetics ${tst_dir}/jet_config.yml ${tst_dir}/2j.lhe.gz
)
# test "ParameterDescription"
add_executable(test_descriptions ${tst_dir}/test_descriptions.cc)
target_link_libraries(test_descriptions HEJ)
add_test(
NAME t_descriptions
COMMAND test_descriptions
)
# test "EventParameters*Weight"
add_executable(test_parameters ${tst_dir}/test_parameters.cc)
target_link_libraries(test_parameters HEJ)
add_test(
NAME test_parameters
COMMAND test_parameters
)
# test unweighting
add_executable(test_unweighter ${tst_dir}/test_unweighter.cc)
target_link_libraries(test_unweighter HEJ)
add_test(
NAME test_unweighter
COMMAND test_unweighter ${tst_dir}/4j.lhe.gz
)
# test colour generation
add_executable(test_colours ${tst_dir}/test_colours.cc)
target_link_libraries(test_colours HEJ)
add_test(
NAME t_colour_flow
COMMAND test_colours
)
# test matrix elements
add_executable(test_ME_generic ${tst_dir}/test_ME_generic.cc)
target_link_libraries(test_ME_generic HEJ)
add_test(
NAME t_ME_j
COMMAND test_ME_generic ${tst_ME_data_dir}/config_mtinf.yml ${tst_ME_data_dir}/ME_jets_tree.dat ${tst_ME_data_dir}/PSP_jets.lhe.gz
)
add_test(
NAME t_ME_j_virt
COMMAND test_ME_generic ${tst_ME_data_dir}/config_mtinf.yml ${tst_ME_data_dir}/ME_jets_tree_virt.dat ${tst_ME_data_dir}/PSP_jets.lhe.gz
)
add_test(
NAME t_ME_h
COMMAND test_ME_generic ${tst_ME_data_dir}/config_mtinf.yml ${tst_ME_data_dir}/ME_h_mtinf_tree.dat ${tst_ME_data_dir}/PSP_h.lhe.gz
)
add_test(
NAME t_ME_h_virt
COMMAND test_ME_generic ${tst_ME_data_dir}/config_mtinf.yml ${tst_ME_data_dir}/ME_h_mtinf_virt.dat ${tst_ME_data_dir}/PSP_h.lhe.gz
)
if(${QCDloop_FOUND})
add_test(
NAME t_ME_h_mt
COMMAND test_ME_generic ${tst_ME_data_dir}/config_mt.yml ${tst_ME_data_dir}/ME_h_mt_tree.dat ${tst_ME_data_dir}/PSP_h.lhe.gz
)
add_test(
NAME t_ME_h_mtmb
COMMAND test_ME_generic ${tst_ME_data_dir}/config_mtmb.yml ${tst_ME_data_dir}/ME_h_mtmb_tree.dat ${tst_ME_data_dir}/PSP_h.lhe.gz
)
endif()
add_test(
NAME t_ME_w_FKL
COMMAND test_ME_generic ${tst_ME_data_dir}/config_w_ME.yml ${tst_ME_data_dir}/ME_w_FKL_tree.dat ${tst_ME_data_dir}/PSP_w_FKL.lhe.gz
)
add_test(
NAME t_ME_w_FKL_virt
COMMAND test_ME_generic ${tst_ME_data_dir}/config_w_ME.yml ${tst_ME_data_dir}/ME_w_FKL_virt.dat ${tst_ME_data_dir}/PSP_w_FKL.lhe.gz
)
add_test(
NAME t_ME_Wp
COMMAND test_ME_generic ${tst_ME_data_dir}/config_w_ME.yml ${tst_ME_data_dir}/ME_Wp.dat ${tst_ME_data_dir}/PSP_Wp.lhe.gz
)
add_test(
NAME t_ME_Wp_virt
COMMAND test_ME_generic ${tst_ME_data_dir}/config_w_ME.yml ${tst_ME_data_dir}/ME_Wp_virt.dat ${tst_ME_data_dir}/PSP_Wp.lhe.gz
)
add_test(
NAME t_ME_Wm
COMMAND test_ME_generic ${tst_ME_data_dir}/config_w_ME.yml ${tst_ME_data_dir}/ME_Wm.dat ${tst_ME_data_dir}/PSP_Wm.lhe.gz
)
add_test(
NAME t_ME_Wm_virt
COMMAND test_ME_generic ${tst_ME_data_dir}/config_w_ME.yml ${tst_ME_data_dir}/ME_Wm_virt.dat ${tst_ME_data_dir}/PSP_Wm.lhe.gz
)
# test main executable
file(COPY "${tst_dir}/jet_config.yml" DESTINATION "${CMAKE_BINARY_DIR}")
set(test_config "${CMAKE_BINARY_DIR}/jet_config.yml")
+if(${HighFive_FOUND})
+ file(READ ${test_config} config)
+ file(WRITE ${test_config} "${config} - tst.hdf5\n")
+endif()
if(${HepMC3_FOUND})
file(READ ${test_config} config)
file(WRITE ${test_config} "${config} - tst.hepmc\n")
endif()
if(${HepMC_FOUND})
file(READ ${test_config} config)
file(WRITE ${test_config} "${config} - tst.hepmc2\n")
if(${rivet_FOUND})
file(READ ${test_config} config)
file(WRITE ${test_config} "${config}\nanalysis:\n rivet: MC_XS\n output: tst\n")
endif()
endif()
set(test_cmd_main "$<TARGET_FILE:HEJ_main>\\\;${test_config}\\\;${tst_dir}/2j.lhe.gz")
# check that HepMC3 output is correct
if(${HepMC3_FOUND})
add_executable(check_hepmc ${tst_dir}/check_hepmc.cc)
target_link_libraries(check_hepmc HEJ ${HEPMC3_LIBRARIES})
target_include_directories(check_hepmc PRIVATE ${HEPMC3_INCLUDE_DIR})
set(test_cmd_hepmc "$<TARGET_FILE:check_hepmc>\\\;tst.hepmc")
else()
set(test_cmd_hepmc "")
endif()
# check that LHEF output is correct
add_executable(check_lhe ${tst_dir}/check_lhe.cc)
target_link_libraries(check_lhe HEJ)
set(test_cmd_lhe "$<TARGET_FILE:check_lhe>\\\;tst.lhe")
# Run dependent tests in one command to ensure correct execution order.
# Note: the commands are joined with "\;" so that CMake does not split the list;
# arguments within a single command therefore have to be escaped twice, as "\\\;".
# e.g. "cmd1\;cmd2\\\;arg1\\\;arg2" is executed like "cmd1 && cmd2 arg1 arg2"
add_test(
NAME t_main
COMMAND ${CMAKE_COMMAND}
-DCMDS=${test_cmd_main}\;${test_cmd_hepmc}\;${test_cmd_lhe}
-P ${PROJECT_SOURCE_DIR}/cmake/run_multiple_tests.cmake
)
-# check HDF5 reader
+# check HDF5 reader & writer
if(${HighFive_FOUND})
add_executable(test_hdf5 ${tst_dir}/test_hdf5.cc)
target_link_libraries(test_hdf5 HEJ)
add_test(
NAME t_hdf5
COMMAND test_hdf5 ${tst_dir}/Wm9-g4-repack.hdf5
)
+ add_executable(test_hdf5_write ${tst_dir}/test_hdf5_write.cc)
+ target_link_libraries(test_hdf5_write HEJ)
+ add_test(
+ NAME t_hdf5_write
+ COMMAND test_hdf5_write ${tst_dir}/Wm9-g4-repack.hdf5
+ )
endif()
# check rivet interface
if(${RIVET_FOUND})
add_executable(check_rivet ${tst_dir}/check_rivet.cc)
target_link_libraries(check_rivet HEJ rivet::rivet HepMC::HepMC)
add_test(
NAME t_rivet
COMMAND check_rivet
)
endif()
# test boson reconstruction
add_executable(cmp_events ${tst_dir}/cmp_events.cc)
target_link_libraries(cmp_events HEJ)
add_test(
NAME t_epnu_2j_noW
COMMAND cmp_events ${tst_dir}/epnu2jLOFKL_unweight.lhe.tar.gz ${tst_dir}/epnu2jLOFKL_unweight_noW.lhe.gz
)
# test resummed result
add_executable(check_res ${tst_dir}/check_res.cc)
target_link_libraries(check_res HEJ)
if(${TEST_ALL}) # deactivate long tests by default
add_test(
NAME t_2j
COMMAND check_res ${tst_dir}/2j.lhe.gz 3.49391e+07 419684
)
add_test(
NAME t_3j
COMMAND check_res ${tst_dir}/3j.lhe.gz 2.37902e+06 25746.6
)
add_test(
NAME t_3j_unof
COMMAND check_res ${tst_dir}/3j.lhe.gz 133399 4688.83 unof
)
add_test(
NAME t_3j_unob
COMMAND check_res ${tst_dir}/3j.lhe.gz 105247 3449.45 unob
)
add_test(
NAME t_4j
COMMAND check_res ${tst_dir}/4j.lhe.gz 603713 72822.6
)
add_test(
NAME t_h_3j
COMMAND check_res ${tst_dir}/h_3j.lhe.gz 0.821622 0.0220334
)
add_test(
NAME t_h_3j_unof
COMMAND check_res ${tst_dir}/h_3j_uno.lhe.gz 0.0127362 0.000271555 unof
)
add_test(
NAME t_h_3j_unob
COMMAND check_res ${tst_dir}/h_3j_uno.lhe.gz 0.0130615 0.000224793 unob
)
add_test(
NAME t_epnu_2j
COMMAND check_res ${tst_dir}/epnu2jLOFKL_unweight.lhe.tar.gz 262.7 3
)
add_test(
NAME t_MGepnu_3j
COMMAND check_res ${tst_dir}/MGepnu3j_unweighted.lhe.gz 38.9512 1
)
add_test(
NAME t_MGemnubar_3j
COMMAND check_res ${tst_dir}/MGemnubar3j_unweighted.lhe.gz 24.1575 1
)
add_test(
NAME t_MGepnu_3j_unof
COMMAND check_res ${tst_dir}/MGepnu3j_unweighted.lhe.gz 9.63702 0.128355 unof
)
add_test(
NAME t_MGepnu_3j_unob
COMMAND check_res ${tst_dir}/MGepnu3j_unweighted.lhe.gz 9.70119 0.108436 unob
)
add_test(
NAME t_MGepnu_3j_splitf
COMMAND check_res ${tst_dir}/MGepnu3j_unweighted.lhe.gz 2.91995 0.0463182 splitf
)
add_test(
NAME t_MGepnu_3j_splitb
COMMAND check_res ${tst_dir}/MGepnu3j_unweighted.lhe.gz 3.40708 0.0550975 splitb
)
add_test(
NAME t_MGepnu_4j
COMMAND check_res ${tst_dir}/MGepnu4j_unweighted.lhe.gz 10.2542 0.135106
)
add_test(
NAME t_MGemnubar_4j
COMMAND check_res ${tst_dir}/MGemnubar4j_unweighted.lhe.gz 5.57909 0.0300496
)
add_test(
NAME t_MGepnu_4j_qqxmid
COMMAND check_res ${tst_dir}/MGepnu4j_unweighted.lhe.gz 0.732084 0.005 qqxmid
)
endif()
diff --git a/t/test_hdf5_write.cc b/t/test_hdf5_write.cc
new file mode 100644
index 0000000..4eb04be
--- /dev/null
+++ b/t/test_hdf5_write.cc
@@ -0,0 +1,96 @@
+/**
+ * \authors The HEJ collaboration (see AUTHORS for details)
+ * \date 2019
+ * \copyright GPLv2 or later
+ */
+
+#include "HEJ/Event.hh"
+#include "HEJ/HDF5Reader.hh"
+#include "HEJ/make_writer.hh"
+#include "HEJ/utility.hh"
+
+#include <algorithm>
+#include <cstdio>
+#include <cstdlib>
+#include <iostream>
+#include <string>
+#include <vector>
+#include <unistd.h>
+
+// apparently HDF5 cannot handle the (safer) files under /proc/self/fd,
+// so we use tmpnam instead, with RAII to make sure the file gets deleted
+class Tempfile {
+public:
+ Tempfile():
+ file_{std::tmpnam(nullptr)}
+ {}
+
+ std::string const & name() const {
+ return file_;
+ }
+
+ ~Tempfile(){
+ unlink(file_.c_str());
+ }
+
+private:
+ std::string file_;
+};
+
+int main(int argc, char** argv) {
+ if(argc != 2) {
+ std::cerr << "Usage: " << argv[0] << " file.hdf5\n";
+ return EXIT_FAILURE;
+ }
+
+ Tempfile file;
+ std::vector<HEJ::Event> events;
+ size_t max_nevent = 15299;
+
+ // this scope is needed to trigger the HEJ::HDF5Writer destructor
+ // don't remove it
+ {
+ auto reader = HEJ::make_reader(argv[1]);
+
+ auto writer = HEJ::make_format_writer(
+ HEJ::FileFormat::HDF5, file.name(), reader->heprup()
+ );
+
+ size_t nevent = 0;
+ while(reader->read_event()) {
+ ++nevent;
+ const auto event = HEJ::Event::EventData{reader->hepeup()}.cluster(
+ fastjet::JetDefinition{fastjet::antikt_algorithm, 0.4}, 20.
+ );
+ events.emplace_back(event);
+ writer->write(event);
+ if(nevent>=max_nevent)
+ break;
+ }
+ max_nevent = std::min(nevent,max_nevent);
+ }
+
+ HEJ::HDF5Reader reader{file.name()};
+ size_t nevent = 0;
+ for(auto const & event: events) {
+ ++nevent;
+ reader.read_event();
+ const auto ev = HEJ::Event::EventData{reader.hepeup()}.cluster(
+ fastjet::JetDefinition{fastjet::antikt_algorithm, 0.4}, 20.
+ );
+ for(size_t i = 0; i < ev.incoming().size(); ++i) {
+ if(!HEJ::nearby(ev.incoming()[i].p, event.incoming()[i].p)) return EXIT_FAILURE;
+ }
+ if(ev.outgoing().size() != event.outgoing().size()) return EXIT_FAILURE;
+ for(size_t i = 0; i < ev.outgoing().size(); ++i) {
+ if(!HEJ::nearby(ev.outgoing()[i].p, event.outgoing()[i].p)) return EXIT_FAILURE;
+ }
+ if(ev.decays().size() != event.decays().size()) return EXIT_FAILURE;
+ if(ev.type() != event.type()) return EXIT_FAILURE;
+ if(ev.central().weight != event.central().weight) return EXIT_FAILURE;
+ }
+ if(nevent!=max_nevent)
+ return EXIT_FAILURE;
+
+ return EXIT_SUCCESS;
+}
